Command that produces this log: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 ---------------------------------------------------------------------------------------------------- > trainable params: >>> xlmr.embeddings.word_embeddings.weight: torch.Size([250002, 1024]) >>> xlmr.embeddings.position_embeddings.weight: torch.Size([514, 1024]) >>> xlmr.embeddings.token_type_embeddings.weight: torch.Size([1, 1024]) >>> xlmr.embeddings.LayerNorm.weight: torch.Size([1024]) >>> xlmr.embeddings.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.0.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.0.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.0.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.0.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.0.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.0.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.0.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.0.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.1.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.1.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.1.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.1.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.1.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.1.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.1.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.1.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.2.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.2.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.2.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.2.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.2.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.2.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.2.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.2.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.3.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.3.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.3.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.3.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.3.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.3.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.3.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.3.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.4.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.4.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.4.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.4.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.4.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.4.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.4.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.4.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.5.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.5.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.5.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.5.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.5.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.5.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.5.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.5.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.6.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.6.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.6.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.6.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.6.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.6.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.6.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.6.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.7.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.7.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.7.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.7.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.7.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.7.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.7.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.7.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.8.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.8.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.8.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.8.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.8.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.8.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.8.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.8.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.9.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.9.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.9.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.9.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.9.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.9.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.9.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.9.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.10.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.10.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.10.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.10.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.10.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.10.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.10.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.10.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.11.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.11.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.11.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.11.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.11.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.11.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.11.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.11.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.12.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.12.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.12.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.12.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.12.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.12.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.12.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.12.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.13.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.13.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.13.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.13.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.13.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.13.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.13.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.13.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.14.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.14.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.14.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.14.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.14.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.14.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.14.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.14.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.15.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.15.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.15.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.15.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.15.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.15.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.15.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.15.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.16.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.16.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.16.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.16.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.16.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.16.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.16.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.16.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.17.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.17.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.17.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.17.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.17.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.17.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.17.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.17.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.18.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.18.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.18.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.18.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.18.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.18.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.18.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.18.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.19.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.19.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.19.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.19.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.19.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.19.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.19.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.19.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.20.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.20.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.20.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.20.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.20.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.20.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.20.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.20.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.21.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.21.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.21.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.21.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.21.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.21.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.21.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.21.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.22.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.22.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.22.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.22.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.22.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.22.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.22.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.22.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.23.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.23.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.23.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.23.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.23.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.23.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.23.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.23.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.pooler.dense.weight: torch.Size([1024, 1024]) >>> xlmr.pooler.dense.bias: torch.Size([1024]) >>> type_embedding.weight: torch.Size([123, 100]) >>> trans_rep.weight: torch.Size([1024, 1124]) >>> trans_rep.bias: torch.Size([1024]) >>> coref_type_ffn.weight: torch.Size([3, 4096]) >>> coref_type_ffn.bias: torch.Size([3]) n_trainable_params: 561067023, n_nontrainable_params: 0 ---------------------------------------------------------------------------------------------------- ****************************** Epoch: 0 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 04:56:32.639392: step: 4/530, loss: 0.060033295303583145 2023-01-24 04:56:33.666270: step: 8/530, loss: 0.04589977115392685 2023-01-24 04:56:34.705078: step: 12/530, loss: 0.06528154015541077 2023-01-24 04:56:35.740480: step: 16/530, loss: 0.016343357041478157 2023-01-24 04:56:36.777047: step: 20/530, loss: 0.013062904588878155 2023-01-24 04:56:37.808386: step: 24/530, loss: 0.03764989227056503 2023-01-24 04:56:38.853241: step: 28/530, loss: 0.02163952775299549 2023-01-24 04:56:39.916650: step: 32/530, loss: 0.02140868827700615 2023-01-24 04:56:40.959691: step: 36/530, loss: 0.07444584369659424 2023-01-24 04:56:41.982682: step: 40/530, loss: 0.020764824002981186 2023-01-24 04:56:43.025944: step: 44/530, loss: 0.01761607453227043 2023-01-24 04:56:44.061031: step: 48/530, loss: 0.015811558812856674 2023-01-24 04:56:45.112524: step: 52/530, loss: 0.058635350316762924 2023-01-24 04:56:46.157556: step: 56/530, loss: 0.054577723145484924 2023-01-24 04:56:47.226387: step: 60/530, loss: 0.014780597761273384 2023-01-24 04:56:48.265715: step: 64/530, loss: 0.05506347492337227 2023-01-24 04:56:49.300679: step: 68/530, loss: 0.014647278934717178 2023-01-24 04:56:50.325387: step: 72/530, loss: 0.0471046157181263 2023-01-24 04:56:51.363587: step: 76/530, loss: 0.08761477470397949 2023-01-24 04:56:52.418534: step: 80/530, loss: 0.012713438831269741 2023-01-24 04:56:53.463089: step: 84/530, loss: 0.01254933699965477 2023-01-24 04:56:54.519334: step: 88/530, loss: 0.07934611290693283 2023-01-24 04:56:55.551834: step: 92/530, loss: 0.01443867851048708 2023-01-24 04:56:56.593639: step: 96/530, loss: 0.013973497785627842 2023-01-24 04:56:57.641023: step: 100/530, loss: 0.026187509298324585 2023-01-24 04:56:58.679688: step: 104/530, loss: 0.04219330847263336 2023-01-24 04:56:59.722629: step: 108/530, loss: 0.05404404550790787 2023-01-24 04:57:00.756890: step: 112/530, loss: 0.05650760233402252 2023-01-24 04:57:01.806535: step: 116/530, loss: 0.05717125162482262 2023-01-24 04:57:02.850685: step: 120/530, loss: 0.00882972776889801 2023-01-24 04:57:03.903699: step: 124/530, loss: 0.04490215703845024 2023-01-24 04:57:04.942051: step: 128/530, loss: 0.04658155515789986 2023-01-24 04:57:05.999710: step: 132/530, loss: 0.012538946233689785 2023-01-24 04:57:07.038188: step: 136/530, loss: 0.011128903366625309 2023-01-24 04:57:08.087301: step: 140/530, loss: 0.014826716855168343 2023-01-24 04:57:09.145286: step: 144/530, loss: 0.009929697029292583 2023-01-24 04:57:10.201171: step: 148/530, loss: 0.0678681805729866 2023-01-24 04:57:11.253835: step: 152/530, loss: 0.057826437056064606 2023-01-24 04:57:12.284022: step: 156/530, loss: 0.02970445156097412 2023-01-24 04:57:13.340579: step: 160/530, loss: 0.042627204209566116 2023-01-24 04:57:14.381778: step: 164/530, loss: 0.022546298801898956 2023-01-24 04:57:15.430391: step: 168/530, loss: 0.026655809953808784 2023-01-24 04:57:16.464071: step: 172/530, loss: 0.02497207559645176 2023-01-24 04:57:17.506451: step: 176/530, loss: 0.027215199545025826 2023-01-24 04:57:18.562728: step: 180/530, loss: 0.05222507193684578 2023-01-24 04:57:19.593815: step: 184/530, loss: 0.014712275005877018 2023-01-24 04:57:20.640284: step: 188/530, loss: 0.013996199704706669 2023-01-24 04:57:21.711920: step: 192/530, loss: 0.009635187685489655 2023-01-24 04:57:22.766391: step: 196/530, loss: 0.007943525910377502 2023-01-24 04:57:23.804718: step: 200/530, loss: 0.012248823419213295 2023-01-24 04:57:24.843912: step: 204/530, loss: 0.01388395857065916 2023-01-24 04:57:25.892255: step: 208/530, loss: 0.013846492394804955 2023-01-24 04:57:26.941382: step: 212/530, loss: 0.013890700414776802 2023-01-24 04:57:27.978536: step: 216/530, loss: 0.07550472766160965 2023-01-24 04:57:29.026659: step: 220/530, loss: 0.08688770234584808 2023-01-24 04:57:30.079104: step: 224/530, loss: 0.023570828139781952 2023-01-24 04:57:31.133785: step: 228/530, loss: 0.04166729003190994 2023-01-24 04:57:32.187302: step: 232/530, loss: 0.007473578676581383 2023-01-24 04:57:33.247455: step: 236/530, loss: 0.022276155650615692 2023-01-24 04:57:34.284935: step: 240/530, loss: 0.011229636147618294 2023-01-24 04:57:35.330254: step: 244/530, loss: 0.010996056720614433 2023-01-24 04:57:36.389809: step: 248/530, loss: 0.020953651517629623 2023-01-24 04:57:37.455286: step: 252/530, loss: 0.014445587992668152 2023-01-24 04:57:38.501815: step: 256/530, loss: 0.041544608771800995 2023-01-24 04:57:39.546244: step: 260/530, loss: 0.0196048766374588 2023-01-24 04:57:40.589870: step: 264/530, loss: 0.01599714159965515 2023-01-24 04:57:41.635061: step: 268/530, loss: 0.07050645351409912 2023-01-24 04:57:42.676633: step: 272/530, loss: 0.0421467162668705 2023-01-24 04:57:43.728192: step: 276/530, loss: 0.010393726639449596 2023-01-24 04:57:44.769108: step: 280/530, loss: 0.06304173171520233 2023-01-24 04:57:45.823144: step: 284/530, loss: 0.01447010226547718 2023-01-24 04:57:46.884614: step: 288/530, loss: 0.025486130267381668 2023-01-24 04:57:47.947894: step: 292/530, loss: 0.05997813493013382 2023-01-24 04:57:48.986599: step: 296/530, loss: 0.022653279826045036 2023-01-24 04:57:50.028576: step: 300/530, loss: 0.04908964782953262 2023-01-24 04:57:51.086784: step: 304/530, loss: 0.01200844720005989 2023-01-24 04:57:52.150747: step: 308/530, loss: 0.0060731531120836735 2023-01-24 04:57:53.192177: step: 312/530, loss: 0.044333744794130325 2023-01-24 04:57:54.232451: step: 316/530, loss: 0.038436442613601685 2023-01-24 04:57:55.268931: step: 320/530, loss: 0.0136526795104146 2023-01-24 04:57:56.320564: step: 324/530, loss: 0.020266354084014893 2023-01-24 04:57:57.377588: step: 328/530, loss: 0.012559860944747925 2023-01-24 04:57:58.433539: step: 332/530, loss: 0.01112893782556057 2023-01-24 04:57:59.481544: step: 336/530, loss: 0.013241477310657501 2023-01-24 04:58:00.535413: step: 340/530, loss: 0.010125523433089256 2023-01-24 04:58:01.578933: step: 344/530, loss: 0.01344500482082367 2023-01-24 04:58:02.623647: step: 348/530, loss: 0.014855092391371727 2023-01-24 04:58:03.666059: step: 352/530, loss: 0.042773760855197906 2023-01-24 04:58:04.719689: step: 356/530, loss: 0.05051124840974808 2023-01-24 04:58:05.779964: step: 360/530, loss: 0.040631815791130066 2023-01-24 04:58:06.828835: step: 364/530, loss: 0.06396598368883133 2023-01-24 04:58:07.913752: step: 368/530, loss: 0.051768772304058075 2023-01-24 04:58:08.956049: step: 372/530, loss: 0.031925443559885025 2023-01-24 04:58:10.014061: step: 376/530, loss: 0.014670888893306255 2023-01-24 04:58:11.059417: step: 380/530, loss: 0.04033554345369339 2023-01-24 04:58:12.102688: step: 384/530, loss: 0.02209855057299137 2023-01-24 04:58:13.132767: step: 388/530, loss: 0.01255041267722845 2023-01-24 04:58:14.175044: step: 392/530, loss: 0.012206725776195526 2023-01-24 04:58:15.209644: step: 396/530, loss: 0.0161734726279974 2023-01-24 04:58:16.249106: step: 400/530, loss: 0.026487227529287338 2023-01-24 04:58:17.292296: step: 404/530, loss: 0.014444894157350063 2023-01-24 04:58:18.333682: step: 408/530, loss: 0.010333058424293995 2023-01-24 04:58:19.387918: step: 412/530, loss: 0.006082017906010151 2023-01-24 04:58:20.426035: step: 416/530, loss: 0.01638266071677208 2023-01-24 04:58:21.480652: step: 420/530, loss: 0.04391314834356308 2023-01-24 04:58:22.530112: step: 424/530, loss: 0.016791932284832 2023-01-24 04:58:23.572808: step: 428/530, loss: 0.013436893001198769 2023-01-24 04:58:24.653647: step: 432/530, loss: 0.02358480915427208 2023-01-24 04:58:25.691702: step: 436/530, loss: 0.009498543106019497 2023-01-24 04:58:26.750111: step: 440/530, loss: 0.009855261072516441 2023-01-24 04:58:27.792089: step: 444/530, loss: 0.017667284235358238 2023-01-24 04:58:28.840610: step: 448/530, loss: 0.04631337895989418 2023-01-24 04:58:29.889142: step: 452/530, loss: 0.014315621927380562 2023-01-24 04:58:30.932167: step: 456/530, loss: 0.01812603510916233 2023-01-24 04:58:31.993955: step: 460/530, loss: 0.04465753212571144 2023-01-24 04:58:33.052198: step: 464/530, loss: 0.03727440908551216 2023-01-24 04:58:34.101632: step: 468/530, loss: 0.012952454388141632 2023-01-24 04:58:35.156504: step: 472/530, loss: 0.046937499195337296 2023-01-24 04:58:36.211306: step: 476/530, loss: 0.05256005376577377 2023-01-24 04:58:37.258960: step: 480/530, loss: 0.01981108821928501 2023-01-24 04:58:38.297527: step: 484/530, loss: 0.011906221508979797 2023-01-24 04:58:39.334794: step: 488/530, loss: 0.020235009491443634 2023-01-24 04:58:40.364652: step: 492/530, loss: 0.0391661562025547 2023-01-24 04:58:41.425064: step: 496/530, loss: 0.01849944330751896 2023-01-24 04:58:42.476209: step: 500/530, loss: 0.036094486713409424 2023-01-24 04:58:43.511654: step: 504/530, loss: 0.04758574813604355 2023-01-24 04:58:44.571059: step: 508/530, loss: 0.008935992605984211 2023-01-24 04:58:45.606829: step: 512/530, loss: 0.010376857593655586 2023-01-24 04:58:46.661390: step: 516/530, loss: 0.0186650101095438 2023-01-24 04:58:47.709800: step: 520/530, loss: 0.04050913825631142 2023-01-24 04:58:48.755670: step: 524/530, loss: 0.013347795233130455 2023-01-24 04:58:49.803434: step: 528/530, loss: 0.0032928106375038624 2023-01-24 04:58:50.849364: step: 532/530, loss: 0.03926122188568115 2023-01-24 04:58:51.890116: step: 536/530, loss: 0.016761235892772675 2023-01-24 04:58:52.946821: step: 540/530, loss: 0.01184121798723936 2023-01-24 04:58:54.004873: step: 544/530, loss: 0.007499242201447487 2023-01-24 04:58:55.053044: step: 548/530, loss: 0.03016289323568344 2023-01-24 04:58:56.097005: step: 552/530, loss: 0.0 2023-01-24 04:58:57.152027: step: 556/530, loss: 0.06591839343309402 2023-01-24 04:58:58.187010: step: 560/530, loss: 0.016564559191465378 2023-01-24 04:58:59.232540: step: 564/530, loss: 0.040470533072948456 2023-01-24 04:59:00.276278: step: 568/530, loss: 0.013416310772299767 2023-01-24 04:59:01.328568: step: 572/530, loss: 0.013418116606771946 2023-01-24 04:59:02.376282: step: 576/530, loss: 0.026211488991975784 2023-01-24 04:59:03.420454: step: 580/530, loss: 0.010530592873692513 2023-01-24 04:59:04.454227: step: 584/530, loss: 0.006916653364896774 2023-01-24 04:59:05.503927: step: 588/530, loss: 0.023131463676691055 2023-01-24 04:59:06.542458: step: 592/530, loss: 0.008311344310641289 2023-01-24 04:59:07.598964: step: 596/530, loss: 0.010789063759148121 2023-01-24 04:59:08.628404: step: 600/530, loss: 0.013362892903387547 2023-01-24 04:59:09.668581: step: 604/530, loss: 0.0071099018678069115 2023-01-24 04:59:10.710239: step: 608/530, loss: 0.043009303510189056 2023-01-24 04:59:11.767217: step: 612/530, loss: 0.014970828779041767 2023-01-24 04:59:12.812325: step: 616/530, loss: 0.025337407365441322 2023-01-24 04:59:13.852171: step: 620/530, loss: 0.03408828750252724 2023-01-24 04:59:14.903483: step: 624/530, loss: 0.052135542035102844 2023-01-24 04:59:15.956098: step: 628/530, loss: 0.013007240369915962 2023-01-24 04:59:16.996027: step: 632/530, loss: 0.004831044934689999 2023-01-24 04:59:18.049195: step: 636/530, loss: 0.021757418289780617 2023-01-24 04:59:19.100766: step: 640/530, loss: 0.019257046282291412 2023-01-24 04:59:20.138141: step: 644/530, loss: 0.05620265007019043 2023-01-24 04:59:21.190570: step: 648/530, loss: 0.018570058047771454 2023-01-24 04:59:22.258031: step: 652/530, loss: 0.014045841060578823 2023-01-24 04:59:23.317247: step: 656/530, loss: 0.015940770506858826 2023-01-24 04:59:24.381783: step: 660/530, loss: 0.04787875711917877 2023-01-24 04:59:25.426340: step: 664/530, loss: 0.014105679467320442 2023-01-24 04:59:26.470029: step: 668/530, loss: 0.005747381132096052 2023-01-24 04:59:27.518913: step: 672/530, loss: 0.030748708173632622 2023-01-24 04:59:28.585619: step: 676/530, loss: 0.013762318529188633 2023-01-24 04:59:29.635444: step: 680/530, loss: 0.005123665556311607 2023-01-24 04:59:30.712258: step: 684/530, loss: 0.008086733520030975 2023-01-24 04:59:31.762726: step: 688/530, loss: 0.07292577624320984 2023-01-24 04:59:32.826339: step: 692/530, loss: 0.014001429080963135 2023-01-24 04:59:33.886925: step: 696/530, loss: 0.02192588895559311 2023-01-24 04:59:34.940474: step: 700/530, loss: 0.007155390921980143 2023-01-24 04:59:35.985251: step: 704/530, loss: 0.013085514307022095 2023-01-24 04:59:37.045496: step: 708/530, loss: 0.06873773038387299 2023-01-24 04:59:38.086032: step: 712/530, loss: 0.008516249246895313 2023-01-24 04:59:39.140724: step: 716/530, loss: 0.010924703441560268 2023-01-24 04:59:40.190161: step: 720/530, loss: 0.012691010721027851 2023-01-24 04:59:41.247256: step: 724/530, loss: 0.01605951227247715 2023-01-24 04:59:42.274686: step: 728/530, loss: 0.03922870010137558 2023-01-24 04:59:43.302609: step: 732/530, loss: 0.012207195162773132 2023-01-24 04:59:44.362890: step: 736/530, loss: 0.00918819010257721 2023-01-24 04:59:45.417285: step: 740/530, loss: 0.02580217644572258 2023-01-24 04:59:46.486909: step: 744/530, loss: 0.04725988581776619 2023-01-24 04:59:47.536849: step: 748/530, loss: 0.012820283882319927 2023-01-24 04:59:48.598049: step: 752/530, loss: 0.015654999762773514 2023-01-24 04:59:49.626377: step: 756/530, loss: 0.040799036622047424 2023-01-24 04:59:50.686005: step: 760/530, loss: 0.01090190839022398 2023-01-24 04:59:51.721692: step: 764/530, loss: 0.0206447821110487 2023-01-24 04:59:52.746052: step: 768/530, loss: 0.014084467664361 2023-01-24 04:59:53.783230: step: 772/530, loss: 0.01422564685344696 2023-01-24 04:59:54.814251: step: 776/530, loss: 0.021638158708810806 2023-01-24 04:59:55.883875: step: 780/530, loss: 0.013486064970493317 2023-01-24 04:59:56.951404: step: 784/530, loss: 0.012211788445711136 2023-01-24 04:59:57.989636: step: 788/530, loss: 0.008560619316995144 2023-01-24 04:59:59.045028: step: 792/530, loss: 0.010791781358420849 2023-01-24 05:00:00.098265: step: 796/530, loss: 0.003482502419501543 2023-01-24 05:00:01.161606: step: 800/530, loss: 0.028693271800875664 2023-01-24 05:00:02.211398: step: 804/530, loss: 0.016671275720000267 2023-01-24 05:00:03.252965: step: 808/530, loss: 0.012025181204080582 2023-01-24 05:00:04.299500: step: 812/530, loss: 0.00638112286105752 2023-01-24 05:00:05.336164: step: 816/530, loss: 0.025325119495391846 2023-01-24 05:00:06.382226: step: 820/530, loss: 0.011688685044646263 2023-01-24 05:00:07.454457: step: 824/530, loss: 0.017244286835193634 2023-01-24 05:00:08.497678: step: 828/530, loss: 0.02886471524834633 2023-01-24 05:00:09.549049: step: 832/530, loss: 0.008827954530715942 2023-01-24 05:00:10.601240: step: 836/530, loss: 0.009243848733603954 2023-01-24 05:00:11.660016: step: 840/530, loss: 0.0671924352645874 2023-01-24 05:00:12.711106: step: 844/530, loss: 0.008323246613144875 2023-01-24 05:00:13.756574: step: 848/530, loss: 0.02299247868359089 2023-01-24 05:00:14.801582: step: 852/530, loss: 0.007278129458427429 2023-01-24 05:00:15.865116: step: 856/530, loss: 0.013758787885308266 2023-01-24 05:00:16.909333: step: 860/530, loss: 0.0163110364228487 2023-01-24 05:00:17.976538: step: 864/530, loss: 0.020543154329061508 2023-01-24 05:00:19.016752: step: 868/530, loss: 0.0087375333532691 2023-01-24 05:00:20.067097: step: 872/530, loss: 0.01985197700560093 2023-01-24 05:00:21.098720: step: 876/530, loss: 0.009418798610568047 2023-01-24 05:00:22.134133: step: 880/530, loss: 0.021291011944413185 2023-01-24 05:00:23.171211: step: 884/530, loss: 0.004904871340841055 2023-01-24 05:00:24.225680: step: 888/530, loss: 0.006361250765621662 2023-01-24 05:00:25.287434: step: 892/530, loss: 0.01926605775952339 2023-01-24 05:00:26.335867: step: 896/530, loss: 0.008989362977445126 2023-01-24 05:00:27.376592: step: 900/530, loss: 0.008587433025240898 2023-01-24 05:00:28.424287: step: 904/530, loss: 0.013574305921792984 2023-01-24 05:00:29.468703: step: 908/530, loss: 0.014101570472121239 2023-01-24 05:00:30.521474: step: 912/530, loss: 0.02384394034743309 2023-01-24 05:00:31.556776: step: 916/530, loss: 0.013385653495788574 2023-01-24 05:00:32.617432: step: 920/530, loss: 0.009057825431227684 2023-01-24 05:00:33.688819: step: 924/530, loss: 0.006020522676408291 2023-01-24 05:00:34.736322: step: 928/530, loss: 0.02508201263844967 2023-01-24 05:00:35.782676: step: 932/530, loss: 0.01509543415158987 2023-01-24 05:00:36.838459: step: 936/530, loss: 0.045393481850624084 2023-01-24 05:00:37.890129: step: 940/530, loss: 0.010363052599132061 2023-01-24 05:00:38.926591: step: 944/530, loss: 0.00701740849763155 2023-01-24 05:00:39.977901: step: 948/530, loss: 0.005701584275811911 2023-01-24 05:00:41.028919: step: 952/530, loss: 0.010725860483944416 2023-01-24 05:00:42.062166: step: 956/530, loss: 0.030126554891467094 2023-01-24 05:00:43.110050: step: 960/530, loss: 0.06617061048746109 2023-01-24 05:00:44.160692: step: 964/530, loss: 0.01154240407049656 2023-01-24 05:00:45.214322: step: 968/530, loss: 0.034873731434345245 2023-01-24 05:00:46.255211: step: 972/530, loss: 0.07368557900190353 2023-01-24 05:00:47.302988: step: 976/530, loss: 0.05102427303791046 2023-01-24 05:00:48.340456: step: 980/530, loss: 0.011907286942005157 2023-01-24 05:00:49.395096: step: 984/530, loss: 0.020721912384033203 2023-01-24 05:00:50.433689: step: 988/530, loss: 0.01759176142513752 2023-01-24 05:00:51.476292: step: 992/530, loss: 0.0093492167070508 2023-01-24 05:00:52.534690: step: 996/530, loss: 0.008550026454031467 2023-01-24 05:00:53.599453: step: 1000/530, loss: 0.009914956986904144 2023-01-24 05:00:54.652245: step: 1004/530, loss: 0.008670113980770111 2023-01-24 05:00:55.719258: step: 1008/530, loss: 0.012163816951215267 2023-01-24 05:00:56.756861: step: 1012/530, loss: 0.03422226756811142 2023-01-24 05:00:57.809300: step: 1016/530, loss: 0.037570856511592865 2023-01-24 05:00:58.869631: step: 1020/530, loss: 0.013528211042284966 2023-01-24 05:00:59.910146: step: 1024/530, loss: 0.022508734837174416 2023-01-24 05:01:00.978596: step: 1028/530, loss: 0.009371710941195488 2023-01-24 05:01:02.038111: step: 1032/530, loss: 0.007615245878696442 2023-01-24 05:01:03.089709: step: 1036/530, loss: 0.011166317388415337 2023-01-24 05:01:04.124747: step: 1040/530, loss: 0.006640819367021322 2023-01-24 05:01:05.179748: step: 1044/530, loss: 0.02560454048216343 2023-01-24 05:01:06.259479: step: 1048/530, loss: 0.010287744924426079 2023-01-24 05:01:07.294631: step: 1052/530, loss: 0.005687665194272995 2023-01-24 05:01:08.342226: step: 1056/530, loss: 0.013990354724228382 2023-01-24 05:01:09.400135: step: 1060/530, loss: 0.014633985236287117 2023-01-24 05:01:10.445389: step: 1064/530, loss: 0.013105589896440506 2023-01-24 05:01:11.517353: step: 1068/530, loss: 0.005768314935266972 2023-01-24 05:01:12.570958: step: 1072/530, loss: 0.00640522688627243 2023-01-24 05:01:13.622101: step: 1076/530, loss: 0.005625725723803043 2023-01-24 05:01:14.669674: step: 1080/530, loss: 0.018396489322185516 2023-01-24 05:01:15.722733: step: 1084/530, loss: 0.015970518812537193 2023-01-24 05:01:16.770500: step: 1088/530, loss: 0.011452708393335342 2023-01-24 05:01:17.803266: step: 1092/530, loss: 0.006960126105695963 2023-01-24 05:01:18.845586: step: 1096/530, loss: 0.012958606705069542 2023-01-24 05:01:19.908974: step: 1100/530, loss: 0.03585435077548027 2023-01-24 05:01:20.975876: step: 1104/530, loss: 0.006065783556550741 2023-01-24 05:01:22.013429: step: 1108/530, loss: 0.01325303129851818 2023-01-24 05:01:23.067017: step: 1112/530, loss: 0.014481334015727043 2023-01-24 05:01:24.103411: step: 1116/530, loss: 0.028966834768652916 2023-01-24 05:01:25.149748: step: 1120/530, loss: 0.015271610580384731 2023-01-24 05:01:26.195606: step: 1124/530, loss: 0.020904196426272392 2023-01-24 05:01:27.241986: step: 1128/530, loss: 0.01870165951550007 2023-01-24 05:01:28.288706: step: 1132/530, loss: 0.009080823510885239 2023-01-24 05:01:29.343770: step: 1136/530, loss: 0.009103497490286827 2023-01-24 05:01:30.387242: step: 1140/530, loss: 0.0073168398812413216 2023-01-24 05:01:31.441711: step: 1144/530, loss: 0.01086410041898489 2023-01-24 05:01:32.492158: step: 1148/530, loss: 0.014534154906868935 2023-01-24 05:01:33.547495: step: 1152/530, loss: 0.009434904903173447 2023-01-24 05:01:34.607861: step: 1156/530, loss: 0.039193108677864075 2023-01-24 05:01:35.657719: step: 1160/530, loss: 0.01121500600129366 2023-01-24 05:01:36.722728: step: 1164/530, loss: 0.03556763008236885 2023-01-24 05:01:37.801396: step: 1168/530, loss: 0.048144567757844925 2023-01-24 05:01:38.840967: step: 1172/530, loss: 0.009631075896322727 2023-01-24 05:01:39.876239: step: 1176/530, loss: 0.04500937834382057 2023-01-24 05:01:40.938887: step: 1180/530, loss: 0.008284853771328926 2023-01-24 05:01:41.981216: step: 1184/530, loss: 0.038502469658851624 2023-01-24 05:01:43.024869: step: 1188/530, loss: 0.035055097192525864 2023-01-24 05:01:44.060416: step: 1192/530, loss: 0.0 2023-01-24 05:01:45.106273: step: 1196/530, loss: 0.04667744040489197 2023-01-24 05:01:46.144938: step: 1200/530, loss: 0.02551337517797947 2023-01-24 05:01:47.199183: step: 1204/530, loss: 0.022924574092030525 2023-01-24 05:01:48.221731: step: 1208/530, loss: 0.011838776990771294 2023-01-24 05:01:49.264052: step: 1212/530, loss: 0.017896490171551704 2023-01-24 05:01:50.303284: step: 1216/530, loss: 0.012125873006880283 2023-01-24 05:01:51.352387: step: 1220/530, loss: 0.008926368318498135 2023-01-24 05:01:52.393457: step: 1224/530, loss: 0.006506599485874176 2023-01-24 05:01:53.435237: step: 1228/530, loss: 0.03445328772068024 2023-01-24 05:01:54.480163: step: 1232/530, loss: 0.025107944384217262 2023-01-24 05:01:55.527405: step: 1236/530, loss: 0.07491537928581238 2023-01-24 05:01:56.573501: step: 1240/530, loss: 0.05032229796051979 2023-01-24 05:01:57.633578: step: 1244/530, loss: 0.031171901151537895 2023-01-24 05:01:58.701951: step: 1248/530, loss: 0.008107133209705353 2023-01-24 05:01:59.737023: step: 1252/530, loss: 0.012835049070417881 2023-01-24 05:02:00.783001: step: 1256/530, loss: 0.0331944115459919 2023-01-24 05:02:01.863834: step: 1260/530, loss: 0.012265531346201897 2023-01-24 05:02:02.929335: step: 1264/530, loss: 0.03081982210278511 2023-01-24 05:02:03.953464: step: 1268/530, loss: 0.017442643642425537 2023-01-24 05:02:05.005973: step: 1272/530, loss: 0.008818896487355232 2023-01-24 05:02:06.055393: step: 1276/530, loss: 0.009429981000721455 2023-01-24 05:02:07.091316: step: 1280/530, loss: 0.0068158721551299095 2023-01-24 05:02:08.142218: step: 1284/530, loss: 0.06472896039485931 2023-01-24 05:02:09.193648: step: 1288/530, loss: 0.013817965984344482 2023-01-24 05:02:10.236787: step: 1292/530, loss: 0.04319170489907265 2023-01-24 05:02:11.278732: step: 1296/530, loss: 0.00434703566133976 2023-01-24 05:02:12.336647: step: 1300/530, loss: 0.014109157957136631 2023-01-24 05:02:13.376976: step: 1304/530, loss: 0.0176323764026165 2023-01-24 05:02:14.417796: step: 1308/530, loss: 0.0253970455378294 2023-01-24 05:02:15.464615: step: 1312/530, loss: 0.016420656815171242 2023-01-24 05:02:16.517789: step: 1316/530, loss: 0.016026459634304047 2023-01-24 05:02:17.566244: step: 1320/530, loss: 0.00875675119459629 2023-01-24 05:02:18.614586: step: 1324/530, loss: 0.019109154120087624 2023-01-24 05:02:19.657255: step: 1328/530, loss: 0.02545016258955002 2023-01-24 05:02:20.719232: step: 1332/530, loss: 0.015020868740975857 2023-01-24 05:02:21.761856: step: 1336/530, loss: 0.013192745856940746 2023-01-24 05:02:22.811030: step: 1340/530, loss: 0.008076358586549759 2023-01-24 05:02:23.865780: step: 1344/530, loss: 0.01662585884332657 2023-01-24 05:02:24.904281: step: 1348/530, loss: 0.014491165056824684 2023-01-24 05:02:25.938182: step: 1352/530, loss: 0.007139723282307386 2023-01-24 05:02:26.974005: step: 1356/530, loss: 0.013656837865710258 2023-01-24 05:02:28.016662: step: 1360/530, loss: 0.01911047101020813 2023-01-24 05:02:29.062967: step: 1364/530, loss: 0.0608656108379364 2023-01-24 05:02:30.106025: step: 1368/530, loss: 0.01656697690486908 2023-01-24 05:02:31.148402: step: 1372/530, loss: 0.01165794301778078 2023-01-24 05:02:32.222657: step: 1376/530, loss: 0.007821107283234596 2023-01-24 05:02:33.273266: step: 1380/530, loss: 0.008379621431231499 2023-01-24 05:02:34.343593: step: 1384/530, loss: 0.04263940826058388 2023-01-24 05:02:35.384707: step: 1388/530, loss: 0.03730163723230362 2023-01-24 05:02:36.430744: step: 1392/530, loss: 0.04185022413730621 2023-01-24 05:02:37.486988: step: 1396/530, loss: 0.013346433639526367 2023-01-24 05:02:38.541278: step: 1400/530, loss: 0.010640447027981281 2023-01-24 05:02:39.584435: step: 1404/530, loss: 0.026997994631528854 2023-01-24 05:02:40.656976: step: 1408/530, loss: 0.03975527361035347 2023-01-24 05:02:41.718931: step: 1412/530, loss: 0.007448334246873856 2023-01-24 05:02:42.769931: step: 1416/530, loss: 0.059563349932432175 2023-01-24 05:02:43.813991: step: 1420/530, loss: 0.04467020556330681 2023-01-24 05:02:44.879987: step: 1424/530, loss: 0.015791745856404305 2023-01-24 05:02:45.915600: step: 1428/530, loss: 0.007467383984476328 2023-01-24 05:02:46.970126: step: 1432/530, loss: 0.04677760228514671 2023-01-24 05:02:48.025341: step: 1436/530, loss: 0.014661049470305443 2023-01-24 05:02:49.059175: step: 1440/530, loss: 0.04245565086603165 2023-01-24 05:02:50.117027: step: 1444/530, loss: 0.016248386353254318 2023-01-24 05:02:51.177160: step: 1448/530, loss: 0.0616140142083168 2023-01-24 05:02:52.218269: step: 1452/530, loss: 0.01275690644979477 2023-01-24 05:02:53.265867: step: 1456/530, loss: 0.018116962164640427 2023-01-24 05:02:54.310965: step: 1460/530, loss: 0.03878491371870041 2023-01-24 05:02:55.345873: step: 1464/530, loss: 0.016520487144589424 2023-01-24 05:02:56.391037: step: 1468/530, loss: 0.024132516235113144 2023-01-24 05:02:57.445697: step: 1472/530, loss: 0.04045415297150612 2023-01-24 05:02:58.492949: step: 1476/530, loss: 0.02203725278377533 2023-01-24 05:02:59.548468: step: 1480/530, loss: 0.008971241302788258 2023-01-24 05:03:00.603071: step: 1484/530, loss: 0.03543095663189888 2023-01-24 05:03:01.644979: step: 1488/530, loss: 0.01844763569533825 2023-01-24 05:03:02.681840: step: 1492/530, loss: 0.008905330672860146 2023-01-24 05:03:03.737371: step: 1496/530, loss: 0.01676773652434349 2023-01-24 05:03:04.786766: step: 1500/530, loss: 0.01816197670996189 2023-01-24 05:03:05.831892: step: 1504/530, loss: 0.013253842480480671 2023-01-24 05:03:06.869814: step: 1508/530, loss: 0.01869339309632778 2023-01-24 05:03:07.933461: step: 1512/530, loss: 0.00848846510052681 2023-01-24 05:03:08.970654: step: 1516/530, loss: 0.0009101839968934655 2023-01-24 05:03:10.023190: step: 1520/530, loss: 0.006233740597963333 2023-01-24 05:03:11.082599: step: 1524/530, loss: 0.03229101374745369 2023-01-24 05:03:12.129187: step: 1528/530, loss: 0.013248422183096409 2023-01-24 05:03:13.181110: step: 1532/530, loss: 0.009252777323126793 2023-01-24 05:03:14.231780: step: 1536/530, loss: 0.0035703161265701056 2023-01-24 05:03:15.269514: step: 1540/530, loss: 0.009456614963710308 2023-01-24 05:03:16.315608: step: 1544/530, loss: 0.009363709017634392 2023-01-24 05:03:17.363534: step: 1548/530, loss: 0.0897272378206253 2023-01-24 05:03:18.399975: step: 1552/530, loss: 0.05218866840004921 2023-01-24 05:03:19.459176: step: 1556/530, loss: 0.010671944357454777 2023-01-24 05:03:20.495149: step: 1560/530, loss: 0.008355812169611454 2023-01-24 05:03:21.539738: step: 1564/530, loss: 0.004710738081485033 2023-01-24 05:03:22.592607: step: 1568/530, loss: 0.09251004457473755 2023-01-24 05:03:23.649873: step: 1572/530, loss: 0.007496704813092947 2023-01-24 05:03:24.700435: step: 1576/530, loss: 0.01327112689614296 2023-01-24 05:03:25.731276: step: 1580/530, loss: 0.009883316233754158 2023-01-24 05:03:26.808168: step: 1584/530, loss: 0.02566574700176716 2023-01-24 05:03:27.856326: step: 1588/530, loss: 0.0 2023-01-24 05:03:28.899040: step: 1592/530, loss: 0.006210661493241787 2023-01-24 05:03:29.956626: step: 1596/530, loss: 0.014399432577192783 2023-01-24 05:03:31.007765: step: 1600/530, loss: 0.012009043246507645 2023-01-24 05:03:32.064767: step: 1604/530, loss: 0.025204863399267197 2023-01-24 05:03:33.105143: step: 1608/530, loss: 0.010684474371373653 2023-01-24 05:03:34.171020: step: 1612/530, loss: 0.008406277745962143 2023-01-24 05:03:35.218067: step: 1616/530, loss: 0.00841812789440155 2023-01-24 05:03:36.264088: step: 1620/530, loss: 0.007304898463189602 2023-01-24 05:03:37.300318: step: 1624/530, loss: 0.004615768790245056 2023-01-24 05:03:38.341636: step: 1628/530, loss: 0.03297346085309982 2023-01-24 05:03:39.388332: step: 1632/530, loss: 0.013780905865132809 2023-01-24 05:03:40.450668: step: 1636/530, loss: 0.03210994601249695 2023-01-24 05:03:41.489259: step: 1640/530, loss: 0.007842929102480412 2023-01-24 05:03:42.563057: step: 1644/530, loss: 0.008495690301060677 2023-01-24 05:03:43.605324: step: 1648/530, loss: 0.010128493420779705 2023-01-24 05:03:44.655027: step: 1652/530, loss: 0.006616923026740551 2023-01-24 05:03:45.709391: step: 1656/530, loss: 0.010074500925838947 2023-01-24 05:03:46.761564: step: 1660/530, loss: 0.03827520087361336 2023-01-24 05:03:47.800600: step: 1664/530, loss: 0.014995967969298363 2023-01-24 05:03:48.842773: step: 1668/530, loss: 0.014161030761897564 2023-01-24 05:03:49.892365: step: 1672/530, loss: 0.0067509314976632595 2023-01-24 05:03:50.932146: step: 1676/530, loss: 0.02198561280965805 2023-01-24 05:03:51.979438: step: 1680/530, loss: 0.019412247464060783 2023-01-24 05:03:53.021866: step: 1684/530, loss: 0.013593340292572975 2023-01-24 05:03:54.080928: step: 1688/530, loss: 0.06433723866939545 2023-01-24 05:03:55.127238: step: 1692/530, loss: 0.02928980253636837 2023-01-24 05:03:56.164768: step: 1696/530, loss: 0.013907265849411488 2023-01-24 05:03:57.209669: step: 1700/530, loss: 0.06132680922746658 2023-01-24 05:03:58.258027: step: 1704/530, loss: 0.0038807429373264313 2023-01-24 05:03:59.305369: step: 1708/530, loss: 0.011430630460381508 2023-01-24 05:04:00.339053: step: 1712/530, loss: 0.027682211250066757 2023-01-24 05:04:01.379886: step: 1716/530, loss: 0.029594920575618744 2023-01-24 05:04:02.437455: step: 1720/530, loss: 0.01209992915391922 2023-01-24 05:04:03.485456: step: 1724/530, loss: 0.03204839676618576 2023-01-24 05:04:04.533521: step: 1728/530, loss: 0.009996633976697922 2023-01-24 05:04:05.563592: step: 1732/530, loss: 0.01476296130567789 2023-01-24 05:04:06.627207: step: 1736/530, loss: 0.0039046211168169975 2023-01-24 05:04:07.658049: step: 1740/530, loss: 0.004724082536995411 2023-01-24 05:04:08.703458: step: 1744/530, loss: 0.01035708375275135 2023-01-24 05:04:09.763330: step: 1748/530, loss: 0.01116228848695755 2023-01-24 05:04:10.810988: step: 1752/530, loss: 0.006762249395251274 2023-01-24 05:04:11.871596: step: 1756/530, loss: 0.01807950995862484 2023-01-24 05:04:12.915950: step: 1760/530, loss: 0.00912668276578188 2023-01-24 05:04:13.966560: step: 1764/530, loss: 0.005292718298733234 2023-01-24 05:04:15.011823: step: 1768/530, loss: 0.004882217850536108 2023-01-24 05:04:16.068833: step: 1772/530, loss: 0.007848333567380905 2023-01-24 05:04:17.098536: step: 1776/530, loss: 0.004974755458533764 2023-01-24 05:04:18.160659: step: 1780/530, loss: 0.00784052163362503 2023-01-24 05:04:19.203446: step: 1784/530, loss: 0.006111221853643656 2023-01-24 05:04:20.256504: step: 1788/530, loss: 0.008439870551228523 2023-01-24 05:04:21.306593: step: 1792/530, loss: 0.007257196586579084 2023-01-24 05:04:22.346482: step: 1796/530, loss: 0.03097677417099476 2023-01-24 05:04:23.397527: step: 1800/530, loss: 0.02392994426190853 2023-01-24 05:04:24.457150: step: 1804/530, loss: 0.01921793259680271 2023-01-24 05:04:25.505123: step: 1808/530, loss: 0.0157614853233099 2023-01-24 05:04:26.539354: step: 1812/530, loss: 0.013865902088582516 2023-01-24 05:04:27.594650: step: 1816/530, loss: 0.00809855293482542 2023-01-24 05:04:28.664004: step: 1820/530, loss: 0.009653554297983646 2023-01-24 05:04:29.709605: step: 1824/530, loss: 0.009131310507655144 2023-01-24 05:04:30.760226: step: 1828/530, loss: 0.03661736845970154 2023-01-24 05:04:31.820398: step: 1832/530, loss: 0.01243253331631422 2023-01-24 05:04:32.871286: step: 1836/530, loss: 0.004411943722516298 2023-01-24 05:04:33.924164: step: 1840/530, loss: 0.034142088145017624 2023-01-24 05:04:34.979512: step: 1844/530, loss: 0.0510825589299202 2023-01-24 05:04:36.027778: step: 1848/530, loss: 0.0037943634670227766 2023-01-24 05:04:37.070883: step: 1852/530, loss: 0.007966898381710052 2023-01-24 05:04:38.139968: step: 1856/530, loss: 0.006379609927535057 2023-01-24 05:04:39.192535: step: 1860/530, loss: 0.028586218133568764 2023-01-24 05:04:40.242405: step: 1864/530, loss: 0.024182695895433426 2023-01-24 05:04:41.280597: step: 1868/530, loss: 0.012714968994259834 2023-01-24 05:04:42.331458: step: 1872/530, loss: 0.007266114931553602 2023-01-24 05:04:43.368160: step: 1876/530, loss: 0.016135327517986298 2023-01-24 05:04:44.412817: step: 1880/530, loss: 0.01627356745302677 2023-01-24 05:04:45.443867: step: 1884/530, loss: 0.010763503611087799 2023-01-24 05:04:46.497435: step: 1888/530, loss: 0.044665493071079254 2023-01-24 05:04:47.544381: step: 1892/530, loss: 0.02698495425283909 2023-01-24 05:04:48.582746: step: 1896/530, loss: 0.01269553229212761 2023-01-24 05:04:49.622515: step: 1900/530, loss: 0.006397400051355362 2023-01-24 05:04:50.706307: step: 1904/530, loss: 0.00925454031676054 2023-01-24 05:04:51.752046: step: 1908/530, loss: 0.029682034626603127 2023-01-24 05:04:52.784021: step: 1912/530, loss: 0.017402449622750282 2023-01-24 05:04:53.824169: step: 1916/530, loss: 0.006162512116134167 2023-01-24 05:04:54.877785: step: 1920/530, loss: 0.0045259553007781506 2023-01-24 05:04:55.934676: step: 1924/530, loss: 0.00969818327575922 2023-01-24 05:04:56.988139: step: 1928/530, loss: 0.008025826886296272 2023-01-24 05:04:58.041713: step: 1932/530, loss: 0.01395223569124937 2023-01-24 05:04:59.099316: step: 1936/530, loss: 0.012100683525204659 2023-01-24 05:05:00.134464: step: 1940/530, loss: 0.02019091136753559 2023-01-24 05:05:01.186946: step: 1944/530, loss: 0.018800778314471245 2023-01-24 05:05:02.230622: step: 1948/530, loss: 0.021765897050499916 2023-01-24 05:05:03.278358: step: 1952/530, loss: 0.01721109077334404 2023-01-24 05:05:04.333677: step: 1956/530, loss: 0.03487658500671387 2023-01-24 05:05:05.376654: step: 1960/530, loss: 0.006069914437830448 2023-01-24 05:05:06.428586: step: 1964/530, loss: 0.06411559134721756 2023-01-24 05:05:07.463382: step: 1968/530, loss: 0.01284013967961073 2023-01-24 05:05:08.512831: step: 1972/530, loss: 0.008704513311386108 2023-01-24 05:05:09.549282: step: 1976/530, loss: 0.0011018546065315604 2023-01-24 05:05:10.596440: step: 1980/530, loss: 0.014638877473771572 2023-01-24 05:05:11.639949: step: 1984/530, loss: 0.010074022226035595 2023-01-24 05:05:12.688904: step: 1988/530, loss: 0.031635627150535583 2023-01-24 05:05:13.738387: step: 1992/530, loss: 0.03363392874598503 2023-01-24 05:05:14.789977: step: 1996/530, loss: 0.026511678472161293 2023-01-24 05:05:15.823160: step: 2000/530, loss: 0.02227601781487465 2023-01-24 05:05:16.874584: step: 2004/530, loss: 0.022974004969000816 2023-01-24 05:05:17.928979: step: 2008/530, loss: 0.012734156101942062 2023-01-24 05:05:18.974315: step: 2012/530, loss: 0.016996197402477264 2023-01-24 05:05:20.024200: step: 2016/530, loss: 0.0056351288221776485 2023-01-24 05:05:21.075375: step: 2020/530, loss: 0.008489016443490982 2023-01-24 05:05:22.114503: step: 2024/530, loss: 0.022434482350945473 2023-01-24 05:05:23.155561: step: 2028/530, loss: 0.017772993072867393 2023-01-24 05:05:24.187259: step: 2032/530, loss: 0.012262226082384586 2023-01-24 05:05:25.220953: step: 2036/530, loss: 0.007736681494861841 2023-01-24 05:05:26.263321: step: 2040/530, loss: 0.009416958317160606 2023-01-24 05:05:27.285499: step: 2044/530, loss: 0.006539102178066969 2023-01-24 05:05:28.337713: step: 2048/530, loss: 0.007677316665649414 2023-01-24 05:05:29.373569: step: 2052/530, loss: 0.013833217322826385 2023-01-24 05:05:30.426572: step: 2056/530, loss: 0.012024348601698875 2023-01-24 05:05:31.471743: step: 2060/530, loss: 0.029821518808603287 2023-01-24 05:05:32.539389: step: 2064/530, loss: 0.003974899183958769 2023-01-24 05:05:33.598313: step: 2068/530, loss: 0.023904291912913322 2023-01-24 05:05:34.649842: step: 2072/530, loss: 0.01618839055299759 2023-01-24 05:05:35.709897: step: 2076/530, loss: 0.017006777226924896 2023-01-24 05:05:36.772135: step: 2080/530, loss: 0.03427751362323761 2023-01-24 05:05:37.806910: step: 2084/530, loss: 0.01980504021048546 2023-01-24 05:05:38.837613: step: 2088/530, loss: 0.01490362174808979 2023-01-24 05:05:39.866251: step: 2092/530, loss: 0.01789029687643051 2023-01-24 05:05:40.916397: step: 2096/530, loss: 0.004750585649162531 2023-01-24 05:05:41.956612: step: 2100/530, loss: 0.014235352165997028 2023-01-24 05:05:42.999087: step: 2104/530, loss: 0.006032113451510668 2023-01-24 05:05:44.055483: step: 2108/530, loss: 0.005484898108989 2023-01-24 05:05:45.099523: step: 2112/530, loss: 0.009656216017901897 2023-01-24 05:05:46.148205: step: 2116/530, loss: 0.005013451911509037 2023-01-24 05:05:47.176465: step: 2120/530, loss: 0.007228979840874672 ================================================== Loss: 0.022 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3738546380090498, 'r': 0.3135555028462998, 'f1': 0.34106037151702784}, 'combined': 0.25130764217044155, 'stategy': 1, 'epoch': 0} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36737558326918535, 'r': 0.3794979673183977, 'f1': 0.373338397064357}, 'combined': 0.28938191542787484, 'stategy': 1, 'epoch': 0} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38570432079081635, 'r': 0.32788526701002985, 'f1': 0.35445238095238096}, 'combined': 0.2611754385964912, 'stategy': 1, 'epoch': 0} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.35770135689369326, 'r': 0.35375612133971873, 'f1': 0.35571780038596484}, 'combined': 0.2757238452752455, 'stategy': 1, 'epoch': 0} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3831916622413657, 'r': 0.3242950310429774, 'f1': 0.35129184246587686}, 'combined': 0.2588466207643303, 'stategy': 1, 'epoch': 0} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3533647798208727, 'r': 0.3517408607959607, 'f1': 0.352550950295721}, 'combined': 0.2732691576454871, 'stategy': 1, 'epoch': 0} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 0} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.45588235294117646, 'r': 0.33695652173913043, 'f1': 0.3875}, 'combined': 0.19375, 'stategy': 1, 'epoch': 0} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6096491228070176, 'r': 0.18920145190562612, 'f1': 0.28878116343490307}, 'combined': 0.1925207756232687, 'stategy': 1, 'epoch': 0} New best chinese model... New best korean model... New best russian model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3738546380090498, 'r': 0.3135555028462998, 'f1': 0.34106037151702784}, 'combined': 0.25130764217044155, 'stategy': 1, 'epoch': 0} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36737558326918535, 'r': 0.3794979673183977, 'f1': 0.373338397064357}, 'combined': 0.28938191542787484, 'stategy': 1, 'epoch': 0} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 0} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38570432079081635, 'r': 0.32788526701002985, 'f1': 0.35445238095238096}, 'combined': 0.2611754385964912, 'stategy': 1, 'epoch': 0} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.35770135689369326, 'r': 0.35375612133971873, 'f1': 0.35571780038596484}, 'combined': 0.2757238452752455, 'stategy': 1, 'epoch': 0} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.45588235294117646, 'r': 0.33695652173913043, 'f1': 0.3875}, 'combined': 0.19375, 'stategy': 1, 'epoch': 0} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3831916622413657, 'r': 0.3242950310429774, 'f1': 0.35129184246587686}, 'combined': 0.2588466207643303, 'stategy': 1, 'epoch': 0} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3533647798208727, 'r': 0.3517408607959607, 'f1': 0.352550950295721}, 'combined': 0.2732691576454871, 'stategy': 1, 'epoch': 0} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6096491228070176, 'r': 0.18920145190562612, 'f1': 0.28878116343490307}, 'combined': 0.1925207756232687, 'stategy': 1, 'epoch': 0} ****************************** Epoch: 1 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 05:08:23.823845: step: 4/530, loss: 0.0098522137850523 2023-01-24 05:08:24.865194: step: 8/530, loss: 0.005377455148845911 2023-01-24 05:08:25.897502: step: 12/530, loss: 0.006909853778779507 2023-01-24 05:08:26.918249: step: 16/530, loss: 0.006114135030657053 2023-01-24 05:08:27.947446: step: 20/530, loss: 0.012564241886138916 2023-01-24 05:08:29.007094: step: 24/530, loss: 0.0422721803188324 2023-01-24 05:08:30.041807: step: 28/530, loss: 0.020891595631837845 2023-01-24 05:08:31.073074: step: 32/530, loss: 0.0032217446714639664 2023-01-24 05:08:32.113851: step: 36/530, loss: 0.005921873264014721 2023-01-24 05:08:33.148300: step: 40/530, loss: 0.010434969328343868 2023-01-24 05:08:34.184905: step: 44/530, loss: 0.00887048989534378 2023-01-24 05:08:35.230187: step: 48/530, loss: 0.029717912897467613 2023-01-24 05:08:36.268595: step: 52/530, loss: 0.0068167694844305515 2023-01-24 05:08:37.301713: step: 56/530, loss: 0.009218721650540829 2023-01-24 05:08:38.327073: step: 60/530, loss: 0.007991575635969639 2023-01-24 05:08:39.377158: step: 64/530, loss: 0.01888984441757202 2023-01-24 05:08:40.424964: step: 68/530, loss: 0.017180604860186577 2023-01-24 05:08:41.458797: step: 72/530, loss: 0.055858999490737915 2023-01-24 05:08:42.513327: step: 76/530, loss: 0.010794703848659992 2023-01-24 05:08:43.552922: step: 80/530, loss: 0.017841270193457603 2023-01-24 05:08:44.590672: step: 84/530, loss: 0.009985985234379768 2023-01-24 05:08:45.633059: step: 88/530, loss: 0.03523147478699684 2023-01-24 05:08:46.704845: step: 92/530, loss: 0.010065844282507896 2023-01-24 05:08:47.760890: step: 96/530, loss: 0.008606970310211182 2023-01-24 05:08:48.793214: step: 100/530, loss: 0.011893689632415771 2023-01-24 05:08:49.837084: step: 104/530, loss: 0.008819621987640858 2023-01-24 05:08:50.871202: step: 108/530, loss: 0.014171184040606022 2023-01-24 05:08:51.896963: step: 112/530, loss: 0.014161612838506699 2023-01-24 05:08:52.957050: step: 116/530, loss: 0.01990302838385105 2023-01-24 05:08:54.001571: step: 120/530, loss: 0.011115428991615772 2023-01-24 05:08:55.027188: step: 124/530, loss: 0.0008971584029495716 2023-01-24 05:08:56.086442: step: 128/530, loss: 0.013212819583714008 2023-01-24 05:08:57.131069: step: 132/530, loss: 0.013090829364955425 2023-01-24 05:08:58.186549: step: 136/530, loss: 0.00854986160993576 2023-01-24 05:08:59.233372: step: 140/530, loss: 0.00937812589108944 2023-01-24 05:09:00.290700: step: 144/530, loss: 0.005623607896268368 2023-01-24 05:09:01.327286: step: 148/530, loss: 0.03182008117437363 2023-01-24 05:09:02.388360: step: 152/530, loss: 0.011129575781524181 2023-01-24 05:09:03.425042: step: 156/530, loss: 0.006379378028213978 2023-01-24 05:09:04.479187: step: 160/530, loss: 0.009916199371218681 2023-01-24 05:09:05.550189: step: 164/530, loss: 0.011921132914721966 2023-01-24 05:09:06.614296: step: 168/530, loss: 0.019632887095212936 2023-01-24 05:09:07.650187: step: 172/530, loss: 0.00840664654970169 2023-01-24 05:09:08.709613: step: 176/530, loss: 0.010645314119756222 2023-01-24 05:09:09.738755: step: 180/530, loss: 0.01473387610167265 2023-01-24 05:09:10.780939: step: 184/530, loss: 0.001186772482469678 2023-01-24 05:09:11.835549: step: 188/530, loss: 0.011140630580484867 2023-01-24 05:09:12.891962: step: 192/530, loss: 0.049186792224645615 2023-01-24 05:09:13.951511: step: 196/530, loss: 0.008088590577244759 2023-01-24 05:09:14.988052: step: 200/530, loss: 0.0036882306449115276 2023-01-24 05:09:16.041848: step: 204/530, loss: 0.012489606626331806 2023-01-24 05:09:17.089473: step: 208/530, loss: 0.005425607319921255 2023-01-24 05:09:18.134792: step: 212/530, loss: 0.01253504678606987 2023-01-24 05:09:19.195449: step: 216/530, loss: 0.02669784426689148 2023-01-24 05:09:20.244993: step: 220/530, loss: 0.004981519188731909 2023-01-24 05:09:21.303631: step: 224/530, loss: 0.009377394802868366 2023-01-24 05:09:22.369531: step: 228/530, loss: 0.0056566959246993065 2023-01-24 05:09:23.407664: step: 232/530, loss: 0.009297311305999756 2023-01-24 05:09:24.457836: step: 236/530, loss: 0.01048303209245205 2023-01-24 05:09:25.500790: step: 240/530, loss: 0.011084770783782005 2023-01-24 05:09:26.549300: step: 244/530, loss: 0.006352561060339212 2023-01-24 05:09:27.593263: step: 248/530, loss: 0.004507776349782944 2023-01-24 05:09:28.652563: step: 252/530, loss: 0.016194891184568405 2023-01-24 05:09:29.693253: step: 256/530, loss: 0.01039045862853527 2023-01-24 05:09:30.749750: step: 260/530, loss: 0.02721661515533924 2023-01-24 05:09:31.778063: step: 264/530, loss: 0.024171089753508568 2023-01-24 05:09:32.837963: step: 268/530, loss: 0.005026126746088266 2023-01-24 05:09:33.889724: step: 272/530, loss: 0.0088877622038126 2023-01-24 05:09:34.947483: step: 276/530, loss: 0.003714266698807478 2023-01-24 05:09:35.983320: step: 280/530, loss: 0.009569758549332619 2023-01-24 05:09:37.032183: step: 284/530, loss: 0.0025022635236382484 2023-01-24 05:09:38.073295: step: 288/530, loss: 0.012150965631008148 2023-01-24 05:09:39.124151: step: 292/530, loss: 0.07076514512300491 2023-01-24 05:09:40.178669: step: 296/530, loss: 0.011095026507973671 2023-01-24 05:09:41.227036: step: 300/530, loss: 0.024889731779694557 2023-01-24 05:09:42.263714: step: 304/530, loss: 0.03508802503347397 2023-01-24 05:09:43.336699: step: 308/530, loss: 0.009202630259096622 2023-01-24 05:09:44.390782: step: 312/530, loss: 0.024294743314385414 2023-01-24 05:09:45.446255: step: 316/530, loss: 0.007532244548201561 2023-01-24 05:09:46.488567: step: 320/530, loss: 0.007840575650334358 2023-01-24 05:09:47.554837: step: 324/530, loss: 0.011313081718981266 2023-01-24 05:09:48.607762: step: 328/530, loss: 0.017736399546265602 2023-01-24 05:09:49.648051: step: 332/530, loss: 0.013835232704877853 2023-01-24 05:09:50.684193: step: 336/530, loss: 0.007591048255562782 2023-01-24 05:09:51.722172: step: 340/530, loss: 0.012173166498541832 2023-01-24 05:09:52.781818: step: 344/530, loss: 0.008337490260601044 2023-01-24 05:09:53.841813: step: 348/530, loss: 0.018094103783369064 2023-01-24 05:09:54.888300: step: 352/530, loss: 0.011654539033770561 2023-01-24 05:09:55.928407: step: 356/530, loss: 0.0037538036704063416 2023-01-24 05:09:56.973153: step: 360/530, loss: 0.011034824885427952 2023-01-24 05:09:58.007277: step: 364/530, loss: 0.008073040284216404 2023-01-24 05:09:59.049734: step: 368/530, loss: 0.008059673942625523 2023-01-24 05:10:00.109329: step: 372/530, loss: 0.007434504572302103 2023-01-24 05:10:01.155490: step: 376/530, loss: 0.021508976817131042 2023-01-24 05:10:02.204121: step: 380/530, loss: 0.00594729371368885 2023-01-24 05:10:03.248645: step: 384/530, loss: 0.004328927490860224 2023-01-24 05:10:04.291175: step: 388/530, loss: 0.019735587760806084 2023-01-24 05:10:05.340835: step: 392/530, loss: 0.03632958233356476 2023-01-24 05:10:06.406315: step: 396/530, loss: 0.009657775983214378 2023-01-24 05:10:07.458450: step: 400/530, loss: 0.02911049872636795 2023-01-24 05:10:08.502089: step: 404/530, loss: 0.04207779839634895 2023-01-24 05:10:09.526776: step: 408/530, loss: 0.018335117027163506 2023-01-24 05:10:10.576699: step: 412/530, loss: 0.01259111613035202 2023-01-24 05:10:11.645766: step: 416/530, loss: 0.04776895046234131 2023-01-24 05:10:12.700825: step: 420/530, loss: 0.008508259430527687 2023-01-24 05:10:13.751950: step: 424/530, loss: 0.005509136710315943 2023-01-24 05:10:14.793585: step: 428/530, loss: 0.022022981196641922 2023-01-24 05:10:15.836944: step: 432/530, loss: 0.005825175903737545 2023-01-24 05:10:16.895002: step: 436/530, loss: 0.006391631439328194 2023-01-24 05:10:17.940024: step: 440/530, loss: 0.029798265546560287 2023-01-24 05:10:18.980672: step: 444/530, loss: 0.01169007271528244 2023-01-24 05:10:20.018001: step: 448/530, loss: 0.00993143580853939 2023-01-24 05:10:21.068391: step: 452/530, loss: 0.023017197847366333 2023-01-24 05:10:22.121289: step: 456/530, loss: 0.045980166643857956 2023-01-24 05:10:23.191477: step: 460/530, loss: 0.0062423935160040855 2023-01-24 05:10:24.232997: step: 464/530, loss: 0.02088567614555359 2023-01-24 05:10:25.293404: step: 468/530, loss: 0.0356353335082531 2023-01-24 05:10:26.343335: step: 472/530, loss: 0.006775871384888887 2023-01-24 05:10:27.392230: step: 476/530, loss: 0.02590928040444851 2023-01-24 05:10:28.438486: step: 480/530, loss: 0.02843741700053215 2023-01-24 05:10:29.481038: step: 484/530, loss: 0.011266574263572693 2023-01-24 05:10:30.536605: step: 488/530, loss: 0.01505152229219675 2023-01-24 05:10:31.583738: step: 492/530, loss: 0.018635883927345276 2023-01-24 05:10:32.633127: step: 496/530, loss: 0.024898337200284004 2023-01-24 05:10:33.678383: step: 500/530, loss: 0.0 2023-01-24 05:10:34.709609: step: 504/530, loss: 0.0073678456246852875 2023-01-24 05:10:35.755064: step: 508/530, loss: 0.00479509960860014 2023-01-24 05:10:36.781582: step: 512/530, loss: 0.022892314940690994 2023-01-24 05:10:37.830414: step: 516/530, loss: 0.018966952338814735 2023-01-24 05:10:38.872007: step: 520/530, loss: 0.00934302806854248 2023-01-24 05:10:39.932437: step: 524/530, loss: 0.006274034269154072 2023-01-24 05:10:40.972628: step: 528/530, loss: 0.010546999052166939 2023-01-24 05:10:42.021481: step: 532/530, loss: 0.052468761801719666 2023-01-24 05:10:43.060750: step: 536/530, loss: 0.06969141960144043 2023-01-24 05:10:44.105484: step: 540/530, loss: 0.010747411288321018 2023-01-24 05:10:45.172463: step: 544/530, loss: 0.009659159928560257 2023-01-24 05:10:46.223610: step: 548/530, loss: 0.016071975231170654 2023-01-24 05:10:47.260342: step: 552/530, loss: 0.007158543914556503 2023-01-24 05:10:48.315940: step: 556/530, loss: 0.009879428893327713 2023-01-24 05:10:49.376661: step: 560/530, loss: 0.0037339518312364817 2023-01-24 05:10:50.427965: step: 564/530, loss: 0.007042306941002607 2023-01-24 05:10:51.473945: step: 568/530, loss: 0.05043751746416092 2023-01-24 05:10:52.521837: step: 572/530, loss: 0.004624256398528814 2023-01-24 05:10:53.553634: step: 576/530, loss: 0.0010471967980265617 2023-01-24 05:10:54.587310: step: 580/530, loss: 0.00454417709261179 2023-01-24 05:10:55.632631: step: 584/530, loss: 0.014900184236466885 2023-01-24 05:10:56.657887: step: 588/530, loss: 0.005375597160309553 2023-01-24 05:10:57.694352: step: 592/530, loss: 0.005241508595645428 2023-01-24 05:10:58.746076: step: 596/530, loss: 0.060182321816682816 2023-01-24 05:10:59.799041: step: 600/530, loss: 0.03885366767644882 2023-01-24 05:11:00.849410: step: 604/530, loss: 0.0677824541926384 2023-01-24 05:11:01.901888: step: 608/530, loss: 0.009053359739482403 2023-01-24 05:11:02.951664: step: 612/530, loss: 0.019364645704627037 2023-01-24 05:11:04.002933: step: 616/530, loss: 0.04223789647221565 2023-01-24 05:11:05.067508: step: 620/530, loss: 0.010694325901567936 2023-01-24 05:11:06.120018: step: 624/530, loss: 0.0040028151124715805 2023-01-24 05:11:07.177116: step: 628/530, loss: 0.023425258696079254 2023-01-24 05:11:08.219404: step: 632/530, loss: 0.0030718552879989147 2023-01-24 05:11:09.265024: step: 636/530, loss: 0.0242239348590374 2023-01-24 05:11:10.301306: step: 640/530, loss: 0.006455741822719574 2023-01-24 05:11:11.341315: step: 644/530, loss: 0.0049271429888904095 2023-01-24 05:11:12.369687: step: 648/530, loss: 0.007410630118101835 2023-01-24 05:11:13.424486: step: 652/530, loss: 0.020723998546600342 2023-01-24 05:11:14.468057: step: 656/530, loss: 0.0067084855400025845 2023-01-24 05:11:15.517526: step: 660/530, loss: 0.005124341230839491 2023-01-24 05:11:16.574723: step: 664/530, loss: 0.02306445688009262 2023-01-24 05:11:17.620039: step: 668/530, loss: 0.018467148765921593 2023-01-24 05:11:18.704299: step: 672/530, loss: 0.008959340862929821 2023-01-24 05:11:19.747564: step: 676/530, loss: 0.0060637579299509525 2023-01-24 05:11:20.788137: step: 680/530, loss: 0.004548309836536646 2023-01-24 05:11:21.851625: step: 684/530, loss: 0.004471042193472385 2023-01-24 05:11:22.907830: step: 688/530, loss: 0.006043381057679653 2023-01-24 05:11:23.945885: step: 692/530, loss: 0.008091883733868599 2023-01-24 05:11:24.986231: step: 696/530, loss: 0.008449411951005459 2023-01-24 05:11:26.034762: step: 700/530, loss: 0.014556603506207466 2023-01-24 05:11:27.067875: step: 704/530, loss: 0.005651827435940504 2023-01-24 05:11:28.145356: step: 708/530, loss: 0.03851265832781792 2023-01-24 05:11:29.190110: step: 712/530, loss: 0.007113317959010601 2023-01-24 05:11:30.244735: step: 716/530, loss: 0.0061908201314508915 2023-01-24 05:11:31.277153: step: 720/530, loss: 0.003702000714838505 2023-01-24 05:11:32.327134: step: 724/530, loss: 0.007190654054284096 2023-01-24 05:11:33.396254: step: 728/530, loss: 0.009460589848458767 2023-01-24 05:11:34.444093: step: 732/530, loss: 0.009790292009711266 2023-01-24 05:11:35.505632: step: 736/530, loss: 0.05745977908372879 2023-01-24 05:11:36.574188: step: 740/530, loss: 0.025261517614126205 2023-01-24 05:11:37.621478: step: 744/530, loss: 0.03459774702787399 2023-01-24 05:11:38.664971: step: 748/530, loss: 0.005876890383660793 2023-01-24 05:11:39.727224: step: 752/530, loss: 0.016318483278155327 2023-01-24 05:11:40.788768: step: 756/530, loss: 0.0425649918615818 2023-01-24 05:11:41.832542: step: 760/530, loss: 0.01010993029922247 2023-01-24 05:11:42.885056: step: 764/530, loss: 0.011428799480199814 2023-01-24 05:11:43.934043: step: 768/530, loss: 0.01426747441291809 2023-01-24 05:11:44.971918: step: 772/530, loss: 0.009529833681881428 2023-01-24 05:11:46.013103: step: 776/530, loss: 0.047059934586286545 2023-01-24 05:11:47.074066: step: 780/530, loss: 0.02529189921915531 2023-01-24 05:11:48.117923: step: 784/530, loss: 0.007859750650823116 2023-01-24 05:11:49.166495: step: 788/530, loss: 0.01606394723057747 2023-01-24 05:11:50.204564: step: 792/530, loss: 0.009316043928265572 2023-01-24 05:11:51.271856: step: 796/530, loss: 0.005559139885008335 2023-01-24 05:11:52.318920: step: 800/530, loss: 0.03796050325036049 2023-01-24 05:11:53.352129: step: 804/530, loss: 0.031788360327482224 2023-01-24 05:11:54.388444: step: 808/530, loss: 0.008990352973341942 2023-01-24 05:11:55.440001: step: 812/530, loss: 0.00991953257471323 2023-01-24 05:11:56.485631: step: 816/530, loss: 0.0075381132774055 2023-01-24 05:11:57.522723: step: 820/530, loss: 0.0027112795505672693 2023-01-24 05:11:58.566630: step: 824/530, loss: 0.009086180478334427 2023-01-24 05:11:59.624026: step: 828/530, loss: 0.005719413049519062 2023-01-24 05:12:00.674451: step: 832/530, loss: 0.006139660254120827 2023-01-24 05:12:01.725220: step: 836/530, loss: 0.01109407190233469 2023-01-24 05:12:02.768098: step: 840/530, loss: 0.015826737508177757 2023-01-24 05:12:03.832932: step: 844/530, loss: 0.010260578244924545 2023-01-24 05:12:04.878594: step: 848/530, loss: 0.07133742421865463 2023-01-24 05:12:05.936219: step: 852/530, loss: 0.005036797374486923 2023-01-24 05:12:06.974816: step: 856/530, loss: 0.0015289344592019916 2023-01-24 05:12:08.004635: step: 860/530, loss: 0.004141239915043116 2023-01-24 05:12:09.050202: step: 864/530, loss: 0.0076431892812252045 2023-01-24 05:12:10.084481: step: 868/530, loss: 0.039615388959646225 2023-01-24 05:12:11.130715: step: 872/530, loss: 0.00718665961176157 2023-01-24 05:12:12.181680: step: 876/530, loss: 0.012222104705870152 2023-01-24 05:12:13.234655: step: 880/530, loss: 0.004468315746635199 2023-01-24 05:12:14.287279: step: 884/530, loss: 0.012883608229458332 2023-01-24 05:12:15.344770: step: 888/530, loss: 0.0043690563179552555 2023-01-24 05:12:16.386343: step: 892/530, loss: 0.004753664135932922 2023-01-24 05:12:17.430935: step: 896/530, loss: 0.011920920573174953 2023-01-24 05:12:18.473109: step: 900/530, loss: 0.02754632756114006 2023-01-24 05:12:19.512456: step: 904/530, loss: 0.0001700153516139835 2023-01-24 05:12:20.552021: step: 908/530, loss: 0.020358387380838394 2023-01-24 05:12:21.600925: step: 912/530, loss: 0.007957402616739273 2023-01-24 05:12:22.642371: step: 916/530, loss: 0.012252870947122574 2023-01-24 05:12:23.692512: step: 920/530, loss: 0.0145163768902421 2023-01-24 05:12:24.761839: step: 924/530, loss: 0.02983572706580162 2023-01-24 05:12:25.810433: step: 928/530, loss: 0.0035612699575722218 2023-01-24 05:12:26.857808: step: 932/530, loss: 0.0055160121992230415 2023-01-24 05:12:27.909791: step: 936/530, loss: 0.055421456694602966 2023-01-24 05:12:28.959081: step: 940/530, loss: 0.007808417547494173 2023-01-24 05:12:29.991840: step: 944/530, loss: 0.012586615048348904 2023-01-24 05:12:31.033537: step: 948/530, loss: 0.004396616481244564 2023-01-24 05:12:32.084180: step: 952/530, loss: 0.00525481766089797 2023-01-24 05:12:33.148979: step: 956/530, loss: 0.02059188112616539 2023-01-24 05:12:34.185533: step: 960/530, loss: 0.003952351398766041 2023-01-24 05:12:35.249147: step: 964/530, loss: 0.01580275222659111 2023-01-24 05:12:36.305355: step: 968/530, loss: 0.007135107647627592 2023-01-24 05:12:37.343486: step: 972/530, loss: 0.006866042967885733 2023-01-24 05:12:38.381088: step: 976/530, loss: 0.005642477422952652 2023-01-24 05:12:39.434701: step: 980/530, loss: 0.0032362625934183598 2023-01-24 05:12:40.474855: step: 984/530, loss: 0.01378723606467247 2023-01-24 05:12:41.506226: step: 988/530, loss: 0.047178059816360474 2023-01-24 05:12:42.551176: step: 992/530, loss: 0.004135483410209417 2023-01-24 05:12:43.599776: step: 996/530, loss: 0.05625234916806221 2023-01-24 05:12:44.662969: step: 1000/530, loss: 0.008552772924304008 2023-01-24 05:12:45.716971: step: 1004/530, loss: 0.005845270119607449 2023-01-24 05:12:46.759619: step: 1008/530, loss: 0.0006229244754649699 2023-01-24 05:12:47.790767: step: 1012/530, loss: 0.052640024572610855 2023-01-24 05:12:48.835389: step: 1016/530, loss: 0.003908698447048664 2023-01-24 05:12:49.867894: step: 1020/530, loss: 0.006324539426714182 2023-01-24 05:12:50.923700: step: 1024/530, loss: 0.027349544689059258 2023-01-24 05:12:51.994678: step: 1028/530, loss: 0.008202177472412586 2023-01-24 05:12:53.039274: step: 1032/530, loss: 0.0035938865039497614 2023-01-24 05:12:54.098439: step: 1036/530, loss: 0.040193237364292145 2023-01-24 05:12:55.147530: step: 1040/530, loss: 0.011916923336684704 2023-01-24 05:12:56.187968: step: 1044/530, loss: 0.03896845132112503 2023-01-24 05:12:57.221206: step: 1048/530, loss: 0.002595658414065838 2023-01-24 05:12:58.269368: step: 1052/530, loss: 0.012275359593331814 2023-01-24 05:12:59.311616: step: 1056/530, loss: 0.007934757508337498 2023-01-24 05:13:00.345879: step: 1060/530, loss: 0.03688136115670204 2023-01-24 05:13:01.390705: step: 1064/530, loss: 0.04775184020400047 2023-01-24 05:13:02.440710: step: 1068/530, loss: 0.007793552242219448 2023-01-24 05:13:03.486612: step: 1072/530, loss: 0.020563939586281776 2023-01-24 05:13:04.529501: step: 1076/530, loss: 0.0057910131290555 2023-01-24 05:13:05.584403: step: 1080/530, loss: 0.007447263225913048 2023-01-24 05:13:06.603977: step: 1084/530, loss: 0.008960508741438389 2023-01-24 05:13:07.645787: step: 1088/530, loss: 0.0017355165909975767 2023-01-24 05:13:08.677151: step: 1092/530, loss: 0.009154271334409714 2023-01-24 05:13:09.723180: step: 1096/530, loss: 0.003979458473622799 2023-01-24 05:13:10.773841: step: 1100/530, loss: 0.0004259079578332603 2023-01-24 05:13:11.824686: step: 1104/530, loss: 0.06848970055580139 2023-01-24 05:13:12.867501: step: 1108/530, loss: 0.008959291502833366 2023-01-24 05:13:13.942981: step: 1112/530, loss: 0.055906157940626144 2023-01-24 05:13:14.996181: step: 1116/530, loss: 0.005702725611627102 2023-01-24 05:13:16.046197: step: 1120/530, loss: 0.008533775806427002 2023-01-24 05:13:17.072765: step: 1124/530, loss: 0.008413284085690975 2023-01-24 05:13:18.113748: step: 1128/530, loss: 0.0384943000972271 2023-01-24 05:13:19.177092: step: 1132/530, loss: 0.01024586521089077 2023-01-24 05:13:20.236072: step: 1136/530, loss: 0.04789073020219803 2023-01-24 05:13:21.299690: step: 1140/530, loss: 0.03734603896737099 2023-01-24 05:13:22.346455: step: 1144/530, loss: 0.0354679711163044 2023-01-24 05:13:23.388993: step: 1148/530, loss: 0.0037439875304698944 2023-01-24 05:13:24.427244: step: 1152/530, loss: 0.012498389929533005 2023-01-24 05:13:25.464923: step: 1156/530, loss: 0.0037895317655056715 2023-01-24 05:13:26.501021: step: 1160/530, loss: 0.039169687777757645 2023-01-24 05:13:27.544927: step: 1164/530, loss: 0.004299154505133629 2023-01-24 05:13:28.602547: step: 1168/530, loss: 0.009770425036549568 2023-01-24 05:13:29.642474: step: 1172/530, loss: 0.03396693617105484 2023-01-24 05:13:30.684736: step: 1176/530, loss: 0.0054685091599822044 2023-01-24 05:13:31.735784: step: 1180/530, loss: 0.008923575282096863 2023-01-24 05:13:32.765047: step: 1184/530, loss: 0.01791532151401043 2023-01-24 05:13:33.830012: step: 1188/530, loss: 0.024384457617998123 2023-01-24 05:13:34.874268: step: 1192/530, loss: 0.01159385871142149 2023-01-24 05:13:35.906402: step: 1196/530, loss: 0.009178542532026768 2023-01-24 05:13:36.947588: step: 1200/530, loss: 0.024461396038532257 2023-01-24 05:13:37.994861: step: 1204/530, loss: 0.009322012774646282 2023-01-24 05:13:39.045742: step: 1208/530, loss: 0.03786756470799446 2023-01-24 05:13:40.112939: step: 1212/530, loss: 0.030062632635235786 2023-01-24 05:13:41.163599: step: 1216/530, loss: 0.007791387382894754 2023-01-24 05:13:42.214220: step: 1220/530, loss: 0.033344484865665436 2023-01-24 05:13:43.268289: step: 1224/530, loss: 0.004832225851714611 2023-01-24 05:13:44.314844: step: 1228/530, loss: 0.009263737127184868 2023-01-24 05:13:45.367765: step: 1232/530, loss: 0.007348473183810711 2023-01-24 05:13:46.416832: step: 1236/530, loss: 0.0008141044527292252 2023-01-24 05:13:47.459040: step: 1240/530, loss: 0.002374466508626938 2023-01-24 05:13:48.502363: step: 1244/530, loss: 0.016089728102087975 2023-01-24 05:13:49.532561: step: 1248/530, loss: 0.019337480887770653 2023-01-24 05:13:50.579906: step: 1252/530, loss: 0.021364131942391396 2023-01-24 05:13:51.621950: step: 1256/530, loss: 0.006602568086236715 2023-01-24 05:13:52.681136: step: 1260/530, loss: 0.0068792556412518024 2023-01-24 05:13:53.732674: step: 1264/530, loss: 0.004075265489518642 2023-01-24 05:13:54.776736: step: 1268/530, loss: 0.041897740215063095 2023-01-24 05:13:55.811211: step: 1272/530, loss: 0.0036564639303833246 2023-01-24 05:13:56.859955: step: 1276/530, loss: 0.0477060005068779 2023-01-24 05:13:57.919056: step: 1280/530, loss: 0.011061074212193489 2023-01-24 05:13:58.949225: step: 1284/530, loss: 0.0031509497202932835 2023-01-24 05:14:00.005963: step: 1288/530, loss: 0.024852100759744644 2023-01-24 05:14:01.051000: step: 1292/530, loss: 0.005682656541466713 2023-01-24 05:14:02.086916: step: 1296/530, loss: 0.0020805818494409323 2023-01-24 05:14:03.151655: step: 1300/530, loss: 0.005957027431577444 2023-01-24 05:14:04.184096: step: 1304/530, loss: 0.003713820595294237 2023-01-24 05:14:05.227545: step: 1308/530, loss: 0.0174169410020113 2023-01-24 05:14:06.269570: step: 1312/530, loss: 0.005139423068612814 2023-01-24 05:14:07.330680: step: 1316/530, loss: 0.008227752521634102 2023-01-24 05:14:08.371291: step: 1320/530, loss: 0.05675537511706352 2023-01-24 05:14:09.412164: step: 1324/530, loss: 0.006580718792974949 2023-01-24 05:14:10.452841: step: 1328/530, loss: 0.0034125992096960545 2023-01-24 05:14:11.527863: step: 1332/530, loss: 0.003971177618950605 2023-01-24 05:14:12.573989: step: 1336/530, loss: 0.006256772205233574 2023-01-24 05:14:13.607598: step: 1340/530, loss: 0.01535890344530344 2023-01-24 05:14:14.658128: step: 1344/530, loss: 0.009639522060751915 2023-01-24 05:14:15.715951: step: 1348/530, loss: 0.005839204881340265 2023-01-24 05:14:16.737822: step: 1352/530, loss: 0.0015847495524212718 2023-01-24 05:14:17.769876: step: 1356/530, loss: 0.004766490776091814 2023-01-24 05:14:18.815303: step: 1360/530, loss: 0.005338684655725956 2023-01-24 05:14:19.862451: step: 1364/530, loss: 0.009421211667358875 2023-01-24 05:14:20.916133: step: 1368/530, loss: 0.03505420684814453 2023-01-24 05:14:21.953542: step: 1372/530, loss: 0.02362665720283985 2023-01-24 05:14:22.996889: step: 1376/530, loss: 0.007698682602494955 2023-01-24 05:14:24.052973: step: 1380/530, loss: 0.03625423461198807 2023-01-24 05:14:25.087890: step: 1384/530, loss: 0.014150853268802166 2023-01-24 05:14:26.128117: step: 1388/530, loss: 0.05872374773025513 2023-01-24 05:14:27.178464: step: 1392/530, loss: 0.01388158556073904 2023-01-24 05:14:28.220814: step: 1396/530, loss: 0.01011976320296526 2023-01-24 05:14:29.265358: step: 1400/530, loss: 0.007690747268497944 2023-01-24 05:14:30.306481: step: 1404/530, loss: 0.014599599875509739 2023-01-24 05:14:31.367515: step: 1408/530, loss: 0.0070943161845207214 2023-01-24 05:14:32.402755: step: 1412/530, loss: 0.027554038912057877 2023-01-24 05:14:33.465083: step: 1416/530, loss: 0.009707432240247726 2023-01-24 05:14:34.521128: step: 1420/530, loss: 0.010745974257588387 2023-01-24 05:14:35.566433: step: 1424/530, loss: 0.010067526251077652 2023-01-24 05:14:36.608941: step: 1428/530, loss: 0.015290834940969944 2023-01-24 05:14:37.651510: step: 1432/530, loss: 0.02790786139667034 2023-01-24 05:14:38.697271: step: 1436/530, loss: 0.008694365620613098 2023-01-24 05:14:39.737933: step: 1440/530, loss: 0.005010063759982586 2023-01-24 05:14:40.800997: step: 1444/530, loss: 0.017848588526248932 2023-01-24 05:14:41.846869: step: 1448/530, loss: 0.008178862743079662 2023-01-24 05:14:42.897858: step: 1452/530, loss: 0.006831485778093338 2023-01-24 05:14:43.931121: step: 1456/530, loss: 0.008371623232960701 2023-01-24 05:14:44.978783: step: 1460/530, loss: 0.004503347910940647 2023-01-24 05:14:46.005846: step: 1464/530, loss: 0.005053850822150707 2023-01-24 05:14:47.053632: step: 1468/530, loss: 0.01969132013618946 2023-01-24 05:14:48.107842: step: 1472/530, loss: 0.005457093007862568 2023-01-24 05:14:49.150993: step: 1476/530, loss: 0.0063288272358477116 2023-01-24 05:14:50.189169: step: 1480/530, loss: 0.029903246089816093 2023-01-24 05:14:51.213286: step: 1484/530, loss: 0.004398359451442957 2023-01-24 05:14:52.259753: step: 1488/530, loss: 0.0025383245665580034 2023-01-24 05:14:53.311225: step: 1492/530, loss: 0.012691888958215714 2023-01-24 05:14:54.352627: step: 1496/530, loss: 0.008883957751095295 2023-01-24 05:14:55.426558: step: 1500/530, loss: 0.006874787621200085 2023-01-24 05:14:56.439964: step: 1504/530, loss: 0.007974770851433277 2023-01-24 05:14:57.486723: step: 1508/530, loss: 0.03388189896941185 2023-01-24 05:14:58.530700: step: 1512/530, loss: 0.011024592444300652 2023-01-24 05:14:59.560782: step: 1516/530, loss: 0.006327065173536539 2023-01-24 05:15:00.593121: step: 1520/530, loss: 0.009689447470009327 2023-01-24 05:15:01.636962: step: 1524/530, loss: 0.026437874883413315 2023-01-24 05:15:02.696680: step: 1528/530, loss: 0.02019422873854637 2023-01-24 05:15:03.744127: step: 1532/530, loss: 0.007898754440248013 2023-01-24 05:15:05.138386: step: 1536/530, loss: 0.004939930513501167 2023-01-24 05:15:06.165760: step: 1540/530, loss: 0.0023355563171207905 2023-01-24 05:15:07.219647: step: 1544/530, loss: 0.054159652441740036 2023-01-24 05:15:08.305294: step: 1548/530, loss: 0.006251053884625435 2023-01-24 05:15:09.359428: step: 1552/530, loss: 0.0070323399268090725 2023-01-24 05:15:10.406652: step: 1556/530, loss: 0.010830866172909737 2023-01-24 05:15:11.454952: step: 1560/530, loss: 0.006331013515591621 2023-01-24 05:15:12.491624: step: 1564/530, loss: 0.0013545668916776776 2023-01-24 05:15:13.539994: step: 1568/530, loss: 0.006860048044472933 2023-01-24 05:15:14.586925: step: 1572/530, loss: 0.0074236588552594185 2023-01-24 05:15:15.623447: step: 1576/530, loss: 0.010446438565850258 2023-01-24 05:15:16.670925: step: 1580/530, loss: 0.055162906646728516 2023-01-24 05:15:17.717944: step: 1584/530, loss: 0.009249155409634113 2023-01-24 05:15:18.745800: step: 1588/530, loss: 0.006983056664466858 2023-01-24 05:15:19.779477: step: 1592/530, loss: 0.021442275494337082 2023-01-24 05:15:20.835893: step: 1596/530, loss: 0.0056538968347013 2023-01-24 05:15:21.877532: step: 1600/530, loss: 0.0027356247883290052 2023-01-24 05:15:22.941014: step: 1604/530, loss: 0.03917904943227768 2023-01-24 05:15:23.976288: step: 1608/530, loss: 0.008144271560013294 2023-01-24 05:15:25.046115: step: 1612/530, loss: 0.0070854779332876205 2023-01-24 05:15:26.103571: step: 1616/530, loss: 0.004183290060609579 2023-01-24 05:15:27.148204: step: 1620/530, loss: 0.016147736459970474 2023-01-24 05:15:28.187922: step: 1624/530, loss: 0.010289404541254044 2023-01-24 05:15:29.229864: step: 1628/530, loss: 0.024762019515037537 2023-01-24 05:15:30.266394: step: 1632/530, loss: 0.0047640688717365265 2023-01-24 05:15:31.313106: step: 1636/530, loss: 0.023279661312699318 2023-01-24 05:15:32.368624: step: 1640/530, loss: 0.005377603694796562 2023-01-24 05:15:33.429426: step: 1644/530, loss: 0.006198327522724867 2023-01-24 05:15:34.486839: step: 1648/530, loss: 0.008368727751076221 2023-01-24 05:15:35.524033: step: 1652/530, loss: 0.0076696304604411125 2023-01-24 05:15:36.558031: step: 1656/530, loss: 0.008824929594993591 2023-01-24 05:15:37.610416: step: 1660/530, loss: 0.007002229802310467 2023-01-24 05:15:38.651930: step: 1664/530, loss: 0.0011630707886070013 2023-01-24 05:15:39.705342: step: 1668/530, loss: 0.01879848539829254 2023-01-24 05:15:40.760684: step: 1672/530, loss: 0.03044995665550232 2023-01-24 05:15:41.801670: step: 1676/530, loss: 0.01741773635149002 2023-01-24 05:15:42.860432: step: 1680/530, loss: 0.02012798935174942 2023-01-24 05:15:43.914750: step: 1684/530, loss: 0.01884358376264572 2023-01-24 05:15:44.974895: step: 1688/530, loss: 0.030331740155816078 2023-01-24 05:15:46.014901: step: 1692/530, loss: 0.017635803669691086 2023-01-24 05:15:47.055610: step: 1696/530, loss: 0.01589863933622837 2023-01-24 05:15:48.094413: step: 1700/530, loss: 0.02311134524643421 2023-01-24 05:15:49.148376: step: 1704/530, loss: 0.01039676833897829 2023-01-24 05:15:50.197521: step: 1708/530, loss: 0.01273310650140047 2023-01-24 05:15:51.238254: step: 1712/530, loss: 0.03517500311136246 2023-01-24 05:15:52.285202: step: 1716/530, loss: 0.014377455227077007 2023-01-24 05:15:53.335861: step: 1720/530, loss: 0.016340885311365128 2023-01-24 05:15:54.378202: step: 1724/530, loss: 0.043678149580955505 2023-01-24 05:15:55.439436: step: 1728/530, loss: 0.007197216618806124 2023-01-24 05:15:56.481626: step: 1732/530, loss: 0.015771903097629547 2023-01-24 05:15:57.510682: step: 1736/530, loss: 0.006788188125938177 2023-01-24 05:15:58.561915: step: 1740/530, loss: 0.00735519640147686 2023-01-24 05:15:59.614346: step: 1744/530, loss: 0.006124390289187431 2023-01-24 05:16:00.639893: step: 1748/530, loss: 0.011308558285236359 2023-01-24 05:16:01.673337: step: 1752/530, loss: 0.008210016414523125 2023-01-24 05:16:02.715823: step: 1756/530, loss: 0.00381703139282763 2023-01-24 05:16:03.781844: step: 1760/530, loss: 0.013667646795511246 2023-01-24 05:16:04.817294: step: 1764/530, loss: 0.05354391783475876 2023-01-24 05:16:05.848803: step: 1768/530, loss: 0.01885106787085533 2023-01-24 05:16:06.893298: step: 1772/530, loss: 0.024088315665721893 2023-01-24 05:16:07.939805: step: 1776/530, loss: 0.007580232340842485 2023-01-24 05:16:08.977479: step: 1780/530, loss: 0.004514814354479313 2023-01-24 05:16:10.016431: step: 1784/530, loss: 0.028666427358984947 2023-01-24 05:16:11.056940: step: 1788/530, loss: 0.008676419965922832 2023-01-24 05:16:12.099497: step: 1792/530, loss: 0.00014260236639529467 2023-01-24 05:16:13.140740: step: 1796/530, loss: 0.03250482305884361 2023-01-24 05:16:14.198599: step: 1800/530, loss: 0.009149912744760513 2023-01-24 05:16:15.225719: step: 1804/530, loss: 0.02026919089257717 2023-01-24 05:16:16.271022: step: 1808/530, loss: 0.007581941317766905 2023-01-24 05:16:17.341964: step: 1812/530, loss: 0.0193567406386137 2023-01-24 05:16:18.386122: step: 1816/530, loss: 0.006984817795455456 2023-01-24 05:16:19.444871: step: 1820/530, loss: 0.013768985867500305 2023-01-24 05:16:20.483590: step: 1824/530, loss: 0.009857522323727608 2023-01-24 05:16:21.547350: step: 1828/530, loss: 0.005508939735591412 2023-01-24 05:16:22.582173: step: 1832/530, loss: 0.012291674502193928 2023-01-24 05:16:23.622571: step: 1836/530, loss: 0.012963545508682728 2023-01-24 05:16:24.651356: step: 1840/530, loss: 0.010597094893455505 2023-01-24 05:16:25.681101: step: 1844/530, loss: 0.00932835228741169 2023-01-24 05:16:26.742042: step: 1848/530, loss: 0.02392713539302349 2023-01-24 05:16:27.771147: step: 1852/530, loss: 0.031300920993089676 2023-01-24 05:16:28.825038: step: 1856/530, loss: 0.008835088461637497 2023-01-24 05:16:29.882988: step: 1860/530, loss: 0.011457874439656734 2023-01-24 05:16:30.918362: step: 1864/530, loss: 0.007875129580497742 2023-01-24 05:16:31.964675: step: 1868/530, loss: 0.0017395004397258162 2023-01-24 05:16:33.009636: step: 1872/530, loss: 0.005940976087003946 2023-01-24 05:16:34.073386: step: 1876/530, loss: 0.03783702105283737 2023-01-24 05:16:35.115132: step: 1880/530, loss: 0.0 2023-01-24 05:16:36.152341: step: 1884/530, loss: 0.007909106090664864 2023-01-24 05:16:37.183046: step: 1888/530, loss: 0.003788345493376255 2023-01-24 05:16:38.242104: step: 1892/530, loss: 0.00865496788173914 2023-01-24 05:16:39.304829: step: 1896/530, loss: 0.014837266877293587 2023-01-24 05:16:40.351886: step: 1900/530, loss: 0.0070227100513875484 2023-01-24 05:16:41.382045: step: 1904/530, loss: 0.004161282442510128 2023-01-24 05:16:42.424149: step: 1908/530, loss: 0.007852397859096527 2023-01-24 05:16:43.466099: step: 1912/530, loss: 0.009977038949728012 2023-01-24 05:16:44.531678: step: 1916/530, loss: 0.013254792429506779 2023-01-24 05:16:45.573775: step: 1920/530, loss: 0.0016520151402801275 2023-01-24 05:16:46.622838: step: 1924/530, loss: 0.005759743973612785 2023-01-24 05:16:47.686978: step: 1928/530, loss: 0.006398218683898449 2023-01-24 05:16:48.728564: step: 1932/530, loss: 0.05232980102300644 2023-01-24 05:16:49.766046: step: 1936/530, loss: 0.005682214628905058 2023-01-24 05:16:50.811837: step: 1940/530, loss: 0.008255409076809883 2023-01-24 05:16:51.845694: step: 1944/530, loss: 0.0038357547018676996 2023-01-24 05:16:52.898769: step: 1948/530, loss: 0.04414479807019234 2023-01-24 05:16:53.933405: step: 1952/530, loss: 0.009515609592199326 2023-01-24 05:16:55.005992: step: 1956/530, loss: 0.004789245780557394 2023-01-24 05:16:56.053742: step: 1960/530, loss: 0.008225589990615845 2023-01-24 05:16:57.099266: step: 1964/530, loss: 0.010477395728230476 2023-01-24 05:16:58.135724: step: 1968/530, loss: 0.005072738975286484 2023-01-24 05:16:59.169535: step: 1972/530, loss: 0.008390477858483791 2023-01-24 05:17:00.217328: step: 1976/530, loss: 0.007936930283904076 2023-01-24 05:17:01.243076: step: 1980/530, loss: 0.012791875749826431 2023-01-24 05:17:02.296189: step: 1984/530, loss: 0.02164677530527115 2023-01-24 05:17:03.341051: step: 1988/530, loss: 0.008725931867957115 2023-01-24 05:17:04.391257: step: 1992/530, loss: 0.01789635419845581 2023-01-24 05:17:05.454830: step: 1996/530, loss: 0.008945249952375889 2023-01-24 05:17:06.493969: step: 2000/530, loss: 0.00822716485708952 2023-01-24 05:17:07.514863: step: 2004/530, loss: 0.03890697658061981 2023-01-24 05:17:08.556777: step: 2008/530, loss: 0.002574681304395199 2023-01-24 05:17:09.610611: step: 2012/530, loss: 0.01289471983909607 2023-01-24 05:17:10.644374: step: 2016/530, loss: 0.017286738380789757 2023-01-24 05:17:11.671075: step: 2020/530, loss: 0.030664438381791115 2023-01-24 05:17:12.704424: step: 2024/530, loss: 0.0028441408649086952 2023-01-24 05:17:13.743929: step: 2028/530, loss: 0.005331079475581646 2023-01-24 05:17:14.780479: step: 2032/530, loss: 0.012977580539882183 2023-01-24 05:17:15.816023: step: 2036/530, loss: 0.0060233548283576965 2023-01-24 05:17:16.862136: step: 2040/530, loss: 0.020656533539295197 2023-01-24 05:17:17.892193: step: 2044/530, loss: 0.0485132671892643 2023-01-24 05:17:18.946405: step: 2048/530, loss: 0.0027876878157258034 2023-01-24 05:17:19.984031: step: 2052/530, loss: 0.0054365163668990135 2023-01-24 05:17:21.024497: step: 2056/530, loss: 0.008313395082950592 2023-01-24 05:17:22.069385: step: 2060/530, loss: 0.00732328649610281 2023-01-24 05:17:23.123272: step: 2064/530, loss: 0.01545261312276125 2023-01-24 05:17:24.173748: step: 2068/530, loss: 0.002826857380568981 2023-01-24 05:17:25.235400: step: 2072/530, loss: 0.008433181792497635 2023-01-24 05:17:26.286547: step: 2076/530, loss: 0.042273689061403275 2023-01-24 05:17:27.350469: step: 2080/530, loss: 0.012588677927851677 2023-01-24 05:17:28.389660: step: 2084/530, loss: 0.021031657233834267 2023-01-24 05:17:29.415225: step: 2088/530, loss: 0.06965355575084686 2023-01-24 05:17:30.465825: step: 2092/530, loss: 0.004588070325553417 2023-01-24 05:17:31.505105: step: 2096/530, loss: 0.005655618384480476 2023-01-24 05:17:32.566971: step: 2100/530, loss: 0.031774524599313736 2023-01-24 05:17:33.635390: step: 2104/530, loss: 0.0034075728617608547 2023-01-24 05:17:34.684918: step: 2108/530, loss: 0.07965991646051407 2023-01-24 05:17:35.750469: step: 2112/530, loss: 0.0087084099650383 2023-01-24 05:17:36.784776: step: 2116/530, loss: 0.006635582074522972 2023-01-24 05:17:37.841809: step: 2120/530, loss: 0.013546297326683998 ================================================== Loss: 0.015 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.36731085526315793, 'r': 0.3178249525616698, 'f1': 0.34078077314343846}, 'combined': 0.2511016223162178, 'stategy': 1, 'epoch': 1} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3751047802521255, 'r': 0.39096398971131463, 'f1': 0.3828702257478941}, 'combined': 0.29677022282851123, 'stategy': 1, 'epoch': 1} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3819074852163088, 'r': 0.33262910002710766, 'f1': 0.35556903796001166}, 'combined': 0.26199823849685067, 'stategy': 1, 'epoch': 1} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36785471839114864, 'r': 0.36616420957501283, 'f1': 0.36700751728937253}, 'combined': 0.2844747263199921, 'stategy': 1, 'epoch': 1} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38236684276980326, 'r': 0.33520584698225636, 'f1': 0.35723656493356754}, 'combined': 0.2632269425826287, 'stategy': 1, 'epoch': 1} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3561820350737081, 'r': 0.35978314020772534, 'f1': 0.35797353136351645}, 'combined': 0.27747230660712763, 'stategy': 1, 'epoch': 1} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 1} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.475, 'r': 0.41304347826086957, 'f1': 0.44186046511627913}, 'combined': 0.22093023255813957, 'stategy': 1, 'epoch': 1} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 1} New best korean model... New best russian model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3738546380090498, 'r': 0.3135555028462998, 'f1': 0.34106037151702784}, 'combined': 0.25130764217044155, 'stategy': 1, 'epoch': 0} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36737558326918535, 'r': 0.3794979673183977, 'f1': 0.373338397064357}, 'combined': 0.28938191542787484, 'stategy': 1, 'epoch': 0} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 0} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3819074852163088, 'r': 0.33262910002710766, 'f1': 0.35556903796001166}, 'combined': 0.26199823849685067, 'stategy': 1, 'epoch': 1} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36785471839114864, 'r': 0.36616420957501283, 'f1': 0.36700751728937253}, 'combined': 0.2844747263199921, 'stategy': 1, 'epoch': 1} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.475, 'r': 0.41304347826086957, 'f1': 0.44186046511627913}, 'combined': 0.22093023255813957, 'stategy': 1, 'epoch': 1} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38236684276980326, 'r': 0.33520584698225636, 'f1': 0.35723656493356754}, 'combined': 0.2632269425826287, 'stategy': 1, 'epoch': 1} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3561820350737081, 'r': 0.35978314020772534, 'f1': 0.35797353136351645}, 'combined': 0.27747230660712763, 'stategy': 1, 'epoch': 1} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 1} ****************************** Epoch: 2 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 05:20:20.280315: step: 4/530, loss: 0.0037888602819293737 2023-01-24 05:20:21.309803: step: 8/530, loss: 0.002274070167914033 2023-01-24 05:20:22.335146: step: 12/530, loss: 0.004175004083663225 2023-01-24 05:20:23.362571: step: 16/530, loss: 0.012923570349812508 2023-01-24 05:20:24.378419: step: 20/530, loss: 0.04172271490097046 2023-01-24 05:20:25.432953: step: 24/530, loss: 0.0073312511667609215 2023-01-24 05:20:26.474932: step: 28/530, loss: 0.01263269130140543 2023-01-24 05:20:27.529195: step: 32/530, loss: 0.013178808614611626 2023-01-24 05:20:28.588381: step: 36/530, loss: 0.013025108724832535 2023-01-24 05:20:29.634108: step: 40/530, loss: 0.003801916493102908 2023-01-24 05:20:30.666494: step: 44/530, loss: 0.00686174351722002 2023-01-24 05:20:31.714362: step: 48/530, loss: 0.008977685123682022 2023-01-24 05:20:32.745191: step: 52/530, loss: 0.005197240971028805 2023-01-24 05:20:33.774404: step: 56/530, loss: 0.005364964250475168 2023-01-24 05:20:34.812672: step: 60/530, loss: 0.01704399101436138 2023-01-24 05:20:35.862312: step: 64/530, loss: 0.009992212988436222 2023-01-24 05:20:36.894827: step: 68/530, loss: 0.007765933871269226 2023-01-24 05:20:37.932713: step: 72/530, loss: 0.003925076685845852 2023-01-24 05:20:38.969359: step: 76/530, loss: 0.000541885441634804 2023-01-24 05:20:40.007658: step: 80/530, loss: 0.004293924663215876 2023-01-24 05:20:41.057415: step: 84/530, loss: 0.009389163926243782 2023-01-24 05:20:42.114566: step: 88/530, loss: 0.01748034916818142 2023-01-24 05:20:43.151632: step: 92/530, loss: 0.014097588136792183 2023-01-24 05:20:44.179588: step: 96/530, loss: 0.01041346974670887 2023-01-24 05:20:45.210081: step: 100/530, loss: 0.007205648813396692 2023-01-24 05:20:46.245478: step: 104/530, loss: 0.007947059348225594 2023-01-24 05:20:47.278664: step: 108/530, loss: 0.009083470329642296 2023-01-24 05:20:48.319439: step: 112/530, loss: 0.0061341156251728535 2023-01-24 05:20:49.352046: step: 116/530, loss: 0.015172949060797691 2023-01-24 05:20:50.398392: step: 120/530, loss: 0.009730362333357334 2023-01-24 05:20:51.446617: step: 124/530, loss: 0.005241116043180227 2023-01-24 05:20:52.481720: step: 128/530, loss: 0.005360835697501898 2023-01-24 05:20:53.516819: step: 132/530, loss: 0.008633263409137726 2023-01-24 05:20:54.552212: step: 136/530, loss: 0.015402628108859062 2023-01-24 05:20:55.598617: step: 140/530, loss: 0.03220726549625397 2023-01-24 05:20:56.664362: step: 144/530, loss: 0.0036236399319022894 2023-01-24 05:20:57.713855: step: 148/530, loss: 0.004044572357088327 2023-01-24 05:20:58.756462: step: 152/530, loss: 0.007374633569270372 2023-01-24 05:20:59.801689: step: 156/530, loss: 0.009039615280926228 2023-01-24 05:21:00.854813: step: 160/530, loss: 0.011822286993265152 2023-01-24 05:21:01.893076: step: 164/530, loss: 0.013853204436600208 2023-01-24 05:21:02.942833: step: 168/530, loss: 0.00663926312699914 2023-01-24 05:21:03.983026: step: 172/530, loss: 0.002951239701360464 2023-01-24 05:21:05.044927: step: 176/530, loss: 0.014926016330718994 2023-01-24 05:21:06.072147: step: 180/530, loss: 0.004300619941204786 2023-01-24 05:21:07.119110: step: 184/530, loss: 0.0028859772719442844 2023-01-24 05:21:08.181225: step: 188/530, loss: 0.009648839943110943 2023-01-24 05:21:09.227583: step: 192/530, loss: 0.005239957477897406 2023-01-24 05:21:10.276264: step: 196/530, loss: 0.01581951417028904 2023-01-24 05:21:11.335286: step: 200/530, loss: 0.005738834384828806 2023-01-24 05:21:12.394084: step: 204/530, loss: 0.006783826742321253 2023-01-24 05:21:13.426504: step: 208/530, loss: 0.015379020012915134 2023-01-24 05:21:14.461073: step: 212/530, loss: 0.00494582811370492 2023-01-24 05:21:15.505768: step: 216/530, loss: 0.004406896885484457 2023-01-24 05:21:16.565174: step: 220/530, loss: 0.039395347237586975 2023-01-24 05:21:17.613132: step: 224/530, loss: 0.015137819573283195 2023-01-24 05:21:18.674126: step: 228/530, loss: 0.008169913664460182 2023-01-24 05:21:19.737652: step: 232/530, loss: 0.08331502974033356 2023-01-24 05:21:20.783976: step: 236/530, loss: 0.012254470027983189 2023-01-24 05:21:21.812417: step: 240/530, loss: 0.003868556348606944 2023-01-24 05:21:22.857668: step: 244/530, loss: 0.0060865022242069244 2023-01-24 05:21:23.911750: step: 248/530, loss: 0.003737794002518058 2023-01-24 05:21:24.954092: step: 252/530, loss: 0.010138806886970997 2023-01-24 05:21:26.008992: step: 256/530, loss: 0.010617443360388279 2023-01-24 05:21:27.034052: step: 260/530, loss: 0.003966417163610458 2023-01-24 05:21:28.081681: step: 264/530, loss: 0.007853623479604721 2023-01-24 05:21:29.125911: step: 268/530, loss: 0.0021429879125207663 2023-01-24 05:21:30.168202: step: 272/530, loss: 0.03301749378442764 2023-01-24 05:21:31.203034: step: 276/530, loss: 0.009293826296925545 2023-01-24 05:21:32.255316: step: 280/530, loss: 0.0011327870888635516 2023-01-24 05:21:33.320581: step: 284/530, loss: 0.003882062854245305 2023-01-24 05:21:34.387821: step: 288/530, loss: 0.0051101697608828545 2023-01-24 05:21:35.429504: step: 292/530, loss: 0.002720510819926858 2023-01-24 05:21:36.476116: step: 296/530, loss: 0.015062347054481506 2023-01-24 05:21:37.518403: step: 300/530, loss: 0.011983749456703663 2023-01-24 05:21:38.576425: step: 304/530, loss: 0.004484365228563547 2023-01-24 05:21:39.633291: step: 308/530, loss: 0.017877696081995964 2023-01-24 05:21:40.681140: step: 312/530, loss: 0.021055176854133606 2023-01-24 05:21:41.724908: step: 316/530, loss: 0.005788861308246851 2023-01-24 05:21:42.771472: step: 320/530, loss: 0.00951676070690155 2023-01-24 05:21:43.812643: step: 324/530, loss: 0.008682755753397942 2023-01-24 05:21:44.852186: step: 328/530, loss: 0.005156229715794325 2023-01-24 05:21:45.895073: step: 332/530, loss: 0.010274766944348812 2023-01-24 05:21:46.948375: step: 336/530, loss: 0.007740643806755543 2023-01-24 05:21:47.994016: step: 340/530, loss: 0.007301523350179195 2023-01-24 05:21:49.039955: step: 344/530, loss: 0.0040678647346794605 2023-01-24 05:21:50.099306: step: 348/530, loss: 0.0038683817256242037 2023-01-24 05:21:51.158362: step: 352/530, loss: 0.014949017204344273 2023-01-24 05:21:52.193689: step: 356/530, loss: 0.014149488881230354 2023-01-24 05:21:53.236270: step: 360/530, loss: 0.0299299955368042 2023-01-24 05:21:54.270599: step: 364/530, loss: 0.015602793544530869 2023-01-24 05:21:55.326688: step: 368/530, loss: 0.013038051314651966 2023-01-24 05:21:56.363659: step: 372/530, loss: 0.00841568410396576 2023-01-24 05:21:57.418181: step: 376/530, loss: 0.04445348307490349 2023-01-24 05:21:58.465929: step: 380/530, loss: 0.012290619313716888 2023-01-24 05:21:59.515590: step: 384/530, loss: 0.020278410986065865 2023-01-24 05:22:00.557179: step: 388/530, loss: 0.053476482629776 2023-01-24 05:22:01.608868: step: 392/530, loss: 0.017562100663781166 2023-01-24 05:22:02.662524: step: 396/530, loss: 0.022115476429462433 2023-01-24 05:22:03.731543: step: 400/530, loss: 0.015994062647223473 2023-01-24 05:22:04.782969: step: 404/530, loss: 0.08731957525014877 2023-01-24 05:22:05.841066: step: 408/530, loss: 0.013568167574703693 2023-01-24 05:22:06.875248: step: 412/530, loss: 0.018604643642902374 2023-01-24 05:22:07.931735: step: 416/530, loss: 0.006680516991764307 2023-01-24 05:22:08.984012: step: 420/530, loss: 0.027568768709897995 2023-01-24 05:22:10.040683: step: 424/530, loss: 0.02251289039850235 2023-01-24 05:22:11.089794: step: 428/530, loss: 0.005960583686828613 2023-01-24 05:22:12.162797: step: 432/530, loss: 0.017948690801858902 2023-01-24 05:22:13.205850: step: 436/530, loss: 0.01131599210202694 2023-01-24 05:22:14.259447: step: 440/530, loss: 0.032078713178634644 2023-01-24 05:22:15.316510: step: 444/530, loss: 0.032719556242227554 2023-01-24 05:22:16.361698: step: 448/530, loss: 0.00150158756878227 2023-01-24 05:22:17.405630: step: 452/530, loss: 0.014419044367969036 2023-01-24 05:22:18.467807: step: 456/530, loss: 0.01792624033987522 2023-01-24 05:22:19.516233: step: 460/530, loss: 0.0016940251225605607 2023-01-24 05:22:20.559887: step: 464/530, loss: 0.0064159780740737915 2023-01-24 05:22:21.599456: step: 468/530, loss: 0.010302126407623291 2023-01-24 05:22:22.657070: step: 472/530, loss: 0.01843603141605854 2023-01-24 05:22:23.706921: step: 476/530, loss: 0.002535809064283967 2023-01-24 05:22:24.743424: step: 480/530, loss: 0.008340365253388882 2023-01-24 05:22:25.784322: step: 484/530, loss: 0.036069102585315704 2023-01-24 05:22:26.836065: step: 488/530, loss: 0.003325577126815915 2023-01-24 05:22:27.890521: step: 492/530, loss: 0.0027209504041820765 2023-01-24 05:22:28.941802: step: 496/530, loss: 0.05793335661292076 2023-01-24 05:22:29.984472: step: 500/530, loss: 0.021056879311800003 2023-01-24 05:22:31.039702: step: 504/530, loss: 0.010850130580365658 2023-01-24 05:22:32.096423: step: 508/530, loss: 0.03423653542995453 2023-01-24 05:22:33.149450: step: 512/530, loss: 0.008309063501656055 2023-01-24 05:22:34.185062: step: 516/530, loss: 0.015190846286714077 2023-01-24 05:22:35.242756: step: 520/530, loss: 0.03745207563042641 2023-01-24 05:22:36.291919: step: 524/530, loss: 0.015186917036771774 2023-01-24 05:22:37.339690: step: 528/530, loss: 0.004568911623209715 2023-01-24 05:22:38.382415: step: 532/530, loss: 0.011096176691353321 2023-01-24 05:22:39.426730: step: 536/530, loss: 0.004400535020977259 2023-01-24 05:22:40.468829: step: 540/530, loss: 0.0 2023-01-24 05:22:41.501057: step: 544/530, loss: 0.01683727838099003 2023-01-24 05:22:42.559606: step: 548/530, loss: 0.007855606265366077 2023-01-24 05:22:43.613948: step: 552/530, loss: 0.044630225747823715 2023-01-24 05:22:44.670634: step: 556/530, loss: 0.02824886329472065 2023-01-24 05:22:45.720360: step: 560/530, loss: 0.0037639860529452562 2023-01-24 05:22:46.782129: step: 564/530, loss: 0.00352419912815094 2023-01-24 05:22:47.823131: step: 568/530, loss: 0.0031005952041596174 2023-01-24 05:22:48.865596: step: 572/530, loss: 0.005644264630973339 2023-01-24 05:22:49.918011: step: 576/530, loss: 0.030470222234725952 2023-01-24 05:22:50.980287: step: 580/530, loss: 0.007264934480190277 2023-01-24 05:22:52.031936: step: 584/530, loss: 0.0066889189183712006 2023-01-24 05:22:53.100732: step: 588/530, loss: 0.024554580450057983 2023-01-24 05:22:54.136118: step: 592/530, loss: 0.01446685940027237 2023-01-24 05:22:55.191261: step: 596/530, loss: 0.01411527581512928 2023-01-24 05:22:56.239621: step: 600/530, loss: 0.040842704474925995 2023-01-24 05:22:57.287250: step: 604/530, loss: 0.006944156717509031 2023-01-24 05:22:58.335425: step: 608/530, loss: 0.007428456097841263 2023-01-24 05:22:59.379877: step: 612/530, loss: 0.007626347243785858 2023-01-24 05:23:00.444819: step: 616/530, loss: 0.00712672108784318 2023-01-24 05:23:01.484168: step: 620/530, loss: 0.014052527025341988 2023-01-24 05:23:02.523863: step: 624/530, loss: 0.03125925734639168 2023-01-24 05:23:03.562958: step: 628/530, loss: 0.01052032969892025 2023-01-24 05:23:04.613775: step: 632/530, loss: 0.0023417561315000057 2023-01-24 05:23:05.669283: step: 636/530, loss: 0.038041893392801285 2023-01-24 05:23:06.724597: step: 640/530, loss: 0.05661146342754364 2023-01-24 05:23:07.776557: step: 644/530, loss: 0.005648643709719181 2023-01-24 05:23:08.843655: step: 648/530, loss: 0.010237081907689571 2023-01-24 05:23:09.909165: step: 652/530, loss: 0.06403376162052155 2023-01-24 05:23:10.976698: step: 656/530, loss: 0.004555267747491598 2023-01-24 05:23:12.021460: step: 660/530, loss: 0.006625948939472437 2023-01-24 05:23:13.079763: step: 664/530, loss: 0.015173325315117836 2023-01-24 05:23:14.118608: step: 668/530, loss: 0.000659630517475307 2023-01-24 05:23:15.177606: step: 672/530, loss: 0.019146470353007317 2023-01-24 05:23:16.231666: step: 676/530, loss: 0.0082447724416852 2023-01-24 05:23:17.286472: step: 680/530, loss: 0.010350859723985195 2023-01-24 05:23:18.331435: step: 684/530, loss: 0.004582496359944344 2023-01-24 05:23:19.374539: step: 688/530, loss: 0.0015153058338910341 2023-01-24 05:23:20.425468: step: 692/530, loss: 0.0077805654145777225 2023-01-24 05:23:21.468597: step: 696/530, loss: 0.00929328054189682 2023-01-24 05:23:22.544296: step: 700/530, loss: 0.004751413129270077 2023-01-24 05:23:23.594387: step: 704/530, loss: 0.016598748043179512 2023-01-24 05:23:24.651761: step: 708/530, loss: 0.009224177338182926 2023-01-24 05:23:25.696155: step: 712/530, loss: 0.0027216775342822075 2023-01-24 05:23:26.741766: step: 716/530, loss: 0.007163349539041519 2023-01-24 05:23:27.788790: step: 720/530, loss: 0.007957649417221546 2023-01-24 05:23:28.841252: step: 724/530, loss: 0.011768410913646221 2023-01-24 05:23:29.891298: step: 728/530, loss: 0.003944066818803549 2023-01-24 05:23:30.949893: step: 732/530, loss: 0.056393641978502274 2023-01-24 05:23:31.990493: step: 736/530, loss: 0.011592704802751541 2023-01-24 05:23:33.036462: step: 740/530, loss: 0.005546966101974249 2023-01-24 05:23:34.071577: step: 744/530, loss: 0.0048983097076416016 2023-01-24 05:23:35.120336: step: 748/530, loss: 0.005409256089478731 2023-01-24 05:23:36.169161: step: 752/530, loss: 0.009478812105953693 2023-01-24 05:23:37.218281: step: 756/530, loss: 0.013316327705979347 2023-01-24 05:23:38.255582: step: 760/530, loss: 0.00597356166690588 2023-01-24 05:23:39.325697: step: 764/530, loss: 0.004640889819711447 2023-01-24 05:23:40.385490: step: 768/530, loss: 0.004776876885443926 2023-01-24 05:23:41.426166: step: 772/530, loss: 0.0035329554229974747 2023-01-24 05:23:42.475164: step: 776/530, loss: 0.015949275344610214 2023-01-24 05:23:43.531795: step: 780/530, loss: 0.005042117089033127 2023-01-24 05:23:44.575728: step: 784/530, loss: 0.005862420424818993 2023-01-24 05:23:45.608261: step: 788/530, loss: 0.00669389171525836 2023-01-24 05:23:46.661225: step: 792/530, loss: 0.011051834560930729 2023-01-24 05:23:47.704808: step: 796/530, loss: 0.003256085328757763 2023-01-24 05:23:48.752485: step: 800/530, loss: 0.006045700516551733 2023-01-24 05:23:49.801384: step: 804/530, loss: 0.007932779379189014 2023-01-24 05:23:50.846489: step: 808/530, loss: 0.008154944516718388 2023-01-24 05:23:51.909412: step: 812/530, loss: 0.009056208655238152 2023-01-24 05:23:52.952137: step: 816/530, loss: 0.013150123879313469 2023-01-24 05:23:53.997713: step: 820/530, loss: 0.008306847885251045 2023-01-24 05:23:55.057875: step: 824/530, loss: 0.021365325897932053 2023-01-24 05:23:56.129222: step: 828/530, loss: 0.0075383419170975685 2023-01-24 05:23:57.175665: step: 832/530, loss: 0.0068174246698617935 2023-01-24 05:23:58.218536: step: 836/530, loss: 0.00420548627153039 2023-01-24 05:23:59.253502: step: 840/530, loss: 0.015030053444206715 2023-01-24 05:24:00.293561: step: 844/530, loss: 0.005739784333854914 2023-01-24 05:24:01.346030: step: 848/530, loss: 0.012050241231918335 2023-01-24 05:24:02.384269: step: 852/530, loss: 0.0020066951401531696 2023-01-24 05:24:03.456836: step: 856/530, loss: 0.009453263133764267 2023-01-24 05:24:04.504383: step: 860/530, loss: 0.008722888305783272 2023-01-24 05:24:05.554369: step: 864/530, loss: 0.006742542143911123 2023-01-24 05:24:06.609253: step: 868/530, loss: 0.004183107055723667 2023-01-24 05:24:07.660064: step: 872/530, loss: 0.004332275129854679 2023-01-24 05:24:08.719512: step: 876/530, loss: 0.011938884854316711 2023-01-24 05:24:09.774162: step: 880/530, loss: 0.008039558306336403 2023-01-24 05:24:10.804045: step: 884/530, loss: 0.012793056666851044 2023-01-24 05:24:11.844260: step: 888/530, loss: 0.00379876303486526 2023-01-24 05:24:12.900631: step: 892/530, loss: 0.03832479566335678 2023-01-24 05:24:13.962946: step: 896/530, loss: 0.010300673544406891 2023-01-24 05:24:15.006807: step: 900/530, loss: 0.03753114119172096 2023-01-24 05:24:16.063290: step: 904/530, loss: 0.01747182384133339 2023-01-24 05:24:17.103916: step: 908/530, loss: 0.0008860359666869044 2023-01-24 05:24:18.173896: step: 912/530, loss: 0.006400313228368759 2023-01-24 05:24:19.213369: step: 916/530, loss: 0.01691780611872673 2023-01-24 05:24:20.278037: step: 920/530, loss: 0.08044847846031189 2023-01-24 05:24:21.321237: step: 924/530, loss: 0.007671186234802008 2023-01-24 05:24:22.397901: step: 928/530, loss: 0.004856127314269543 2023-01-24 05:24:23.444033: step: 932/530, loss: 0.0024805711582303047 2023-01-24 05:24:24.517800: step: 936/530, loss: 0.007052455563098192 2023-01-24 05:24:25.565380: step: 940/530, loss: 0.018911350518465042 2023-01-24 05:24:26.607262: step: 944/530, loss: 0.009532704949378967 2023-01-24 05:24:27.649260: step: 948/530, loss: 0.012691096402704716 2023-01-24 05:24:28.692273: step: 952/530, loss: 0.008381885476410389 2023-01-24 05:24:29.735125: step: 956/530, loss: 0.0026562383864074945 2023-01-24 05:24:30.773281: step: 960/530, loss: 0.003332835389301181 2023-01-24 05:24:31.824006: step: 964/530, loss: 0.00530997384339571 2023-01-24 05:24:32.868907: step: 968/530, loss: 0.0006700890953652561 2023-01-24 05:24:33.932746: step: 972/530, loss: 0.0058180964551866055 2023-01-24 05:24:34.985230: step: 976/530, loss: 0.005701414309442043 2023-01-24 05:24:36.020520: step: 980/530, loss: 0.001955924555659294 2023-01-24 05:24:37.062191: step: 984/530, loss: 0.024068683385849 2023-01-24 05:24:38.111050: step: 988/530, loss: 0.0031588070560246706 2023-01-24 05:24:39.163970: step: 992/530, loss: 0.00401584105566144 2023-01-24 05:24:40.229004: step: 996/530, loss: 0.005481899715960026 2023-01-24 05:24:41.279547: step: 1000/530, loss: 0.010975665412843227 2023-01-24 05:24:42.314489: step: 1004/530, loss: 0.0035874273162335157 2023-01-24 05:24:43.362611: step: 1008/530, loss: 0.005873409099876881 2023-01-24 05:24:44.398616: step: 1012/530, loss: 0.0036414589267224073 2023-01-24 05:24:45.448830: step: 1016/530, loss: 0.0025522729847580194 2023-01-24 05:24:46.528512: step: 1020/530, loss: 0.013500872068107128 2023-01-24 05:24:47.579512: step: 1024/530, loss: 0.01034728717058897 2023-01-24 05:24:48.624800: step: 1028/530, loss: 0.010017571970820427 2023-01-24 05:24:49.673293: step: 1032/530, loss: 0.006204309407621622 2023-01-24 05:24:50.718346: step: 1036/530, loss: 0.006021259818226099 2023-01-24 05:24:51.763789: step: 1040/530, loss: 0.002929095411673188 2023-01-24 05:24:52.812024: step: 1044/530, loss: 0.010702336207032204 2023-01-24 05:24:53.880918: step: 1048/530, loss: 0.017417805269360542 2023-01-24 05:24:54.932832: step: 1052/530, loss: 0.024475088343024254 2023-01-24 05:24:55.973484: step: 1056/530, loss: 0.003840898396447301 2023-01-24 05:24:57.018158: step: 1060/530, loss: 0.004448775202035904 2023-01-24 05:24:58.069235: step: 1064/530, loss: 0.011634442955255508 2023-01-24 05:24:59.095493: step: 1068/530, loss: 0.008896343410015106 2023-01-24 05:25:00.163874: step: 1072/530, loss: 0.0029097062069922686 2023-01-24 05:25:01.213673: step: 1076/530, loss: 0.005392597522586584 2023-01-24 05:25:02.280887: step: 1080/530, loss: 0.03362016752362251 2023-01-24 05:25:03.333456: step: 1084/530, loss: 0.008171535097062588 2023-01-24 05:25:04.404335: step: 1088/530, loss: 0.0062361485324800014 2023-01-24 05:25:05.461665: step: 1092/530, loss: 0.014005381613969803 2023-01-24 05:25:06.505783: step: 1096/530, loss: 0.004480735398828983 2023-01-24 05:25:07.553368: step: 1100/530, loss: 0.00035368840326555073 2023-01-24 05:25:08.604272: step: 1104/530, loss: 0.024342549964785576 2023-01-24 05:25:09.656616: step: 1108/530, loss: 0.004262437578290701 2023-01-24 05:25:10.707229: step: 1112/530, loss: 0.012259361334145069 2023-01-24 05:25:11.753565: step: 1116/530, loss: 0.014585102908313274 2023-01-24 05:25:12.799726: step: 1120/530, loss: 0.00612040376290679 2023-01-24 05:25:13.836894: step: 1124/530, loss: 0.002209411235526204 2023-01-24 05:25:14.884163: step: 1128/530, loss: 0.05484972894191742 2023-01-24 05:25:15.935408: step: 1132/530, loss: 0.0029807996470481157 2023-01-24 05:25:16.985016: step: 1136/530, loss: 0.0065013933926820755 2023-01-24 05:25:18.048379: step: 1140/530, loss: 0.03368424251675606 2023-01-24 05:25:19.079252: step: 1144/530, loss: 0.0046228389255702496 2023-01-24 05:25:20.104315: step: 1148/530, loss: 0.0 2023-01-24 05:25:21.168599: step: 1152/530, loss: 0.00875432975590229 2023-01-24 05:25:22.210349: step: 1156/530, loss: 0.016462694853544235 2023-01-24 05:25:23.262894: step: 1160/530, loss: 0.02316376380622387 2023-01-24 05:25:24.307457: step: 1164/530, loss: 0.004688203800469637 2023-01-24 05:25:25.374918: step: 1168/530, loss: 0.0018599749309942126 2023-01-24 05:25:26.443569: step: 1172/530, loss: 0.014798082411289215 2023-01-24 05:25:27.497936: step: 1176/530, loss: 0.013131591491401196 2023-01-24 05:25:28.551773: step: 1180/530, loss: 0.0017979169497266412 2023-01-24 05:25:29.605957: step: 1184/530, loss: 0.005597659386694431 2023-01-24 05:25:30.656164: step: 1188/530, loss: 0.058025751262903214 2023-01-24 05:25:31.719966: step: 1192/530, loss: 0.009247376583516598 2023-01-24 05:25:32.751610: step: 1196/530, loss: 0.014901560731232166 2023-01-24 05:25:33.792159: step: 1200/530, loss: 0.0023767035454511642 2023-01-24 05:25:34.837006: step: 1204/530, loss: 0.0117331612855196 2023-01-24 05:25:35.869170: step: 1208/530, loss: 0.007630191743373871 2023-01-24 05:25:36.920733: step: 1212/530, loss: 0.011550309136509895 2023-01-24 05:25:37.961745: step: 1216/530, loss: 0.025422869250178337 2023-01-24 05:25:39.014764: step: 1220/530, loss: 0.008089822717010975 2023-01-24 05:25:40.060239: step: 1224/530, loss: 0.005569732282310724 2023-01-24 05:25:41.115872: step: 1228/530, loss: 0.009212653152644634 2023-01-24 05:25:42.153188: step: 1232/530, loss: 0.004605633672326803 2023-01-24 05:25:43.197807: step: 1236/530, loss: 0.003863939084112644 2023-01-24 05:25:44.233706: step: 1240/530, loss: 0.01663948781788349 2023-01-24 05:25:45.264900: step: 1244/530, loss: 0.0005199595470912755 2023-01-24 05:25:46.309413: step: 1248/530, loss: 0.006381301674991846 2023-01-24 05:25:47.348092: step: 1252/530, loss: 0.013552563264966011 2023-01-24 05:25:48.395504: step: 1256/530, loss: 0.027677103877067566 2023-01-24 05:25:49.442411: step: 1260/530, loss: 0.005271045491099358 2023-01-24 05:25:50.487929: step: 1264/530, loss: 0.0034594007302075624 2023-01-24 05:25:51.549975: step: 1268/530, loss: 0.017985286191105843 2023-01-24 05:25:52.584793: step: 1272/530, loss: 0.008233219385147095 2023-01-24 05:25:53.630817: step: 1276/530, loss: 0.003561665304005146 2023-01-24 05:25:54.661754: step: 1280/530, loss: 0.0040474990382790565 2023-01-24 05:25:55.713795: step: 1284/530, loss: 0.008383186534047127 2023-01-24 05:25:56.766921: step: 1288/530, loss: 0.04187886416912079 2023-01-24 05:25:57.808252: step: 1292/530, loss: 0.009270424954593182 2023-01-24 05:25:58.845061: step: 1296/530, loss: 0.009301802143454552 2023-01-24 05:25:59.894178: step: 1300/530, loss: 0.007039169780910015 2023-01-24 05:26:00.948559: step: 1304/530, loss: 0.006889335345476866 2023-01-24 05:26:01.998133: step: 1308/530, loss: 0.008197125978767872 2023-01-24 05:26:03.037182: step: 1312/530, loss: 0.001126836403273046 2023-01-24 05:26:04.069934: step: 1316/530, loss: 0.006413801107555628 2023-01-24 05:26:05.114498: step: 1320/530, loss: 0.047761209309101105 2023-01-24 05:26:06.156262: step: 1324/530, loss: 0.0010622147237882018 2023-01-24 05:26:07.214171: step: 1328/530, loss: 0.006086141336709261 2023-01-24 05:26:08.277024: step: 1332/530, loss: 0.06170609965920448 2023-01-24 05:26:09.323490: step: 1336/530, loss: 0.003733492223545909 2023-01-24 05:26:10.386786: step: 1340/530, loss: 0.006471488159149885 2023-01-24 05:26:11.424750: step: 1344/530, loss: 0.010077622719109058 2023-01-24 05:26:12.473925: step: 1348/530, loss: 0.015354132279753685 2023-01-24 05:26:13.515193: step: 1352/530, loss: 0.009535085409879684 2023-01-24 05:26:14.565846: step: 1356/530, loss: 0.004882055334746838 2023-01-24 05:26:15.604845: step: 1360/530, loss: 0.029433147981762886 2023-01-24 05:26:16.656535: step: 1364/530, loss: 0.008147753775119781 2023-01-24 05:26:17.704048: step: 1368/530, loss: 0.006073904689401388 2023-01-24 05:26:18.768915: step: 1372/530, loss: 0.01107755582779646 2023-01-24 05:26:19.822998: step: 1376/530, loss: 0.002783454954624176 2023-01-24 05:26:20.857630: step: 1380/530, loss: 0.0037271399050951004 2023-01-24 05:26:21.904378: step: 1384/530, loss: 0.002598479390144348 2023-01-24 05:26:22.967172: step: 1388/530, loss: 0.02149217016994953 2023-01-24 05:26:24.003167: step: 1392/530, loss: 0.004607797600328922 2023-01-24 05:26:25.038971: step: 1396/530, loss: 0.0 2023-01-24 05:26:26.075491: step: 1400/530, loss: 0.025173932313919067 2023-01-24 05:26:27.112455: step: 1404/530, loss: 0.006708444561809301 2023-01-24 05:26:28.141066: step: 1408/530, loss: 0.031152212992310524 2023-01-24 05:26:29.172227: step: 1412/530, loss: 0.008127504028379917 2023-01-24 05:26:30.215603: step: 1416/530, loss: 0.007615264039486647 2023-01-24 05:26:31.258382: step: 1420/530, loss: 0.004270453471690416 2023-01-24 05:26:32.327782: step: 1424/530, loss: 0.005471104755997658 2023-01-24 05:26:33.385562: step: 1428/530, loss: 0.01035796944051981 2023-01-24 05:26:34.436582: step: 1432/530, loss: 0.008425642736256123 2023-01-24 05:26:35.492317: step: 1436/530, loss: 0.01042137574404478 2023-01-24 05:26:36.538087: step: 1440/530, loss: 0.00039081694558262825 2023-01-24 05:26:37.579869: step: 1444/530, loss: 0.007506794296205044 2023-01-24 05:26:38.615624: step: 1448/530, loss: 0.0031182970851659775 2023-01-24 05:26:39.655094: step: 1452/530, loss: 0.0005422660033218563 2023-01-24 05:26:40.691979: step: 1456/530, loss: 0.004031767603009939 2023-01-24 05:26:41.728264: step: 1460/530, loss: 0.005994164850562811 2023-01-24 05:26:42.755130: step: 1464/530, loss: 0.0005023129051551223 2023-01-24 05:26:43.814996: step: 1468/530, loss: 0.012664709240198135 2023-01-24 05:26:44.848724: step: 1472/530, loss: 0.049943484365940094 2023-01-24 05:26:45.885170: step: 1476/530, loss: 0.0015420836862176657 2023-01-24 05:26:46.928976: step: 1480/530, loss: 0.0033133160322904587 2023-01-24 05:26:47.965452: step: 1484/530, loss: 0.00653122179210186 2023-01-24 05:26:49.006472: step: 1488/530, loss: 0.007186573464423418 2023-01-24 05:26:50.057580: step: 1492/530, loss: 0.011969853192567825 2023-01-24 05:26:51.102463: step: 1496/530, loss: 0.014530536718666553 2023-01-24 05:26:52.150594: step: 1500/530, loss: 0.006307149305939674 2023-01-24 05:26:53.197128: step: 1504/530, loss: 0.003479381324723363 2023-01-24 05:26:54.236943: step: 1508/530, loss: 0.011177916079759598 2023-01-24 05:26:55.283443: step: 1512/530, loss: 0.005139518994837999 2023-01-24 05:26:56.337545: step: 1516/530, loss: 0.0006295983912423253 2023-01-24 05:26:57.384055: step: 1520/530, loss: 0.006515598390251398 2023-01-24 05:26:58.425779: step: 1524/530, loss: 0.002554867882281542 2023-01-24 05:26:59.467266: step: 1528/530, loss: 0.008377340622246265 2023-01-24 05:27:00.517474: step: 1532/530, loss: 0.05783534795045853 2023-01-24 05:27:01.545592: step: 1536/530, loss: 0.005389595869928598 2023-01-24 05:27:02.571393: step: 1540/530, loss: 0.007903750985860825 2023-01-24 05:27:03.632981: step: 1544/530, loss: 0.0038705479819327593 2023-01-24 05:27:04.678966: step: 1548/530, loss: 0.028735095635056496 2023-01-24 05:27:05.735832: step: 1552/530, loss: 0.005190129857510328 2023-01-24 05:27:06.791420: step: 1556/530, loss: 0.021424822509288788 2023-01-24 05:27:07.850926: step: 1560/530, loss: 0.008036785759031773 2023-01-24 05:27:08.914277: step: 1564/530, loss: 0.04125150665640831 2023-01-24 05:27:09.949222: step: 1568/530, loss: 0.00927783828228712 2023-01-24 05:27:10.980372: step: 1572/530, loss: 0.011850586161017418 2023-01-24 05:27:12.026499: step: 1576/530, loss: 0.005020054988563061 2023-01-24 05:27:13.082194: step: 1580/530, loss: 0.003278045216575265 2023-01-24 05:27:14.129085: step: 1584/530, loss: 0.031927503645420074 2023-01-24 05:27:15.164141: step: 1588/530, loss: 0.026801520958542824 2023-01-24 05:27:16.211176: step: 1592/530, loss: 0.003425628412514925 2023-01-24 05:27:17.247158: step: 1596/530, loss: 0.049877263605594635 2023-01-24 05:27:18.299381: step: 1600/530, loss: 0.006141694262623787 2023-01-24 05:27:19.378405: step: 1604/530, loss: 0.006621780805289745 2023-01-24 05:27:20.416567: step: 1608/530, loss: 0.007877185009419918 2023-01-24 05:27:21.448711: step: 1612/530, loss: 0.0021937566343694925 2023-01-24 05:27:22.491477: step: 1616/530, loss: 0.006378753576427698 2023-01-24 05:27:23.534949: step: 1620/530, loss: 0.011783838272094727 2023-01-24 05:27:24.571569: step: 1624/530, loss: 0.015877580270171165 2023-01-24 05:27:25.604883: step: 1628/530, loss: 0.00994875468313694 2023-01-24 05:27:26.643901: step: 1632/530, loss: 0.00414926465600729 2023-01-24 05:27:27.699163: step: 1636/530, loss: 0.003867295803502202 2023-01-24 05:27:28.756444: step: 1640/530, loss: 0.027900317683815956 2023-01-24 05:27:29.808981: step: 1644/530, loss: 0.053811896592378616 2023-01-24 05:27:30.863330: step: 1648/530, loss: 0.060002632439136505 2023-01-24 05:27:31.914980: step: 1652/530, loss: 0.029271814972162247 2023-01-24 05:27:32.944891: step: 1656/530, loss: 0.011379271745681763 2023-01-24 05:27:33.988653: step: 1660/530, loss: 0.012634336948394775 2023-01-24 05:27:35.017624: step: 1664/530, loss: 0.0009583713253960013 2023-01-24 05:27:36.054170: step: 1668/530, loss: 0.015642007812857628 2023-01-24 05:27:37.081485: step: 1672/530, loss: 0.0030116497073322535 2023-01-24 05:27:38.132560: step: 1676/530, loss: 0.004310282878577709 2023-01-24 05:27:39.172022: step: 1680/530, loss: 0.0039841230027377605 2023-01-24 05:27:40.204338: step: 1684/530, loss: 0.0407322533428669 2023-01-24 05:27:41.232747: step: 1688/530, loss: 0.038015179336071014 2023-01-24 05:27:42.294398: step: 1692/530, loss: 0.0069891661405563354 2023-01-24 05:27:43.335096: step: 1696/530, loss: 0.11138701438903809 2023-01-24 05:27:44.379353: step: 1700/530, loss: 0.019396452233195305 2023-01-24 05:27:45.441716: step: 1704/530, loss: 0.01320500485599041 2023-01-24 05:27:46.490949: step: 1708/530, loss: 0.03175336495041847 2023-01-24 05:27:47.531280: step: 1712/530, loss: 0.006625065114349127 2023-01-24 05:27:48.554152: step: 1716/530, loss: 0.004687377251684666 2023-01-24 05:27:49.592757: step: 1720/530, loss: 0.04952029883861542 2023-01-24 05:27:50.642248: step: 1724/530, loss: 0.07533345371484756 2023-01-24 05:27:51.692650: step: 1728/530, loss: 0.01125490665435791 2023-01-24 05:27:52.720130: step: 1732/530, loss: 0.00745021877810359 2023-01-24 05:27:53.761610: step: 1736/530, loss: 0.037051569670438766 2023-01-24 05:27:54.800847: step: 1740/530, loss: 0.01379351131618023 2023-01-24 05:27:55.846541: step: 1744/530, loss: 0.008265962824225426 2023-01-24 05:27:56.877429: step: 1748/530, loss: 0.00685100955888629 2023-01-24 05:27:57.912278: step: 1752/530, loss: 0.026263441890478134 2023-01-24 05:27:58.953741: step: 1756/530, loss: 0.032217733561992645 2023-01-24 05:28:00.024493: step: 1760/530, loss: 0.008177057839930058 2023-01-24 05:28:01.049688: step: 1764/530, loss: 0.005513209383934736 2023-01-24 05:28:02.073938: step: 1768/530, loss: 0.0 2023-01-24 05:28:03.147068: step: 1772/530, loss: 0.06811343878507614 2023-01-24 05:28:04.195762: step: 1776/530, loss: 0.013587906956672668 2023-01-24 05:28:05.243441: step: 1780/530, loss: 0.05199526995420456 2023-01-24 05:28:06.290308: step: 1784/530, loss: 0.0057129389606416225 2023-01-24 05:28:07.346503: step: 1788/530, loss: 0.007696868851780891 2023-01-24 05:28:08.381104: step: 1792/530, loss: 0.014432776719331741 2023-01-24 05:28:09.443235: step: 1796/530, loss: 0.016515566036105156 2023-01-24 05:28:10.481325: step: 1800/530, loss: 0.005326796788722277 2023-01-24 05:28:11.525178: step: 1804/530, loss: 0.010185799561440945 2023-01-24 05:28:12.567368: step: 1808/530, loss: 0.01364689040929079 2023-01-24 05:28:13.605427: step: 1812/530, loss: 0.07476868480443954 2023-01-24 05:28:14.643898: step: 1816/530, loss: 0.0037018347065895796 2023-01-24 05:28:15.684132: step: 1820/530, loss: 0.005702932830899954 2023-01-24 05:28:16.744681: step: 1824/530, loss: 0.07156221568584442 2023-01-24 05:28:17.787828: step: 1828/530, loss: 0.0053881024941802025 2023-01-24 05:28:18.823295: step: 1832/530, loss: 0.006276683881878853 2023-01-24 05:28:19.859204: step: 1836/530, loss: 0.010244112461805344 2023-01-24 05:28:20.908046: step: 1840/530, loss: 0.008763822726905346 2023-01-24 05:28:21.946913: step: 1844/530, loss: 0.002047961577773094 2023-01-24 05:28:22.990471: step: 1848/530, loss: 0.032293811440467834 2023-01-24 05:28:24.034981: step: 1852/530, loss: 0.04200919345021248 2023-01-24 05:28:25.069602: step: 1856/530, loss: 0.006460108328610659 2023-01-24 05:28:26.106576: step: 1860/530, loss: 0.005821909289807081 2023-01-24 05:28:27.153205: step: 1864/530, loss: 0.03500371426343918 2023-01-24 05:28:28.190082: step: 1868/530, loss: 0.004076194949448109 2023-01-24 05:28:29.227805: step: 1872/530, loss: 0.026200944557785988 2023-01-24 05:28:30.268253: step: 1876/530, loss: 0.006102739367634058 2023-01-24 05:28:31.306674: step: 1880/530, loss: 0.0129562858492136 2023-01-24 05:28:32.345593: step: 1884/530, loss: 0.0 2023-01-24 05:28:33.397334: step: 1888/530, loss: 0.005350232124328613 2023-01-24 05:28:34.435346: step: 1892/530, loss: 0.04558427631855011 2023-01-24 05:28:35.469502: step: 1896/530, loss: 0.007803677581250668 2023-01-24 05:28:36.492015: step: 1900/530, loss: 0.011326824314892292 2023-01-24 05:28:37.544071: step: 1904/530, loss: 0.009796587750315666 2023-01-24 05:28:38.580114: step: 1908/530, loss: 0.024081693962216377 2023-01-24 05:28:39.637908: step: 1912/530, loss: 0.019140874966979027 2023-01-24 05:28:40.673618: step: 1916/530, loss: 0.020053837448358536 2023-01-24 05:28:41.708815: step: 1920/530, loss: 0.005911235697567463 2023-01-24 05:28:42.738538: step: 1924/530, loss: 0.04242753982543945 2023-01-24 05:28:43.774659: step: 1928/530, loss: 0.0036718174815177917 2023-01-24 05:28:44.812568: step: 1932/530, loss: 0.010214921087026596 2023-01-24 05:28:45.853300: step: 1936/530, loss: 0.004558503162115812 2023-01-24 05:28:46.897835: step: 1940/530, loss: 0.006958734709769487 2023-01-24 05:28:47.945161: step: 1944/530, loss: 0.006459183059632778 2023-01-24 05:28:48.999977: step: 1948/530, loss: 0.0028059878386557102 2023-01-24 05:28:50.039599: step: 1952/530, loss: 0.0032257791608572006 2023-01-24 05:28:51.078494: step: 1956/530, loss: 0.008603297173976898 2023-01-24 05:28:52.115617: step: 1960/530, loss: 0.023853909224271774 2023-01-24 05:28:53.175209: step: 1964/530, loss: 0.0091539416462183 2023-01-24 05:28:54.215673: step: 1968/530, loss: 0.009850227274000645 2023-01-24 05:28:55.251716: step: 1972/530, loss: 0.013459211215376854 2023-01-24 05:28:56.286306: step: 1976/530, loss: 0.005713855382055044 2023-01-24 05:28:57.325604: step: 1980/530, loss: 0.0053106388077139854 2023-01-24 05:28:58.356306: step: 1984/530, loss: 0.058550428599119186 2023-01-24 05:28:59.389479: step: 1988/530, loss: 0.0019260910339653492 2023-01-24 05:29:00.437689: step: 1992/530, loss: 0.005154873710125685 2023-01-24 05:29:01.494758: step: 1996/530, loss: 0.0057460288517177105 2023-01-24 05:29:02.526123: step: 2000/530, loss: 0.004854988772422075 2023-01-24 05:29:03.563576: step: 2004/530, loss: 0.035891011357307434 2023-01-24 05:29:04.611556: step: 2008/530, loss: 0.03619098290801048 2023-01-24 05:29:05.663000: step: 2012/530, loss: 0.026967423036694527 2023-01-24 05:29:06.693257: step: 2016/530, loss: 0.0007727580377832055 2023-01-24 05:29:07.738015: step: 2020/530, loss: 0.00412522628903389 2023-01-24 05:29:08.776104: step: 2024/530, loss: 0.004455647896975279 2023-01-24 05:29:09.805869: step: 2028/530, loss: 0.0035373647697269917 2023-01-24 05:29:10.852654: step: 2032/530, loss: 0.01102820411324501 2023-01-24 05:29:11.896020: step: 2036/530, loss: 0.019225461408495903 2023-01-24 05:29:12.938740: step: 2040/530, loss: 0.00877375528216362 2023-01-24 05:29:13.985705: step: 2044/530, loss: 0.009944208897650242 2023-01-24 05:29:15.016392: step: 2048/530, loss: 0.002099336124956608 2023-01-24 05:29:16.077705: step: 2052/530, loss: 0.0059543452225625515 2023-01-24 05:29:17.136087: step: 2056/530, loss: 0.00714087812229991 2023-01-24 05:29:18.176130: step: 2060/530, loss: 0.009105266071856022 2023-01-24 05:29:19.204940: step: 2064/530, loss: 0.004115113522857428 2023-01-24 05:29:20.253177: step: 2068/530, loss: 0.0011670852545648813 2023-01-24 05:29:21.307606: step: 2072/530, loss: 0.018462466076016426 2023-01-24 05:29:22.346405: step: 2076/530, loss: 0.0032242254819720984 2023-01-24 05:29:23.411591: step: 2080/530, loss: 0.0011447686702013016 2023-01-24 05:29:24.443871: step: 2084/530, loss: 0.00122128298971802 2023-01-24 05:29:25.496232: step: 2088/530, loss: 0.03524351119995117 2023-01-24 05:29:26.534228: step: 2092/530, loss: 0.00704927509650588 2023-01-24 05:29:27.593154: step: 2096/530, loss: 0.006289287470281124 2023-01-24 05:29:28.632762: step: 2100/530, loss: 0.004395214840769768 2023-01-24 05:29:29.682118: step: 2104/530, loss: 0.023771753534674644 2023-01-24 05:29:30.731898: step: 2108/530, loss: 0.001265095779672265 2023-01-24 05:29:31.757993: step: 2112/530, loss: 0.0093479473143816 2023-01-24 05:29:32.802223: step: 2116/530, loss: 0.004298749379813671 2023-01-24 05:29:33.851258: step: 2120/530, loss: 0.028923824429512024 ================================================== Loss: 0.013 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.36750277161862527, 'r': 0.3145042694497154, 'f1': 0.33894427402862987}, 'combined': 0.24974841244214832, 'stategy': 1, 'epoch': 2} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37477468848365025, 'r': 0.3916533279466088, 'f1': 0.3830281535334026}, 'combined': 0.29689263575316377, 'stategy': 1, 'epoch': 2} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3735914626571876, 'r': 0.32538611263690537, 'f1': 0.34782653419807125}, 'combined': 0.2562932357248946, 'stategy': 1, 'epoch': 2} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3567007815200777, 'r': 0.35932358138419596, 'f1': 0.358007377789382}, 'combined': 0.27749854163578896, 'stategy': 1, 'epoch': 2} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 2} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 2} New best korean model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3738546380090498, 'r': 0.3135555028462998, 'f1': 0.34106037151702784}, 'combined': 0.25130764217044155, 'stategy': 1, 'epoch': 0} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36737558326918535, 'r': 0.3794979673183977, 'f1': 0.373338397064357}, 'combined': 0.28938191542787484, 'stategy': 1, 'epoch': 0} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 0} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38236684276980326, 'r': 0.33520584698225636, 'f1': 0.35723656493356754}, 'combined': 0.2632269425826287, 'stategy': 1, 'epoch': 1} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3561820350737081, 'r': 0.35978314020772534, 'f1': 0.35797353136351645}, 'combined': 0.27747230660712763, 'stategy': 1, 'epoch': 1} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 1} ****************************** Epoch: 3 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 05:32:07.403038: step: 4/530, loss: 0.005431821569800377 2023-01-24 05:32:08.451239: step: 8/530, loss: 0.009996199049055576 2023-01-24 05:32:09.478712: step: 12/530, loss: 0.002863501198589802 2023-01-24 05:32:10.507262: step: 16/530, loss: 0.01014662254601717 2023-01-24 05:32:11.551712: step: 20/530, loss: 0.01043922919780016 2023-01-24 05:32:12.599446: step: 24/530, loss: 0.026406753808259964 2023-01-24 05:32:13.635333: step: 28/530, loss: 0.009597786702215672 2023-01-24 05:32:14.684137: step: 32/530, loss: 0.002693016780540347 2023-01-24 05:32:15.724618: step: 36/530, loss: 0.00951580610126257 2023-01-24 05:32:16.765121: step: 40/530, loss: 0.004581989720463753 2023-01-24 05:32:17.807774: step: 44/530, loss: 0.023599563166499138 2023-01-24 05:32:18.836153: step: 48/530, loss: 0.0036640758626163006 2023-01-24 05:32:19.864531: step: 52/530, loss: 0.004040162544697523 2023-01-24 05:32:20.895268: step: 56/530, loss: 0.005668823607265949 2023-01-24 05:32:21.929286: step: 60/530, loss: 0.003638617228716612 2023-01-24 05:32:22.964765: step: 64/530, loss: 0.006536995060741901 2023-01-24 05:32:24.006611: step: 68/530, loss: 0.007913414388895035 2023-01-24 05:32:25.052180: step: 72/530, loss: 0.03715172037482262 2023-01-24 05:32:26.093604: step: 76/530, loss: 0.007902665063738823 2023-01-24 05:32:27.141078: step: 80/530, loss: 0.015202267095446587 2023-01-24 05:32:28.177688: step: 84/530, loss: 0.005592564586549997 2023-01-24 05:32:29.213701: step: 88/530, loss: 0.017473073676228523 2023-01-24 05:32:30.258244: step: 92/530, loss: 0.010819935239851475 2023-01-24 05:32:31.290061: step: 96/530, loss: 0.00913731288164854 2023-01-24 05:32:32.320402: step: 100/530, loss: 0.005119699519127607 2023-01-24 05:32:33.386409: step: 104/530, loss: 0.005616622511297464 2023-01-24 05:32:34.442237: step: 108/530, loss: 0.019643492996692657 2023-01-24 05:32:35.470011: step: 112/530, loss: 0.010574262589216232 2023-01-24 05:32:36.516343: step: 116/530, loss: 0.005679734982550144 2023-01-24 05:32:37.566199: step: 120/530, loss: 0.004575694911181927 2023-01-24 05:32:38.605916: step: 124/530, loss: 0.0025474310386925936 2023-01-24 05:32:39.660855: step: 128/530, loss: 0.0032287563662976027 2023-01-24 05:32:40.718498: step: 132/530, loss: 0.00046567703248001635 2023-01-24 05:32:41.763224: step: 136/530, loss: 0.01558406837284565 2023-01-24 05:32:42.799133: step: 140/530, loss: 0.0031504291109740734 2023-01-24 05:32:43.833689: step: 144/530, loss: 0.004133196547627449 2023-01-24 05:32:44.882407: step: 148/530, loss: 0.007097297813743353 2023-01-24 05:32:45.917429: step: 152/530, loss: 0.020086877048015594 2023-01-24 05:32:46.960125: step: 156/530, loss: 0.016046728938817978 2023-01-24 05:32:47.985267: step: 160/530, loss: 0.008558408357203007 2023-01-24 05:32:49.047375: step: 164/530, loss: 0.0038368371315300465 2023-01-24 05:32:50.093700: step: 168/530, loss: 0.008134753443300724 2023-01-24 05:32:51.140150: step: 172/530, loss: 0.0055014705285429955 2023-01-24 05:32:52.198096: step: 176/530, loss: 0.0055412412621080875 2023-01-24 05:32:53.232979: step: 180/530, loss: 0.04135976359248161 2023-01-24 05:32:54.270335: step: 184/530, loss: 0.011304151266813278 2023-01-24 05:32:55.314640: step: 188/530, loss: 0.007178763393312693 2023-01-24 05:32:56.373688: step: 192/530, loss: 0.007974209263920784 2023-01-24 05:32:57.452893: step: 196/530, loss: 0.006611658725887537 2023-01-24 05:32:58.492081: step: 200/530, loss: 0.007347870152443647 2023-01-24 05:32:59.545335: step: 204/530, loss: 0.0027312615420669317 2023-01-24 05:33:00.589979: step: 208/530, loss: 0.005284967366605997 2023-01-24 05:33:01.627466: step: 212/530, loss: 0.009669600985944271 2023-01-24 05:33:02.684707: step: 216/530, loss: 0.01777213253080845 2023-01-24 05:33:03.730574: step: 220/530, loss: 0.008092140778899193 2023-01-24 05:33:04.776610: step: 224/530, loss: 0.013502043671905994 2023-01-24 05:33:05.841269: step: 228/530, loss: 0.00566902058199048 2023-01-24 05:33:06.920808: step: 232/530, loss: 0.0021324350964277983 2023-01-24 05:33:07.969404: step: 236/530, loss: 0.0709192305803299 2023-01-24 05:33:09.006593: step: 240/530, loss: 0.006102538201957941 2023-01-24 05:33:10.056715: step: 244/530, loss: 0.024573395028710365 2023-01-24 05:33:11.101545: step: 248/530, loss: 0.009836941957473755 2023-01-24 05:33:12.150369: step: 252/530, loss: 0.0063698445446789265 2023-01-24 05:33:13.212149: step: 256/530, loss: 0.07554195821285248 2023-01-24 05:33:14.246237: step: 260/530, loss: 0.004398987628519535 2023-01-24 05:33:15.275678: step: 264/530, loss: 0.01768602430820465 2023-01-24 05:33:16.331722: step: 268/530, loss: 0.0414053350687027 2023-01-24 05:33:17.367718: step: 272/530, loss: 0.018624572083353996 2023-01-24 05:33:18.429957: step: 276/530, loss: 0.02465970069169998 2023-01-24 05:33:19.468534: step: 280/530, loss: 0.016789887100458145 2023-01-24 05:33:20.532183: step: 284/530, loss: 0.02029453217983246 2023-01-24 05:33:21.582806: step: 288/530, loss: 0.005288269836455584 2023-01-24 05:33:22.631465: step: 292/530, loss: 0.003636611858382821 2023-01-24 05:33:23.675683: step: 296/530, loss: 0.026374856010079384 2023-01-24 05:33:24.728876: step: 300/530, loss: 0.002348975045606494 2023-01-24 05:33:25.775513: step: 304/530, loss: 0.009162580594420433 2023-01-24 05:33:26.816052: step: 308/530, loss: 0.004208069294691086 2023-01-24 05:33:27.868601: step: 312/530, loss: 0.020622577518224716 2023-01-24 05:33:28.900817: step: 316/530, loss: 0.0021263256203383207 2023-01-24 05:33:29.962221: step: 320/530, loss: 0.007317597512155771 2023-01-24 05:33:30.994529: step: 324/530, loss: 0.0004972377209924161 2023-01-24 05:33:32.054737: step: 328/530, loss: 0.0056449174880981445 2023-01-24 05:33:33.104174: step: 332/530, loss: 0.0039084292948246 2023-01-24 05:33:34.147978: step: 336/530, loss: 0.00307081057690084 2023-01-24 05:33:35.195729: step: 340/530, loss: 0.02081211656332016 2023-01-24 05:33:36.266052: step: 344/530, loss: 0.017144719138741493 2023-01-24 05:33:37.321461: step: 348/530, loss: 0.002932160161435604 2023-01-24 05:33:38.363683: step: 352/530, loss: 0.012656448408961296 2023-01-24 05:33:39.429869: step: 356/530, loss: 0.000280795618891716 2023-01-24 05:33:40.472684: step: 360/530, loss: 0.0072136023081839085 2023-01-24 05:33:41.519426: step: 364/530, loss: 0.007043606601655483 2023-01-24 05:33:42.559948: step: 368/530, loss: 0.013517667539417744 2023-01-24 05:33:43.596052: step: 372/530, loss: 0.004874826408922672 2023-01-24 05:33:44.632532: step: 376/530, loss: 0.003717508865520358 2023-01-24 05:33:45.687877: step: 380/530, loss: 0.010346094146370888 2023-01-24 05:33:46.744633: step: 384/530, loss: 0.0156561266630888 2023-01-24 05:33:47.795119: step: 388/530, loss: 0.012330153957009315 2023-01-24 05:33:48.836599: step: 392/530, loss: 0.006983927451074123 2023-01-24 05:33:49.893127: step: 396/530, loss: 0.00360304513014853 2023-01-24 05:33:50.944100: step: 400/530, loss: 0.0014622666640207171 2023-01-24 05:33:51.991530: step: 404/530, loss: 0.0037822534795850515 2023-01-24 05:33:53.039437: step: 408/530, loss: 0.009406151250004768 2023-01-24 05:33:54.102333: step: 412/530, loss: 0.02384459413588047 2023-01-24 05:33:55.142511: step: 416/530, loss: 0.003428320400416851 2023-01-24 05:33:56.186943: step: 420/530, loss: 0.001968947472050786 2023-01-24 05:33:57.252104: step: 424/530, loss: 0.002706412458792329 2023-01-24 05:33:58.311473: step: 428/530, loss: 0.00510001927614212 2023-01-24 05:33:59.360218: step: 432/530, loss: 0.05905650928616524 2023-01-24 05:34:00.412807: step: 436/530, loss: 0.034021515399217606 2023-01-24 05:34:01.455361: step: 440/530, loss: 0.004314336460083723 2023-01-24 05:34:02.500235: step: 444/530, loss: 0.00461387075483799 2023-01-24 05:34:03.551563: step: 448/530, loss: 0.003960966132581234 2023-01-24 05:34:04.608863: step: 452/530, loss: 0.008891516365110874 2023-01-24 05:34:05.657674: step: 456/530, loss: 0.004702720325440168 2023-01-24 05:34:06.721968: step: 460/530, loss: 0.00783851370215416 2023-01-24 05:34:07.764101: step: 464/530, loss: 0.003973011393100023 2023-01-24 05:34:08.807008: step: 468/530, loss: 0.0057945833541452885 2023-01-24 05:34:09.849214: step: 472/530, loss: 0.006109802983701229 2023-01-24 05:34:10.891108: step: 476/530, loss: 0.004593989811837673 2023-01-24 05:34:11.942384: step: 480/530, loss: 0.004475194960832596 2023-01-24 05:34:13.011403: step: 484/530, loss: 0.0083687175065279 2023-01-24 05:34:14.056635: step: 488/530, loss: 0.004098036326467991 2023-01-24 05:34:15.108803: step: 492/530, loss: 0.007627636194229126 2023-01-24 05:34:16.166304: step: 496/530, loss: 0.039637550711631775 2023-01-24 05:34:17.202515: step: 500/530, loss: 0.004907737020403147 2023-01-24 05:34:18.252746: step: 504/530, loss: 0.0031770847272127867 2023-01-24 05:34:19.289178: step: 508/530, loss: 0.005108467768877745 2023-01-24 05:34:20.331213: step: 512/530, loss: 0.004742048680782318 2023-01-24 05:34:21.380210: step: 516/530, loss: 0.006341639906167984 2023-01-24 05:34:22.416863: step: 520/530, loss: 0.0015437587862834334 2023-01-24 05:34:23.469469: step: 524/530, loss: 0.011380205862224102 2023-01-24 05:34:24.514888: step: 528/530, loss: 0.004746524151414633 2023-01-24 05:34:25.582110: step: 532/530, loss: 0.015550093725323677 2023-01-24 05:34:26.620631: step: 536/530, loss: 0.0020516414660960436 2023-01-24 05:34:27.665002: step: 540/530, loss: 0.005931579973548651 2023-01-24 05:34:28.723180: step: 544/530, loss: 0.00400571059435606 2023-01-24 05:34:29.789342: step: 548/530, loss: 0.0054653421975672245 2023-01-24 05:34:30.835503: step: 552/530, loss: 0.003762952983379364 2023-01-24 05:34:31.883431: step: 556/530, loss: 0.015496413223445415 2023-01-24 05:34:32.950535: step: 560/530, loss: 0.03712219372391701 2023-01-24 05:34:33.989593: step: 564/530, loss: 0.03386061638593674 2023-01-24 05:34:35.049735: step: 568/530, loss: 0.0016969263087958097 2023-01-24 05:34:36.106654: step: 572/530, loss: 0.010116786696016788 2023-01-24 05:34:37.137823: step: 576/530, loss: 0.011949919164180756 2023-01-24 05:34:38.203763: step: 580/530, loss: 0.022678064182400703 2023-01-24 05:34:39.249623: step: 584/530, loss: 0.026317300274968147 2023-01-24 05:34:40.288906: step: 588/530, loss: 0.0053278496488928795 2023-01-24 05:34:41.318674: step: 592/530, loss: 0.017307987436652184 2023-01-24 05:34:42.381525: step: 596/530, loss: 0.017238279804587364 2023-01-24 05:34:43.455481: step: 600/530, loss: 0.026832664385437965 2023-01-24 05:34:44.509295: step: 604/530, loss: 0.015705600380897522 2023-01-24 05:34:45.543140: step: 608/530, loss: 0.005115372594445944 2023-01-24 05:34:46.587658: step: 612/530, loss: 0.005850158631801605 2023-01-24 05:34:47.646013: step: 616/530, loss: 0.0015624072402715683 2023-01-24 05:34:48.691172: step: 620/530, loss: 0.0031924168579280376 2023-01-24 05:34:49.748766: step: 624/530, loss: 0.010317697189748287 2023-01-24 05:34:50.799769: step: 628/530, loss: 0.0330805741250515 2023-01-24 05:34:51.841363: step: 632/530, loss: 0.02072126604616642 2023-01-24 05:34:52.894927: step: 636/530, loss: 0.0029019995126873255 2023-01-24 05:34:53.952285: step: 640/530, loss: 0.0052552009001374245 2023-01-24 05:34:55.002448: step: 644/530, loss: 0.009886824525892735 2023-01-24 05:34:56.050285: step: 648/530, loss: 0.01690363511443138 2023-01-24 05:34:57.095987: step: 652/530, loss: 0.01833905093371868 2023-01-24 05:34:58.148581: step: 656/530, loss: 0.008822561241686344 2023-01-24 05:34:59.193901: step: 660/530, loss: 0.006634217221289873 2023-01-24 05:35:00.259234: step: 664/530, loss: 0.010887330397963524 2023-01-24 05:35:01.314185: step: 668/530, loss: 0.004357458092272282 2023-01-24 05:35:02.352093: step: 672/530, loss: 0.004532279912382364 2023-01-24 05:35:03.398376: step: 676/530, loss: 0.0032102311961352825 2023-01-24 05:35:04.445503: step: 680/530, loss: 0.00895298644900322 2023-01-24 05:35:05.493248: step: 684/530, loss: 0.05064159631729126 2023-01-24 05:35:06.535549: step: 688/530, loss: 0.006235008593648672 2023-01-24 05:35:07.609930: step: 692/530, loss: 0.020631618797779083 2023-01-24 05:35:08.655316: step: 696/530, loss: 0.0035677680280059576 2023-01-24 05:35:09.690529: step: 700/530, loss: 0.0010200878605246544 2023-01-24 05:35:10.742820: step: 704/530, loss: 0.009017433039844036 2023-01-24 05:35:11.791524: step: 708/530, loss: 0.005654364824295044 2023-01-24 05:35:12.845075: step: 712/530, loss: 0.0012615763116627932 2023-01-24 05:35:13.921376: step: 716/530, loss: 0.008098145946860313 2023-01-24 05:35:14.966716: step: 720/530, loss: 0.009016198106110096 2023-01-24 05:35:16.047619: step: 724/530, loss: 0.009763686917722225 2023-01-24 05:35:17.096156: step: 728/530, loss: 0.005619431380182505 2023-01-24 05:35:18.141535: step: 732/530, loss: 0.00087446573888883 2023-01-24 05:35:19.183518: step: 736/530, loss: 0.01173071376979351 2023-01-24 05:35:20.239571: step: 740/530, loss: 0.0013534734025597572 2023-01-24 05:35:21.271581: step: 744/530, loss: 0.006439316552132368 2023-01-24 05:35:22.346836: step: 748/530, loss: 0.0033913280349224806 2023-01-24 05:35:23.375509: step: 752/530, loss: 0.007247533183544874 2023-01-24 05:35:24.429546: step: 756/530, loss: 0.0018336847424507141 2023-01-24 05:35:25.466716: step: 760/530, loss: 0.006364730652421713 2023-01-24 05:35:26.508264: step: 764/530, loss: 0.002719556214287877 2023-01-24 05:35:27.576016: step: 768/530, loss: 0.026545636355876923 2023-01-24 05:35:28.628181: step: 772/530, loss: 0.011393429711461067 2023-01-24 05:35:29.681827: step: 776/530, loss: 0.007845165207982063 2023-01-24 05:35:30.727221: step: 780/530, loss: 0.032166190445423126 2023-01-24 05:35:31.769124: step: 784/530, loss: 0.01356776524335146 2023-01-24 05:35:32.817468: step: 788/530, loss: 0.007504757028073072 2023-01-24 05:35:33.887606: step: 792/530, loss: 0.0068154968321323395 2023-01-24 05:35:34.928284: step: 796/530, loss: 0.00044549262383952737 2023-01-24 05:35:35.966266: step: 800/530, loss: 0.0025988593697547913 2023-01-24 05:35:37.002339: step: 804/530, loss: 0.0017277478473260999 2023-01-24 05:35:38.048902: step: 808/530, loss: 0.028265642002224922 2023-01-24 05:35:39.097949: step: 812/530, loss: 0.00908300094306469 2023-01-24 05:35:40.148190: step: 816/530, loss: 0.003962434828281403 2023-01-24 05:35:41.199459: step: 820/530, loss: 0.029387155547738075 2023-01-24 05:35:42.236050: step: 824/530, loss: 0.01663140393793583 2023-01-24 05:35:43.287418: step: 828/530, loss: 0.027380110695958138 2023-01-24 05:35:44.344565: step: 832/530, loss: 0.02776745893061161 2023-01-24 05:35:45.369911: step: 836/530, loss: 0.012709911912679672 2023-01-24 05:35:46.409934: step: 840/530, loss: 0.010074610821902752 2023-01-24 05:35:47.462932: step: 844/530, loss: 0.009502899833023548 2023-01-24 05:35:48.503307: step: 848/530, loss: 0.011394928209483624 2023-01-24 05:35:49.551462: step: 852/530, loss: 0.0006734206690452993 2023-01-24 05:35:50.590379: step: 856/530, loss: 0.011475330218672752 2023-01-24 05:35:51.647385: step: 860/530, loss: 0.021002793684601784 2023-01-24 05:35:52.681106: step: 864/530, loss: 0.012125730514526367 2023-01-24 05:35:53.716819: step: 868/530, loss: 0.0024132307153195143 2023-01-24 05:35:54.777514: step: 872/530, loss: 0.004029131960123777 2023-01-24 05:35:55.811588: step: 876/530, loss: 0.015598522499203682 2023-01-24 05:35:56.856800: step: 880/530, loss: 0.032264843583106995 2023-01-24 05:35:57.903335: step: 884/530, loss: 0.009966591373085976 2023-01-24 05:35:58.954837: step: 888/530, loss: 0.014536065980792046 2023-01-24 05:36:00.004698: step: 892/530, loss: 0.007731547579169273 2023-01-24 05:36:01.055661: step: 896/530, loss: 0.005296436604112387 2023-01-24 05:36:02.153720: step: 900/530, loss: 0.008345085196197033 2023-01-24 05:36:03.184648: step: 904/530, loss: 0.004201252479106188 2023-01-24 05:36:04.232338: step: 908/530, loss: 0.004555849824100733 2023-01-24 05:36:05.268458: step: 912/530, loss: 0.006779415998607874 2023-01-24 05:36:06.321384: step: 916/530, loss: 0.0053204880096018314 2023-01-24 05:36:07.357529: step: 920/530, loss: 0.018930848687887192 2023-01-24 05:36:08.405324: step: 924/530, loss: 0.013539772480726242 2023-01-24 05:36:09.448055: step: 928/530, loss: 0.023202110081911087 2023-01-24 05:36:10.494545: step: 932/530, loss: 0.022371899336576462 2023-01-24 05:36:11.543493: step: 936/530, loss: 0.004724096041172743 2023-01-24 05:36:12.584201: step: 940/530, loss: 0.005772337317466736 2023-01-24 05:36:13.607910: step: 944/530, loss: 0.005176054313778877 2023-01-24 05:36:14.646682: step: 948/530, loss: 0.003047067206352949 2023-01-24 05:36:15.714858: step: 952/530, loss: 0.02281697653234005 2023-01-24 05:36:16.760305: step: 956/530, loss: 0.005941150244325399 2023-01-24 05:36:17.802893: step: 960/530, loss: 0.019261520355939865 2023-01-24 05:36:18.852187: step: 964/530, loss: 0.006394181400537491 2023-01-24 05:36:19.899848: step: 968/530, loss: 0.010386641137301922 2023-01-24 05:36:20.934478: step: 972/530, loss: 0.002203629817813635 2023-01-24 05:36:21.974481: step: 976/530, loss: 0.023285146802663803 2023-01-24 05:36:23.020318: step: 980/530, loss: 0.03983256220817566 2023-01-24 05:36:24.059131: step: 984/530, loss: 0.017802519723773003 2023-01-24 05:36:25.089663: step: 988/530, loss: 0.010056165978312492 2023-01-24 05:36:26.134535: step: 992/530, loss: 0.003944454248994589 2023-01-24 05:36:27.173893: step: 996/530, loss: 0.010143429972231388 2023-01-24 05:36:28.216314: step: 1000/530, loss: 0.007448958232998848 2023-01-24 05:36:29.252537: step: 1004/530, loss: 0.026389002799987793 2023-01-24 05:36:30.308413: step: 1008/530, loss: 0.02232789620757103 2023-01-24 05:36:31.344797: step: 1012/530, loss: 0.004627691116183996 2023-01-24 05:36:32.375850: step: 1016/530, loss: 0.01990676485002041 2023-01-24 05:36:33.413405: step: 1020/530, loss: 0.007293072063475847 2023-01-24 05:36:34.467518: step: 1024/530, loss: 0.0034510032273828983 2023-01-24 05:36:35.515816: step: 1028/530, loss: 0.03335084393620491 2023-01-24 05:36:36.552234: step: 1032/530, loss: 0.021045751869678497 2023-01-24 05:36:37.591584: step: 1036/530, loss: 0.022299353033304214 2023-01-24 05:36:38.655549: step: 1040/530, loss: 0.004965097177773714 2023-01-24 05:36:39.709438: step: 1044/530, loss: 0.0012303362600505352 2023-01-24 05:36:40.755310: step: 1048/530, loss: 0.012189645320177078 2023-01-24 05:36:41.799128: step: 1052/530, loss: 0.009075603447854519 2023-01-24 05:36:42.828753: step: 1056/530, loss: 0.007207685615867376 2023-01-24 05:36:43.880705: step: 1060/530, loss: 0.003411687444895506 2023-01-24 05:36:44.922199: step: 1064/530, loss: 0.0025498555041849613 2023-01-24 05:36:45.972343: step: 1068/530, loss: 0.005067363381385803 2023-01-24 05:36:47.020136: step: 1072/530, loss: 0.004650200717151165 2023-01-24 05:36:48.061133: step: 1076/530, loss: 0.009816146455705166 2023-01-24 05:36:49.098704: step: 1080/530, loss: 0.007132126018404961 2023-01-24 05:36:50.149319: step: 1084/530, loss: 0.013316216878592968 2023-01-24 05:36:51.208348: step: 1088/530, loss: 0.009215674363076687 2023-01-24 05:36:52.257140: step: 1092/530, loss: 0.010878689587116241 2023-01-24 05:36:53.312927: step: 1096/530, loss: 0.008455169387161732 2023-01-24 05:36:54.376398: step: 1100/530, loss: 0.0463222935795784 2023-01-24 05:36:55.408252: step: 1104/530, loss: 0.0018649438861757517 2023-01-24 05:36:56.434611: step: 1108/530, loss: 0.014679823070764542 2023-01-24 05:36:57.476237: step: 1112/530, loss: 0.013960030861198902 2023-01-24 05:36:58.531365: step: 1116/530, loss: 0.009450647979974747 2023-01-24 05:36:59.566838: step: 1120/530, loss: 0.005764094181358814 2023-01-24 05:37:00.633451: step: 1124/530, loss: 0.002159183146432042 2023-01-24 05:37:01.695581: step: 1128/530, loss: 0.006127052009105682 2023-01-24 05:37:02.736904: step: 1132/530, loss: 0.004724337253719568 2023-01-24 05:37:03.792046: step: 1136/530, loss: 0.010194825008511543 2023-01-24 05:37:04.842689: step: 1140/530, loss: 0.012295125052332878 2023-01-24 05:37:05.873959: step: 1144/530, loss: 0.03260317072272301 2023-01-24 05:37:06.930165: step: 1148/530, loss: 0.028742346912622452 2023-01-24 05:37:07.973339: step: 1152/530, loss: 0.006975257769227028 2023-01-24 05:37:09.018290: step: 1156/530, loss: 0.038547661155462265 2023-01-24 05:37:10.065110: step: 1160/530, loss: 0.0048523638397455215 2023-01-24 05:37:11.093591: step: 1164/530, loss: 0.003225501161068678 2023-01-24 05:37:12.130283: step: 1168/530, loss: 0.005581739824265242 2023-01-24 05:37:13.161588: step: 1172/530, loss: 0.016334837302565575 2023-01-24 05:37:14.211950: step: 1176/530, loss: 0.0056094275787472725 2023-01-24 05:37:15.262775: step: 1180/530, loss: 0.0046770451590418816 2023-01-24 05:37:16.320792: step: 1184/530, loss: 0.00882962066680193 2023-01-24 05:37:17.364415: step: 1188/530, loss: 0.007463640533387661 2023-01-24 05:37:18.404907: step: 1192/530, loss: 0.03753942996263504 2023-01-24 05:37:19.440566: step: 1196/530, loss: 0.0013762930175289512 2023-01-24 05:37:20.501166: step: 1200/530, loss: 0.0070342812687158585 2023-01-24 05:37:21.520944: step: 1204/530, loss: 0.002245308831334114 2023-01-24 05:37:22.575187: step: 1208/530, loss: 0.004292265046387911 2023-01-24 05:37:23.611991: step: 1212/530, loss: 0.003306174650788307 2023-01-24 05:37:24.668145: step: 1216/530, loss: 0.003461097367107868 2023-01-24 05:37:25.712660: step: 1220/530, loss: 0.008810692466795444 2023-01-24 05:37:26.768931: step: 1224/530, loss: 0.004546773619949818 2023-01-24 05:37:27.799632: step: 1228/530, loss: 0.014986623078584671 2023-01-24 05:37:28.839724: step: 1232/530, loss: 0.003765576519072056 2023-01-24 05:37:29.879318: step: 1236/530, loss: 0.009695884771645069 2023-01-24 05:37:30.921539: step: 1240/530, loss: 0.001070527476258576 2023-01-24 05:37:31.967260: step: 1244/530, loss: 0.0036728207487612963 2023-01-24 05:37:33.001818: step: 1248/530, loss: 0.006865540519356728 2023-01-24 05:37:34.053480: step: 1252/530, loss: 0.001643989933654666 2023-01-24 05:37:35.081893: step: 1256/530, loss: 0.007976176217198372 2023-01-24 05:37:36.123197: step: 1260/530, loss: 0.03025640919804573 2023-01-24 05:37:37.178691: step: 1264/530, loss: 0.002342989668250084 2023-01-24 05:37:38.227655: step: 1268/530, loss: 0.0005315643502399325 2023-01-24 05:37:39.269729: step: 1272/530, loss: 0.010589626617729664 2023-01-24 05:37:40.315435: step: 1276/530, loss: 0.016972288489341736 2023-01-24 05:37:41.361136: step: 1280/530, loss: 0.003189470386132598 2023-01-24 05:37:42.407061: step: 1284/530, loss: 0.0029718868900090456 2023-01-24 05:37:43.447969: step: 1288/530, loss: 0.011221029795706272 2023-01-24 05:37:44.493269: step: 1292/530, loss: 0.00947148259729147 2023-01-24 05:37:45.541155: step: 1296/530, loss: 0.005764075554907322 2023-01-24 05:37:46.585302: step: 1300/530, loss: 0.01618027128279209 2023-01-24 05:37:47.621241: step: 1304/530, loss: 0.01004018634557724 2023-01-24 05:37:48.672687: step: 1308/530, loss: 0.059785742312669754 2023-01-24 05:37:49.731648: step: 1312/530, loss: 0.01082677859812975 2023-01-24 05:37:50.758120: step: 1316/530, loss: 0.004467769525945187 2023-01-24 05:37:51.805619: step: 1320/530, loss: 0.0015378388343378901 2023-01-24 05:37:52.860557: step: 1324/530, loss: 0.028778837993741035 2023-01-24 05:37:53.894038: step: 1328/530, loss: 0.007330745458602905 2023-01-24 05:37:54.937413: step: 1332/530, loss: 0.012670734897255898 2023-01-24 05:37:55.978048: step: 1336/530, loss: 0.0005725579103454947 2023-01-24 05:37:57.031653: step: 1340/530, loss: 0.026643341407179832 2023-01-24 05:37:58.072667: step: 1344/530, loss: 0.03726726397871971 2023-01-24 05:37:59.110453: step: 1348/530, loss: 0.0052210381254553795 2023-01-24 05:38:00.174042: step: 1352/530, loss: 0.0029350989498198032 2023-01-24 05:38:01.218505: step: 1356/530, loss: 0.0041256071999669075 2023-01-24 05:38:02.264602: step: 1360/530, loss: 0.006800183095037937 2023-01-24 05:38:03.300220: step: 1364/530, loss: 0.005037812516093254 2023-01-24 05:38:04.346135: step: 1368/530, loss: 0.005107303615659475 2023-01-24 05:38:05.377132: step: 1372/530, loss: 0.010213006287813187 2023-01-24 05:38:06.426431: step: 1376/530, loss: 0.004052733536809683 2023-01-24 05:38:07.461465: step: 1380/530, loss: 0.008409635163843632 2023-01-24 05:38:08.496271: step: 1384/530, loss: 0.0036329312715679407 2023-01-24 05:38:09.551556: step: 1388/530, loss: 0.016174299642443657 2023-01-24 05:38:10.598928: step: 1392/530, loss: 0.001608862541615963 2023-01-24 05:38:11.637034: step: 1396/530, loss: 0.005092690233141184 2023-01-24 05:38:12.677438: step: 1400/530, loss: 0.005035769194364548 2023-01-24 05:38:13.713471: step: 1404/530, loss: 0.03963950276374817 2023-01-24 05:38:14.760326: step: 1408/530, loss: 0.0007013366557657719 2023-01-24 05:38:15.801459: step: 1412/530, loss: 0.002183702774345875 2023-01-24 05:38:16.832864: step: 1416/530, loss: 0.0044519598595798016 2023-01-24 05:38:17.887313: step: 1420/530, loss: 0.010128378868103027 2023-01-24 05:38:18.927670: step: 1424/530, loss: 0.004775649402290583 2023-01-24 05:38:19.973445: step: 1428/530, loss: 0.034105680882930756 2023-01-24 05:38:21.006716: step: 1432/530, loss: 0.006160160526633263 2023-01-24 05:38:22.059601: step: 1436/530, loss: 0.005872759502381086 2023-01-24 05:38:23.097023: step: 1440/530, loss: 0.007892990484833717 2023-01-24 05:38:24.141272: step: 1444/530, loss: 0.005610210355371237 2023-01-24 05:38:25.172148: step: 1448/530, loss: 0.0038250540383160114 2023-01-24 05:38:26.224196: step: 1452/530, loss: 0.0013907239772379398 2023-01-24 05:38:27.275530: step: 1456/530, loss: 0.01629927195608616 2023-01-24 05:38:28.309965: step: 1460/530, loss: 0.014263872057199478 2023-01-24 05:38:29.358282: step: 1464/530, loss: 0.007095483597368002 2023-01-24 05:38:30.392879: step: 1468/530, loss: 0.008866426534950733 2023-01-24 05:38:31.447621: step: 1472/530, loss: 0.02516775205731392 2023-01-24 05:38:32.491735: step: 1476/530, loss: 0.003279719967395067 2023-01-24 05:38:33.548587: step: 1480/530, loss: 0.007173987105488777 2023-01-24 05:38:34.590777: step: 1484/530, loss: 0.028564566746354103 2023-01-24 05:38:35.625066: step: 1488/530, loss: 0.00827405322343111 2023-01-24 05:38:36.676298: step: 1492/530, loss: 0.0018098428845405579 2023-01-24 05:38:37.715497: step: 1496/530, loss: 0.0017288204981014132 2023-01-24 05:38:38.760513: step: 1500/530, loss: 0.01009152177721262 2023-01-24 05:38:39.801405: step: 1504/530, loss: 0.011685575358569622 2023-01-24 05:38:40.858413: step: 1508/530, loss: 0.024191131815314293 2023-01-24 05:38:41.900207: step: 1512/530, loss: 0.009218844585120678 2023-01-24 05:38:42.935776: step: 1516/530, loss: 0.008201340213418007 2023-01-24 05:38:43.967288: step: 1520/530, loss: 0.007130790967494249 2023-01-24 05:38:45.012174: step: 1524/530, loss: 0.007450486999005079 2023-01-24 05:38:46.066605: step: 1528/530, loss: 0.009018649347126484 2023-01-24 05:38:47.123917: step: 1532/530, loss: 0.02397296577692032 2023-01-24 05:38:48.176156: step: 1536/530, loss: 0.04176093265414238 2023-01-24 05:38:49.242141: step: 1540/530, loss: 0.0031963936053216457 2023-01-24 05:38:50.290848: step: 1544/530, loss: 0.007208811119198799 2023-01-24 05:38:51.322371: step: 1548/530, loss: 0.006259385030716658 2023-01-24 05:38:52.365454: step: 1552/530, loss: 0.004566723946481943 2023-01-24 05:38:53.408884: step: 1556/530, loss: 0.02112419717013836 2023-01-24 05:38:54.456026: step: 1560/530, loss: 0.0035256589762866497 2023-01-24 05:38:55.506201: step: 1564/530, loss: 0.0024700728245079517 2023-01-24 05:38:56.564861: step: 1568/530, loss: 0.0009783357381820679 2023-01-24 05:38:57.625582: step: 1572/530, loss: 0.011006603948771954 2023-01-24 05:38:58.675368: step: 1576/530, loss: 0.004175816662609577 2023-01-24 05:38:59.712623: step: 1580/530, loss: 0.0032647140324115753 2023-01-24 05:39:00.752248: step: 1584/530, loss: 0.003850224893540144 2023-01-24 05:39:01.817389: step: 1588/530, loss: 0.07564166188240051 2023-01-24 05:39:02.861165: step: 1592/530, loss: 0.00911492109298706 2023-01-24 05:39:03.906497: step: 1596/530, loss: 0.01377045176923275 2023-01-24 05:39:04.952425: step: 1600/530, loss: 0.006769889499992132 2023-01-24 05:39:06.015609: step: 1604/530, loss: 0.016160011291503906 2023-01-24 05:39:07.077412: step: 1608/530, loss: 0.02482665702700615 2023-01-24 05:39:08.151044: step: 1612/530, loss: 0.018679991364479065 2023-01-24 05:39:09.191725: step: 1616/530, loss: 0.006689343601465225 2023-01-24 05:39:10.241804: step: 1620/530, loss: 0.012558117508888245 2023-01-24 05:39:11.287762: step: 1624/530, loss: 0.0026630351785570383 2023-01-24 05:39:12.336191: step: 1628/530, loss: 0.0007008531829342246 2023-01-24 05:39:13.376513: step: 1632/530, loss: 0.007186629809439182 2023-01-24 05:39:14.421096: step: 1636/530, loss: 0.001530971727333963 2023-01-24 05:39:15.465994: step: 1640/530, loss: 0.0047542336396873 2023-01-24 05:39:16.511936: step: 1644/530, loss: 0.006223517470061779 2023-01-24 05:39:17.568546: step: 1648/530, loss: 0.0139730554074049 2023-01-24 05:39:18.617358: step: 1652/530, loss: 0.0036268585827201605 2023-01-24 05:39:19.667119: step: 1656/530, loss: 0.006946123205125332 2023-01-24 05:39:20.712153: step: 1660/530, loss: 0.006818384863436222 2023-01-24 05:39:21.752601: step: 1664/530, loss: 0.0011433502659201622 2023-01-24 05:39:22.813003: step: 1668/530, loss: 0.004938792437314987 2023-01-24 05:39:23.848923: step: 1672/530, loss: 0.011463537812232971 2023-01-24 05:39:24.890966: step: 1676/530, loss: 0.032061465084552765 2023-01-24 05:39:25.921057: step: 1680/530, loss: 0.002863953821361065 2023-01-24 05:39:26.972112: step: 1684/530, loss: 0.04139088839292526 2023-01-24 05:39:28.013568: step: 1688/530, loss: 0.008814378641545773 2023-01-24 05:39:29.065623: step: 1692/530, loss: 0.0033131532836705446 2023-01-24 05:39:30.114839: step: 1696/530, loss: 0.00244878395460546 2023-01-24 05:39:31.146395: step: 1700/530, loss: 0.006749260239303112 2023-01-24 05:39:32.194959: step: 1704/530, loss: 0.005634751170873642 2023-01-24 05:39:33.244145: step: 1708/530, loss: 0.005944405682384968 2023-01-24 05:39:34.274739: step: 1712/530, loss: 0.0054340241476893425 2023-01-24 05:39:35.322801: step: 1716/530, loss: 0.011103671975433826 2023-01-24 05:39:36.364752: step: 1720/530, loss: 0.005122414790093899 2023-01-24 05:39:37.394187: step: 1724/530, loss: 0.01340001355856657 2023-01-24 05:39:38.448593: step: 1728/530, loss: 0.0029655080288648605 2023-01-24 05:39:39.488996: step: 1732/530, loss: 0.002911247778683901 2023-01-24 05:39:40.515169: step: 1736/530, loss: 0.01641754060983658 2023-01-24 05:39:41.580773: step: 1740/530, loss: 0.00841789972037077 2023-01-24 05:39:42.619467: step: 1744/530, loss: 0.0006806628662161529 2023-01-24 05:39:43.663305: step: 1748/530, loss: 0.0027705375105142593 2023-01-24 05:39:44.705681: step: 1752/530, loss: 0.006467380095273256 2023-01-24 05:39:45.748387: step: 1756/530, loss: 0.005140830297023058 2023-01-24 05:39:46.782118: step: 1760/530, loss: 0.004015334416180849 2023-01-24 05:39:47.810557: step: 1764/530, loss: 0.0005897469818592072 2023-01-24 05:39:48.851437: step: 1768/530, loss: 0.022029118612408638 2023-01-24 05:39:49.891677: step: 1772/530, loss: 0.006759891286492348 2023-01-24 05:39:50.936770: step: 1776/530, loss: 0.005062441807240248 2023-01-24 05:39:51.977179: step: 1780/530, loss: 0.03204406052827835 2023-01-24 05:39:53.037289: step: 1784/530, loss: 0.02780924178659916 2023-01-24 05:39:54.077296: step: 1788/530, loss: 0.009049559943377972 2023-01-24 05:39:55.104877: step: 1792/530, loss: 0.025827880948781967 2023-01-24 05:39:56.167420: step: 1796/530, loss: 0.009122991934418678 2023-01-24 05:39:57.195859: step: 1800/530, loss: 0.002891652984544635 2023-01-24 05:39:58.225748: step: 1804/530, loss: 0.019659172743558884 2023-01-24 05:39:59.293637: step: 1808/530, loss: 0.0005233991541899741 2023-01-24 05:40:00.329499: step: 1812/530, loss: 0.024127474054694176 2023-01-24 05:40:01.387449: step: 1816/530, loss: 0.04506048560142517 2023-01-24 05:40:02.423748: step: 1820/530, loss: 0.007663419004529715 2023-01-24 05:40:03.476420: step: 1824/530, loss: 0.0012375907972455025 2023-01-24 05:40:04.533456: step: 1828/530, loss: 0.002767898142337799 2023-01-24 05:40:05.588822: step: 1832/530, loss: 0.007024152670055628 2023-01-24 05:40:06.628954: step: 1836/530, loss: 0.007125238422304392 2023-01-24 05:40:07.670992: step: 1840/530, loss: 0.000880287610925734 2023-01-24 05:40:08.711910: step: 1844/530, loss: 0.02423970401287079 2023-01-24 05:40:09.747306: step: 1848/530, loss: 0.0023451962042599916 2023-01-24 05:40:10.794453: step: 1852/530, loss: 0.015652643516659737 2023-01-24 05:40:11.839873: step: 1856/530, loss: 0.009162044152617455 2023-01-24 05:40:12.891944: step: 1860/530, loss: 0.005536372773349285 2023-01-24 05:40:13.943564: step: 1864/530, loss: 0.006407800130546093 2023-01-24 05:40:15.013259: step: 1868/530, loss: 0.003582555102184415 2023-01-24 05:40:16.066619: step: 1872/530, loss: 0.0066716293804347515 2023-01-24 05:40:17.102775: step: 1876/530, loss: 0.022897623479366302 2023-01-24 05:40:18.141556: step: 1880/530, loss: 0.028789767995476723 2023-01-24 05:40:19.185679: step: 1884/530, loss: 0.003493228694424033 2023-01-24 05:40:20.233643: step: 1888/530, loss: 0.028540266677737236 2023-01-24 05:40:21.284496: step: 1892/530, loss: 0.008012617006897926 2023-01-24 05:40:22.328600: step: 1896/530, loss: 0.004202555399388075 2023-01-24 05:40:23.389855: step: 1900/530, loss: 0.009900493547320366 2023-01-24 05:40:24.419850: step: 1904/530, loss: 0.0005783902597613633 2023-01-24 05:40:25.462584: step: 1908/530, loss: 0.006170824635773897 2023-01-24 05:40:26.500163: step: 1912/530, loss: 0.0012728653382509947 2023-01-24 05:40:27.532245: step: 1916/530, loss: 0.0021315414924174547 2023-01-24 05:40:28.588401: step: 1920/530, loss: 0.002017686842009425 2023-01-24 05:40:29.645295: step: 1924/530, loss: 0.008344687521457672 2023-01-24 05:40:30.690509: step: 1928/530, loss: 0.015048304572701454 2023-01-24 05:40:31.733636: step: 1932/530, loss: 0.025304270908236504 2023-01-24 05:40:32.771823: step: 1936/530, loss: 0.005524095147848129 2023-01-24 05:40:33.814405: step: 1940/530, loss: 0.01964718848466873 2023-01-24 05:40:34.850742: step: 1944/530, loss: 0.006864464376121759 2023-01-24 05:40:35.896462: step: 1948/530, loss: 0.02290772646665573 2023-01-24 05:40:36.931379: step: 1952/530, loss: 0.0013200819958001375 2023-01-24 05:40:37.964836: step: 1956/530, loss: 0.01248240564018488 2023-01-24 05:40:39.033621: step: 1960/530, loss: 0.013508937321603298 2023-01-24 05:40:40.068063: step: 1964/530, loss: 0.015507044270634651 2023-01-24 05:40:41.115882: step: 1968/530, loss: 0.005352470558136702 2023-01-24 05:40:42.155194: step: 1972/530, loss: 0.021453987807035446 2023-01-24 05:40:43.194381: step: 1976/530, loss: 0.0345342680811882 2023-01-24 05:40:44.234446: step: 1980/530, loss: 0.05825893208384514 2023-01-24 05:40:45.277084: step: 1984/530, loss: 0.01437149103730917 2023-01-24 05:40:46.331495: step: 1988/530, loss: 0.006067384500056505 2023-01-24 05:40:47.369920: step: 1992/530, loss: 0.01749325357377529 2023-01-24 05:40:48.412030: step: 1996/530, loss: 0.019947359338402748 2023-01-24 05:40:49.458782: step: 2000/530, loss: 0.04971623420715332 2023-01-24 05:40:50.498979: step: 2004/530, loss: 0.004467702936381102 2023-01-24 05:40:51.540882: step: 2008/530, loss: 0.006505491677671671 2023-01-24 05:40:52.586030: step: 2012/530, loss: 0.023121826350688934 2023-01-24 05:40:53.635066: step: 2016/530, loss: 0.003948783036321402 2023-01-24 05:40:54.656275: step: 2020/530, loss: 0.001281349454075098 2023-01-24 05:40:55.691030: step: 2024/530, loss: 0.003601230215281248 2023-01-24 05:40:56.733911: step: 2028/530, loss: 0.0015417259419336915 2023-01-24 05:40:57.787584: step: 2032/530, loss: 0.03109133429825306 2023-01-24 05:40:58.824045: step: 2036/530, loss: 0.0067815459333360195 2023-01-24 05:40:59.871862: step: 2040/530, loss: 0.003272899193689227 2023-01-24 05:41:00.920132: step: 2044/530, loss: 0.0023744083009660244 2023-01-24 05:41:01.969980: step: 2048/530, loss: 0.010213518515229225 2023-01-24 05:41:03.012351: step: 2052/530, loss: 0.039266642183065414 2023-01-24 05:41:04.064183: step: 2056/530, loss: 0.047216176986694336 2023-01-24 05:41:05.105475: step: 2060/530, loss: 0.003252866445109248 2023-01-24 05:41:06.153189: step: 2064/530, loss: 0.007022211793810129 2023-01-24 05:41:07.192266: step: 2068/530, loss: 0.020488189533352852 2023-01-24 05:41:08.242192: step: 2072/530, loss: 0.006667060777544975 2023-01-24 05:41:09.285276: step: 2076/530, loss: 0.026132578030228615 2023-01-24 05:41:10.322450: step: 2080/530, loss: 0.011762279085814953 2023-01-24 05:41:11.361289: step: 2084/530, loss: 0.010906804352998734 2023-01-24 05:41:12.406067: step: 2088/530, loss: 0.03486092761158943 2023-01-24 05:41:13.458162: step: 2092/530, loss: 0.006506910547614098 2023-01-24 05:41:14.506280: step: 2096/530, loss: 0.002649609697982669 2023-01-24 05:41:15.551573: step: 2100/530, loss: 0.009220363572239876 2023-01-24 05:41:16.602863: step: 2104/530, loss: 0.009778588078916073 2023-01-24 05:41:17.637221: step: 2108/530, loss: 0.021150244399905205 2023-01-24 05:41:18.671018: step: 2112/530, loss: 0.004198956768959761 2023-01-24 05:41:19.715907: step: 2116/530, loss: 0.026482384651899338 2023-01-24 05:41:20.742877: step: 2120/530, loss: 0.0015386679442599416 ================================================== Loss: 0.011 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37004213483146065, 'r': 0.3124644212523719, 'f1': 0.3388245884773662}, 'combined': 0.2496602230885856, 'stategy': 1, 'epoch': 3} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3778885314389228, 'r': 0.3900448720642558, 'f1': 0.3838704846729175}, 'combined': 0.29754554314360115, 'stategy': 1, 'epoch': 3} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3847625811688312, 'r': 0.3212439007861209, 'f1': 0.35014588565519283}, 'combined': 0.25800223153540525, 'stategy': 1, 'epoch': 3} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37210117320075786, 'r': 0.3673131066338364, 'f1': 0.3696916373890971}, 'combined': 0.2865552404642762, 'stategy': 1, 'epoch': 3} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38675608320634547, 'r': 0.329513247361763, 'f1': 0.3558472978681334}, 'combined': 0.2622032721133614, 'stategy': 1, 'epoch': 3} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36457016286531846, 'r': 0.36322983138419596, 'f1': 0.3638987629337065}, 'combined': 0.2820650698337821, 'stategy': 1, 'epoch': 3} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 3} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5, 'r': 0.41304347826086957, 'f1': 0.45238095238095233}, 'combined': 0.22619047619047616, 'stategy': 1, 'epoch': 3} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 3} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3738546380090498, 'r': 0.3135555028462998, 'f1': 0.34106037151702784}, 'combined': 0.25130764217044155, 'stategy': 1, 'epoch': 0} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36737558326918535, 'r': 0.3794979673183977, 'f1': 0.373338397064357}, 'combined': 0.28938191542787484, 'stategy': 1, 'epoch': 0} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 0} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38236684276980326, 'r': 0.33520584698225636, 'f1': 0.35723656493356754}, 'combined': 0.2632269425826287, 'stategy': 1, 'epoch': 1} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3561820350737081, 'r': 0.35978314020772534, 'f1': 0.35797353136351645}, 'combined': 0.27747230660712763, 'stategy': 1, 'epoch': 1} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 1} ****************************** Epoch: 4 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 05:43:43.036361: step: 4/530, loss: 0.00698957359418273 2023-01-24 05:43:44.074178: step: 8/530, loss: 0.005577901378273964 2023-01-24 05:43:45.130264: step: 12/530, loss: 0.009759383276104927 2023-01-24 05:43:46.178666: step: 16/530, loss: 0.00972414668649435 2023-01-24 05:43:47.230152: step: 20/530, loss: 0.003607033519074321 2023-01-24 05:43:48.307603: step: 24/530, loss: 0.0061666653491556644 2023-01-24 05:43:49.343559: step: 28/530, loss: 0.0029013005550950766 2023-01-24 05:43:50.387886: step: 32/530, loss: 0.003962663933634758 2023-01-24 05:43:51.416724: step: 36/530, loss: 0.0003702733083628118 2023-01-24 05:43:52.471262: step: 40/530, loss: 0.008750868029892445 2023-01-24 05:43:53.524295: step: 44/530, loss: 0.014158329926431179 2023-01-24 05:43:54.565496: step: 48/530, loss: 0.0054846820421516895 2023-01-24 05:43:55.618785: step: 52/530, loss: 0.03825291246175766 2023-01-24 05:43:56.653979: step: 56/530, loss: 0.009429728612303734 2023-01-24 05:43:57.703577: step: 60/530, loss: 0.08134341239929199 2023-01-24 05:43:58.742797: step: 64/530, loss: 0.04206562042236328 2023-01-24 05:43:59.795864: step: 68/530, loss: 0.03217296302318573 2023-01-24 05:44:00.838860: step: 72/530, loss: 0.025985410436987877 2023-01-24 05:44:01.890130: step: 76/530, loss: 0.0024232903961092234 2023-01-24 05:44:02.941628: step: 80/530, loss: 0.0027772444300353527 2023-01-24 05:44:03.960853: step: 84/530, loss: 0.007249601185321808 2023-01-24 05:44:04.994613: step: 88/530, loss: 0.008542601019144058 2023-01-24 05:44:06.037688: step: 92/530, loss: 0.014220623299479485 2023-01-24 05:44:07.084084: step: 96/530, loss: 0.0028424325864762068 2023-01-24 05:44:08.127591: step: 100/530, loss: 0.003984866198152304 2023-01-24 05:44:09.174274: step: 104/530, loss: 0.0011020959354937077 2023-01-24 05:44:10.223604: step: 108/530, loss: 0.01406872272491455 2023-01-24 05:44:11.276304: step: 112/530, loss: 0.018042679876089096 2023-01-24 05:44:12.335721: step: 116/530, loss: 0.01465566549450159 2023-01-24 05:44:13.376950: step: 120/530, loss: 0.022666359320282936 2023-01-24 05:44:14.415201: step: 124/530, loss: 0.006903568748384714 2023-01-24 05:44:15.460734: step: 128/530, loss: 0.016194384545087814 2023-01-24 05:44:16.497775: step: 132/530, loss: 0.00874684751033783 2023-01-24 05:44:17.535084: step: 136/530, loss: 0.013416357338428497 2023-01-24 05:44:18.574539: step: 140/530, loss: 0.028904622420668602 2023-01-24 05:44:19.630489: step: 144/530, loss: 0.010000213049352169 2023-01-24 05:44:20.689609: step: 148/530, loss: 0.03181010112166405 2023-01-24 05:44:21.735548: step: 152/530, loss: 0.009423215873539448 2023-01-24 05:44:22.782800: step: 156/530, loss: 0.019819416105747223 2023-01-24 05:44:23.826962: step: 160/530, loss: 0.020426101982593536 2023-01-24 05:44:24.869356: step: 164/530, loss: 0.005861368030309677 2023-01-24 05:44:25.921528: step: 168/530, loss: 0.0040320781990885735 2023-01-24 05:44:27.013111: step: 172/530, loss: 0.0059257387183606625 2023-01-24 05:44:28.055888: step: 176/530, loss: 0.00250278995372355 2023-01-24 05:44:29.092871: step: 180/530, loss: 8.345173409907147e-05 2023-01-24 05:44:30.131818: step: 184/530, loss: 0.007993591018021107 2023-01-24 05:44:31.186928: step: 188/530, loss: 0.007652263157069683 2023-01-24 05:44:32.230867: step: 192/530, loss: 0.004316218197345734 2023-01-24 05:44:33.282794: step: 196/530, loss: 0.06565670669078827 2023-01-24 05:44:34.324691: step: 200/530, loss: 0.0024813583586364985 2023-01-24 05:44:35.364260: step: 204/530, loss: 0.005987337324768305 2023-01-24 05:44:36.423897: step: 208/530, loss: 0.04859894514083862 2023-01-24 05:44:37.488057: step: 212/530, loss: 0.006227625068277121 2023-01-24 05:44:38.540585: step: 216/530, loss: 0.0035669042263180017 2023-01-24 05:44:39.580309: step: 220/530, loss: 0.03454126417636871 2023-01-24 05:44:40.635935: step: 224/530, loss: 0.0043172771111130714 2023-01-24 05:44:41.673935: step: 228/530, loss: 0.015398088842630386 2023-01-24 05:44:42.734667: step: 232/530, loss: 0.009715782478451729 2023-01-24 05:44:43.797130: step: 236/530, loss: 0.006490217987447977 2023-01-24 05:44:44.857200: step: 240/530, loss: 0.036483947187662125 2023-01-24 05:44:45.902019: step: 244/530, loss: 0.0027672559954226017 2023-01-24 05:44:46.950639: step: 248/530, loss: 0.015252219513058662 2023-01-24 05:44:47.994074: step: 252/530, loss: 0.0074973339214921 2023-01-24 05:44:49.034903: step: 256/530, loss: 0.04847541078925133 2023-01-24 05:44:50.079154: step: 260/530, loss: 0.0017978476826101542 2023-01-24 05:44:51.110964: step: 264/530, loss: 0.004983450286090374 2023-01-24 05:44:52.152816: step: 268/530, loss: 0.017880983650684357 2023-01-24 05:44:53.191300: step: 272/530, loss: 0.008143497630953789 2023-01-24 05:44:54.227057: step: 276/530, loss: 0.0400056317448616 2023-01-24 05:44:55.261970: step: 280/530, loss: 0.03198184072971344 2023-01-24 05:44:56.303897: step: 284/530, loss: 0.008575517684221268 2023-01-24 05:44:57.347139: step: 288/530, loss: 0.004899682942777872 2023-01-24 05:44:58.392359: step: 292/530, loss: 0.016800422221422195 2023-01-24 05:44:59.439579: step: 296/530, loss: 0.023409012705087662 2023-01-24 05:45:00.494189: step: 300/530, loss: 0.00782209075987339 2023-01-24 05:45:01.541081: step: 304/530, loss: 0.04012562334537506 2023-01-24 05:45:02.593636: step: 308/530, loss: 0.006925216410309076 2023-01-24 05:45:03.640063: step: 312/530, loss: 0.01726115122437477 2023-01-24 05:45:04.679753: step: 316/530, loss: 0.006735904607921839 2023-01-24 05:45:05.725996: step: 320/530, loss: 0.004824697971343994 2023-01-24 05:45:06.783565: step: 324/530, loss: 0.005202784202992916 2023-01-24 05:45:07.827599: step: 328/530, loss: 0.02611328847706318 2023-01-24 05:45:08.887512: step: 332/530, loss: 0.004486046265810728 2023-01-24 05:45:09.941615: step: 336/530, loss: 0.0007102540112100542 2023-01-24 05:45:10.975297: step: 340/530, loss: 0.009318984113633633 2023-01-24 05:45:12.024366: step: 344/530, loss: 0.0221951212733984 2023-01-24 05:45:13.062258: step: 348/530, loss: 0.011044745333492756 2023-01-24 05:45:14.112404: step: 352/530, loss: 0.00498811574652791 2023-01-24 05:45:15.156204: step: 356/530, loss: 0.005252169445157051 2023-01-24 05:45:16.195863: step: 360/530, loss: 0.0043073296546936035 2023-01-24 05:45:17.244965: step: 364/530, loss: 0.02234904281795025 2023-01-24 05:45:18.310135: step: 368/530, loss: 0.021820997819304466 2023-01-24 05:45:19.367941: step: 372/530, loss: 0.010399678722023964 2023-01-24 05:45:20.402385: step: 376/530, loss: 0.0050969491712749004 2023-01-24 05:45:21.438445: step: 380/530, loss: 0.008448018692433834 2023-01-24 05:45:22.489447: step: 384/530, loss: 0.005333400797098875 2023-01-24 05:45:23.533480: step: 388/530, loss: 0.008766456507146358 2023-01-24 05:45:24.584960: step: 392/530, loss: 0.010591150261461735 2023-01-24 05:45:25.634655: step: 396/530, loss: 0.009006449021399021 2023-01-24 05:45:26.694003: step: 400/530, loss: 0.0032896576449275017 2023-01-24 05:45:27.747131: step: 404/530, loss: 0.021293066442012787 2023-01-24 05:45:28.790470: step: 408/530, loss: 0.05242776498198509 2023-01-24 05:45:29.834526: step: 412/530, loss: 3.434674727031961e-05 2023-01-24 05:45:30.878139: step: 416/530, loss: 0.01999284327030182 2023-01-24 05:45:31.930469: step: 420/530, loss: 0.0074043977074325085 2023-01-24 05:45:32.998009: step: 424/530, loss: 0.13366059958934784 2023-01-24 05:45:34.047946: step: 428/530, loss: 0.023255396634340286 2023-01-24 05:45:35.101642: step: 432/530, loss: 0.0004912642179988325 2023-01-24 05:45:36.151181: step: 436/530, loss: 0.011607680469751358 2023-01-24 05:45:37.217167: step: 440/530, loss: 0.0020752574782818556 2023-01-24 05:45:38.270293: step: 444/530, loss: 0.07099786400794983 2023-01-24 05:45:39.325845: step: 448/530, loss: 0.005907267332077026 2023-01-24 05:45:40.365362: step: 452/530, loss: 0.06996611505746841 2023-01-24 05:45:41.427162: step: 456/530, loss: 0.005881482269614935 2023-01-24 05:45:42.482958: step: 460/530, loss: 0.005062122363597155 2023-01-24 05:45:43.513210: step: 464/530, loss: 0.003372237551957369 2023-01-24 05:45:44.557369: step: 468/530, loss: 0.005257321987301111 2023-01-24 05:45:45.588557: step: 472/530, loss: 0.03172683343291283 2023-01-24 05:45:46.625335: step: 476/530, loss: 0.01225967239588499 2023-01-24 05:45:47.672642: step: 480/530, loss: 0.0013167110737413168 2023-01-24 05:45:48.733709: step: 484/530, loss: 0.003937763627618551 2023-01-24 05:45:49.807232: step: 488/530, loss: 0.007725742179900408 2023-01-24 05:45:50.832452: step: 492/530, loss: 0.006535510998219252 2023-01-24 05:45:51.878145: step: 496/530, loss: 0.017793122678995132 2023-01-24 05:45:52.932987: step: 500/530, loss: 0.022887732833623886 2023-01-24 05:45:53.972280: step: 504/530, loss: 0.005900170188397169 2023-01-24 05:45:55.020567: step: 508/530, loss: 0.008673862554132938 2023-01-24 05:45:56.056179: step: 512/530, loss: 0.037150681018829346 2023-01-24 05:45:57.096236: step: 516/530, loss: 0.013750494457781315 2023-01-24 05:45:58.148473: step: 520/530, loss: 0.010467853397130966 2023-01-24 05:45:59.185024: step: 524/530, loss: 0.0056411041878163815 2023-01-24 05:46:00.231335: step: 528/530, loss: 0.005132163409143686 2023-01-24 05:46:01.278914: step: 532/530, loss: 0.00888803694397211 2023-01-24 05:46:02.326278: step: 536/530, loss: 0.007849623449146748 2023-01-24 05:46:03.408240: step: 540/530, loss: 0.004741653800010681 2023-01-24 05:46:04.448663: step: 544/530, loss: 0.008709482848644257 2023-01-24 05:46:05.498929: step: 548/530, loss: 0.011547000147402287 2023-01-24 05:46:06.544419: step: 552/530, loss: 0.006960046011954546 2023-01-24 05:46:07.580824: step: 556/530, loss: 0.00825323723256588 2023-01-24 05:46:08.629466: step: 560/530, loss: 0.00787415076047182 2023-01-24 05:46:09.675124: step: 564/530, loss: 0.008960647508502007 2023-01-24 05:46:10.703851: step: 568/530, loss: 0.007930672727525234 2023-01-24 05:46:11.755105: step: 572/530, loss: 0.014611798338592052 2023-01-24 05:46:12.792444: step: 576/530, loss: 0.013681265525519848 2023-01-24 05:46:13.834378: step: 580/530, loss: 0.016878889873623848 2023-01-24 05:46:14.889536: step: 584/530, loss: 0.010972322896122932 2023-01-24 05:46:15.943869: step: 588/530, loss: 0.0035258731804788113 2023-01-24 05:46:16.985985: step: 592/530, loss: 0.0016698520630598068 2023-01-24 05:46:18.046560: step: 596/530, loss: 0.0011435960186645389 2023-01-24 05:46:19.097659: step: 600/530, loss: 0.010016154497861862 2023-01-24 05:46:20.148926: step: 604/530, loss: 0.0032938197255134583 2023-01-24 05:46:21.191951: step: 608/530, loss: 0.0033495163079351187 2023-01-24 05:46:22.235456: step: 612/530, loss: 0.014365960843861103 2023-01-24 05:46:23.295762: step: 616/530, loss: 0.0025987266562879086 2023-01-24 05:46:24.356258: step: 620/530, loss: 0.012022805400192738 2023-01-24 05:46:25.411011: step: 624/530, loss: 0.009118536487221718 2023-01-24 05:46:26.464673: step: 628/530, loss: 0.007564467843621969 2023-01-24 05:46:27.507378: step: 632/530, loss: 0.002989412983879447 2023-01-24 05:46:28.562156: step: 636/530, loss: 0.007266636472195387 2023-01-24 05:46:29.597045: step: 640/530, loss: 0.014965740032494068 2023-01-24 05:46:30.621554: step: 644/530, loss: 0.013009588234126568 2023-01-24 05:46:31.656619: step: 648/530, loss: 0.005896244663745165 2023-01-24 05:46:32.676008: step: 652/530, loss: 0.004902588203549385 2023-01-24 05:46:33.728730: step: 656/530, loss: 0.02602233737707138 2023-01-24 05:46:34.774066: step: 660/530, loss: 0.025441834703087807 2023-01-24 05:46:35.821190: step: 664/530, loss: 0.0050089797005057335 2023-01-24 05:46:36.856067: step: 668/530, loss: 0.00533172395080328 2023-01-24 05:46:37.896468: step: 672/530, loss: 0.017497049644589424 2023-01-24 05:46:38.945138: step: 676/530, loss: 0.006845802068710327 2023-01-24 05:46:39.994382: step: 680/530, loss: 0.04576035961508751 2023-01-24 05:46:41.036420: step: 684/530, loss: 0.017015686258673668 2023-01-24 05:46:42.089426: step: 688/530, loss: 0.013764607720077038 2023-01-24 05:46:43.144506: step: 692/530, loss: 0.0059730298817157745 2023-01-24 05:46:44.195407: step: 696/530, loss: 0.016906701028347015 2023-01-24 05:46:45.229348: step: 700/530, loss: 0.011254091747105122 2023-01-24 05:46:46.272040: step: 704/530, loss: 0.04165195673704147 2023-01-24 05:46:47.327510: step: 708/530, loss: 0.008709629997611046 2023-01-24 05:46:48.399170: step: 712/530, loss: 0.003495514625683427 2023-01-24 05:46:49.437594: step: 716/530, loss: 0.013519697822630405 2023-01-24 05:46:50.474262: step: 720/530, loss: 0.00479164207354188 2023-01-24 05:46:51.521921: step: 724/530, loss: 0.023748546838760376 2023-01-24 05:46:52.568147: step: 728/530, loss: 0.003291499335318804 2023-01-24 05:46:53.618613: step: 732/530, loss: 0.0074381339363753796 2023-01-24 05:46:54.654639: step: 736/530, loss: 0.006539748050272465 2023-01-24 05:46:55.709500: step: 740/530, loss: 0.017345279455184937 2023-01-24 05:46:56.748482: step: 744/530, loss: 0.0003344478609506041 2023-01-24 05:46:57.811969: step: 748/530, loss: 0.007867151871323586 2023-01-24 05:46:58.852992: step: 752/530, loss: 0.005007112864404917 2023-01-24 05:46:59.878453: step: 756/530, loss: 0.0016287514008581638 2023-01-24 05:47:00.928559: step: 760/530, loss: 0.09510177373886108 2023-01-24 05:47:01.950009: step: 764/530, loss: 0.005689023062586784 2023-01-24 05:47:02.990661: step: 768/530, loss: 0.012977197766304016 2023-01-24 05:47:04.033558: step: 772/530, loss: 0.03646525740623474 2023-01-24 05:47:05.093855: step: 776/530, loss: 0.003714514896273613 2023-01-24 05:47:06.141725: step: 780/530, loss: 0.0008592036901973188 2023-01-24 05:47:07.203655: step: 784/530, loss: 0.005687682423740625 2023-01-24 05:47:08.245824: step: 788/530, loss: 0.004032238852232695 2023-01-24 05:47:09.298884: step: 792/530, loss: 0.00727576669305563 2023-01-24 05:47:10.333315: step: 796/530, loss: 0.007024645805358887 2023-01-24 05:47:11.367827: step: 800/530, loss: 0.00732702761888504 2023-01-24 05:47:12.413817: step: 804/530, loss: 0.022994497790932655 2023-01-24 05:47:13.457002: step: 808/530, loss: 0.0047180429100990295 2023-01-24 05:47:14.512372: step: 812/530, loss: 0.01518941204994917 2023-01-24 05:47:15.548823: step: 816/530, loss: 0.033338144421577454 2023-01-24 05:47:16.579707: step: 820/530, loss: 0.0 2023-01-24 05:47:17.626844: step: 824/530, loss: 0.010284901596605778 2023-01-24 05:47:18.670061: step: 828/530, loss: 0.010736415162682533 2023-01-24 05:47:19.699528: step: 832/530, loss: 0.009313641116023064 2023-01-24 05:47:20.749905: step: 836/530, loss: 0.0029275002889335155 2023-01-24 05:47:21.806977: step: 840/530, loss: 0.003788512898609042 2023-01-24 05:47:22.840516: step: 844/530, loss: 0.017399154603481293 2023-01-24 05:47:23.896645: step: 848/530, loss: 0.02060185931622982 2023-01-24 05:47:24.974636: step: 852/530, loss: 0.010406752116978168 2023-01-24 05:47:26.010848: step: 856/530, loss: 0.04205852746963501 2023-01-24 05:47:27.042498: step: 860/530, loss: 0.0013028442626819015 2023-01-24 05:47:28.095943: step: 864/530, loss: 0.002421698998659849 2023-01-24 05:47:29.147008: step: 868/530, loss: 0.009311051107943058 2023-01-24 05:47:30.208377: step: 872/530, loss: 0.008731632493436337 2023-01-24 05:47:31.244821: step: 876/530, loss: 0.01109696738421917 2023-01-24 05:47:32.289184: step: 880/530, loss: 0.00536033371463418 2023-01-24 05:47:33.319819: step: 884/530, loss: 0.007589268498122692 2023-01-24 05:47:34.357979: step: 888/530, loss: 0.010429609566926956 2023-01-24 05:47:35.391521: step: 892/530, loss: 0.009333876892924309 2023-01-24 05:47:36.444682: step: 896/530, loss: 0.011744623072445393 2023-01-24 05:47:37.469728: step: 900/530, loss: 0.050074562430381775 2023-01-24 05:47:38.505607: step: 904/530, loss: 0.012248623184859753 2023-01-24 05:47:39.544588: step: 908/530, loss: 0.03647422045469284 2023-01-24 05:47:40.567271: step: 912/530, loss: 0.008958926424384117 2023-01-24 05:47:41.614437: step: 916/530, loss: 0.00616225553676486 2023-01-24 05:47:42.658986: step: 920/530, loss: 0.008525794371962547 2023-01-24 05:47:43.728636: step: 924/530, loss: 0.05312938243150711 2023-01-24 05:47:44.770200: step: 928/530, loss: 0.007054210640490055 2023-01-24 05:47:45.803399: step: 932/530, loss: 0.00624262448400259 2023-01-24 05:47:46.836873: step: 936/530, loss: 0.010174065828323364 2023-01-24 05:47:47.874927: step: 940/530, loss: 0.006507161073386669 2023-01-24 05:47:48.909148: step: 944/530, loss: 0.0018366253934800625 2023-01-24 05:47:49.949229: step: 948/530, loss: 0.005892733111977577 2023-01-24 05:47:51.001334: step: 952/530, loss: 0.017710620537400246 2023-01-24 05:47:52.040365: step: 956/530, loss: 0.0052134995348751545 2023-01-24 05:47:53.069924: step: 960/530, loss: 0.010730620473623276 2023-01-24 05:47:54.112999: step: 964/530, loss: 0.007666897028684616 2023-01-24 05:47:55.159378: step: 968/530, loss: 0.006504003424197435 2023-01-24 05:47:56.212441: step: 972/530, loss: 0.020299887284636497 2023-01-24 05:47:57.242149: step: 976/530, loss: 0.034470751881599426 2023-01-24 05:47:58.302790: step: 980/530, loss: 0.03596094623208046 2023-01-24 05:47:59.358885: step: 984/530, loss: 0.03155870363116264 2023-01-24 05:48:00.405178: step: 988/530, loss: 0.004506540019065142 2023-01-24 05:48:01.438183: step: 992/530, loss: 0.0012982550542801619 2023-01-24 05:48:02.477846: step: 996/530, loss: 0.004639551974833012 2023-01-24 05:48:03.520295: step: 1000/530, loss: 0.007976015098392963 2023-01-24 05:48:04.557205: step: 1004/530, loss: 0.0011813045712187886 2023-01-24 05:48:05.597703: step: 1008/530, loss: 0.035291992127895355 2023-01-24 05:48:06.644055: step: 1012/530, loss: 0.007459714077413082 2023-01-24 05:48:07.698399: step: 1016/530, loss: 0.002157620619982481 2023-01-24 05:48:08.743940: step: 1020/530, loss: 0.02274075336754322 2023-01-24 05:48:09.790697: step: 1024/530, loss: 0.006961097940802574 2023-01-24 05:48:10.845737: step: 1028/530, loss: 0.010232280939817429 2023-01-24 05:48:11.877545: step: 1032/530, loss: 0.04055550694465637 2023-01-24 05:48:12.906672: step: 1036/530, loss: 0.01339031383395195 2023-01-24 05:48:13.947590: step: 1040/530, loss: 0.004634765442460775 2023-01-24 05:48:14.989231: step: 1044/530, loss: 0.006842790171504021 2023-01-24 05:48:16.017180: step: 1048/530, loss: 0.016985837370157242 2023-01-24 05:48:17.046147: step: 1052/530, loss: 0.005740019958466291 2023-01-24 05:48:18.090090: step: 1056/530, loss: 0.005261383019387722 2023-01-24 05:48:19.123996: step: 1060/530, loss: 0.005717601627111435 2023-01-24 05:48:20.148594: step: 1064/530, loss: 0.005638803355395794 2023-01-24 05:48:21.200465: step: 1068/530, loss: 0.01046875212341547 2023-01-24 05:48:22.249667: step: 1072/530, loss: 0.017455007880926132 2023-01-24 05:48:23.285968: step: 1076/530, loss: 0.06218757480382919 2023-01-24 05:48:24.326770: step: 1080/530, loss: 0.005418209824711084 2023-01-24 05:48:25.371593: step: 1084/530, loss: 0.0048764487728476524 2023-01-24 05:48:26.420662: step: 1088/530, loss: 0.003680927213281393 2023-01-24 05:48:27.463545: step: 1092/530, loss: 0.01458392571657896 2023-01-24 05:48:28.500374: step: 1096/530, loss: 0.01482077594846487 2023-01-24 05:48:29.563677: step: 1100/530, loss: 0.009594163857400417 2023-01-24 05:48:30.620014: step: 1104/530, loss: 0.009059345349669456 2023-01-24 05:48:31.659656: step: 1108/530, loss: 0.005022795870900154 2023-01-24 05:48:32.694805: step: 1112/530, loss: 0.03085966967046261 2023-01-24 05:48:33.730454: step: 1116/530, loss: 0.02273603156208992 2023-01-24 05:48:34.783359: step: 1120/530, loss: 0.002015126636251807 2023-01-24 05:48:35.818160: step: 1124/530, loss: 0.004609286785125732 2023-01-24 05:48:36.857752: step: 1128/530, loss: 0.019310960546135902 2023-01-24 05:48:37.899339: step: 1132/530, loss: 0.003627246478572488 2023-01-24 05:48:38.922104: step: 1136/530, loss: 0.04110556095838547 2023-01-24 05:48:39.957759: step: 1140/530, loss: 0.04287181794643402 2023-01-24 05:48:40.992082: step: 1144/530, loss: 0.020180117338895798 2023-01-24 05:48:42.024984: step: 1148/530, loss: 0.007182359229773283 2023-01-24 05:48:43.085762: step: 1152/530, loss: 0.009614327922463417 2023-01-24 05:48:44.133055: step: 1156/530, loss: 0.013087702915072441 2023-01-24 05:48:45.179052: step: 1160/530, loss: 0.005982095841318369 2023-01-24 05:48:46.209648: step: 1164/530, loss: 0.017094234004616737 2023-01-24 05:48:47.267794: step: 1168/530, loss: 0.03535285219550133 2023-01-24 05:48:48.311315: step: 1172/530, loss: 0.005485684610903263 2023-01-24 05:48:49.344021: step: 1176/530, loss: 0.008174329996109009 2023-01-24 05:48:50.380808: step: 1180/530, loss: 0.054272785782814026 2023-01-24 05:48:51.441949: step: 1184/530, loss: 0.0036752077285200357 2023-01-24 05:48:52.488177: step: 1188/530, loss: 0.005187473725527525 2023-01-24 05:48:53.538766: step: 1192/530, loss: 0.009865966625511646 2023-01-24 05:48:54.573432: step: 1196/530, loss: 0.013367796316742897 2023-01-24 05:48:55.601882: step: 1200/530, loss: 0.0031492505222558975 2023-01-24 05:48:56.652467: step: 1204/530, loss: 0.0247766375541687 2023-01-24 05:48:57.700636: step: 1208/530, loss: 0.009023106656968594 2023-01-24 05:48:58.747177: step: 1212/530, loss: 0.017439616844058037 2023-01-24 05:48:59.796670: step: 1216/530, loss: 0.016809113323688507 2023-01-24 05:49:00.841885: step: 1220/530, loss: 0.010281943716108799 2023-01-24 05:49:01.884992: step: 1224/530, loss: 0.010823133401572704 2023-01-24 05:49:02.943128: step: 1228/530, loss: 0.0019613010808825493 2023-01-24 05:49:03.980388: step: 1232/530, loss: 0.01822686567902565 2023-01-24 05:49:05.050932: step: 1236/530, loss: 0.0029462017118930817 2023-01-24 05:49:06.097320: step: 1240/530, loss: 0.020956365391612053 2023-01-24 05:49:07.149067: step: 1244/530, loss: 0.0054284934885799885 2023-01-24 05:49:08.191663: step: 1248/530, loss: 0.012328865006566048 2023-01-24 05:49:09.233134: step: 1252/530, loss: 0.006256837397813797 2023-01-24 05:49:10.280568: step: 1256/530, loss: 0.017065048217773438 2023-01-24 05:49:11.319017: step: 1260/530, loss: 0.028776071965694427 2023-01-24 05:49:12.364654: step: 1264/530, loss: 0.01057056151330471 2023-01-24 05:49:13.410825: step: 1268/530, loss: 0.006096193566918373 2023-01-24 05:49:14.454826: step: 1272/530, loss: 0.008900323882699013 2023-01-24 05:49:15.499050: step: 1276/530, loss: 0.024897761642932892 2023-01-24 05:49:16.540537: step: 1280/530, loss: 0.004362307954579592 2023-01-24 05:49:17.587094: step: 1284/530, loss: 0.017800914123654366 2023-01-24 05:49:18.640831: step: 1288/530, loss: 0.004053147044032812 2023-01-24 05:49:19.729524: step: 1292/530, loss: 0.010714251548051834 2023-01-24 05:49:20.754034: step: 1296/530, loss: 0.003834869246929884 2023-01-24 05:49:21.782671: step: 1300/530, loss: 0.0013706920435652137 2023-01-24 05:49:22.813773: step: 1304/530, loss: 0.0031859204173088074 2023-01-24 05:49:23.853692: step: 1308/530, loss: 0.0012207464314997196 2023-01-24 05:49:24.899405: step: 1312/530, loss: 0.009991885162889957 2023-01-24 05:49:25.939733: step: 1316/530, loss: 0.015509245917201042 2023-01-24 05:49:26.990779: step: 1320/530, loss: 0.019073287025094032 2023-01-24 05:49:28.015997: step: 1324/530, loss: 0.0037361180875450373 2023-01-24 05:49:29.062404: step: 1328/530, loss: 0.006787933874875307 2023-01-24 05:49:30.118401: step: 1332/530, loss: 0.00792840775102377 2023-01-24 05:49:31.161492: step: 1336/530, loss: 0.006871415302157402 2023-01-24 05:49:32.231386: step: 1340/530, loss: 0.0063455612398684025 2023-01-24 05:49:33.294867: step: 1344/530, loss: 0.00801592506468296 2023-01-24 05:49:34.333134: step: 1348/530, loss: 0.005658675916492939 2023-01-24 05:49:35.373392: step: 1352/530, loss: 0.0009868519846349955 2023-01-24 05:49:36.407602: step: 1356/530, loss: 0.0038439419586211443 2023-01-24 05:49:37.447175: step: 1360/530, loss: 0.013685734011232853 2023-01-24 05:49:38.480575: step: 1364/530, loss: 0.008099840953946114 2023-01-24 05:49:39.527600: step: 1368/530, loss: 0.02620629221200943 2023-01-24 05:49:40.577530: step: 1372/530, loss: 0.007384863682091236 2023-01-24 05:49:41.604204: step: 1376/530, loss: 0.007157912943512201 2023-01-24 05:49:42.661065: step: 1380/530, loss: 0.009436335414648056 2023-01-24 05:49:43.700431: step: 1384/530, loss: 0.0024360492825508118 2023-01-24 05:49:44.730733: step: 1388/530, loss: 0.0035571043845266104 2023-01-24 05:49:45.774944: step: 1392/530, loss: 0.003238662611693144 2023-01-24 05:49:46.815570: step: 1396/530, loss: 0.010676134377717972 2023-01-24 05:49:47.851797: step: 1400/530, loss: 0.023820823058485985 2023-01-24 05:49:48.910051: step: 1404/530, loss: 0.007093852385878563 2023-01-24 05:49:49.953028: step: 1408/530, loss: 0.01626482978463173 2023-01-24 05:49:50.994760: step: 1412/530, loss: 0.007416965905576944 2023-01-24 05:49:52.031371: step: 1416/530, loss: 0.008428905159235 2023-01-24 05:49:53.059505: step: 1420/530, loss: 0.006196982692927122 2023-01-24 05:49:54.097893: step: 1424/530, loss: 0.007847960107028484 2023-01-24 05:49:55.158349: step: 1428/530, loss: 0.011245768517255783 2023-01-24 05:49:56.205187: step: 1432/530, loss: 0.009996861219406128 2023-01-24 05:49:57.235270: step: 1436/530, loss: 0.006398098077625036 2023-01-24 05:49:58.262051: step: 1440/530, loss: 0.007841511629521847 2023-01-24 05:49:59.308129: step: 1444/530, loss: 0.01365701574832201 2023-01-24 05:50:00.370514: step: 1448/530, loss: 0.0033150888048112392 2023-01-24 05:50:01.420333: step: 1452/530, loss: 0.006269114091992378 2023-01-24 05:50:02.485379: step: 1456/530, loss: 0.007052919827401638 2023-01-24 05:50:03.534787: step: 1460/530, loss: 0.009731998667120934 2023-01-24 05:50:04.592002: step: 1464/530, loss: 0.003838661126792431 2023-01-24 05:50:05.623583: step: 1468/530, loss: 0.01154538057744503 2023-01-24 05:50:06.654266: step: 1472/530, loss: 0.0013273765798658133 2023-01-24 05:50:07.692643: step: 1476/530, loss: 0.0021753162145614624 2023-01-24 05:50:08.740121: step: 1480/530, loss: 0.0069759986363351345 2023-01-24 05:50:09.798637: step: 1484/530, loss: 0.008999811485409737 2023-01-24 05:50:10.837787: step: 1488/530, loss: 0.0032044530380517244 2023-01-24 05:50:11.883473: step: 1492/530, loss: 0.014354582875967026 2023-01-24 05:50:12.926351: step: 1496/530, loss: 0.006890683434903622 2023-01-24 05:50:13.974754: step: 1500/530, loss: 0.02164403349161148 2023-01-24 05:50:15.015013: step: 1504/530, loss: 0.03095339424908161 2023-01-24 05:50:16.068954: step: 1508/530, loss: 0.0008790783467702568 2023-01-24 05:50:17.105450: step: 1512/530, loss: 0.04674437269568443 2023-01-24 05:50:18.160091: step: 1516/530, loss: 0.101894311606884 2023-01-24 05:50:19.208383: step: 1520/530, loss: 0.0021620166953653097 2023-01-24 05:50:20.262104: step: 1524/530, loss: 0.0021734475158154964 2023-01-24 05:50:21.314912: step: 1528/530, loss: 0.0014497135998681188 2023-01-24 05:50:22.371644: step: 1532/530, loss: 0.010232940316200256 2023-01-24 05:50:23.411129: step: 1536/530, loss: 0.0036849970929324627 2023-01-24 05:50:24.435058: step: 1540/530, loss: 0.0018424472073093057 2023-01-24 05:50:25.481755: step: 1544/530, loss: 0.05146528780460358 2023-01-24 05:50:26.517020: step: 1548/530, loss: 0.0035465096589177847 2023-01-24 05:50:27.559118: step: 1552/530, loss: 0.061646562069654465 2023-01-24 05:50:28.592780: step: 1556/530, loss: 0.0005200144951231778 2023-01-24 05:50:29.650453: step: 1560/530, loss: 0.01526939868927002 2023-01-24 05:50:30.694747: step: 1564/530, loss: 0.027888912707567215 2023-01-24 05:50:31.713916: step: 1568/530, loss: 0.05533529072999954 2023-01-24 05:50:32.756734: step: 1572/530, loss: 0.01628085970878601 2023-01-24 05:50:33.800835: step: 1576/530, loss: 0.00815799180418253 2023-01-24 05:50:34.850779: step: 1580/530, loss: 0.014769169501960278 2023-01-24 05:50:35.912080: step: 1584/530, loss: 0.005658401176333427 2023-01-24 05:50:36.959006: step: 1588/530, loss: 0.015470368787646294 2023-01-24 05:50:37.992818: step: 1592/530, loss: 0.008477414958178997 2023-01-24 05:50:39.042868: step: 1596/530, loss: 0.010669825598597527 2023-01-24 05:50:40.087456: step: 1600/530, loss: 0.009646205231547356 2023-01-24 05:50:41.143421: step: 1604/530, loss: 0.010238900780677795 2023-01-24 05:50:42.182668: step: 1608/530, loss: 0.008970411494374275 2023-01-24 05:50:43.221309: step: 1612/530, loss: 0.02410770393908024 2023-01-24 05:50:44.250199: step: 1616/530, loss: 0.002660715952515602 2023-01-24 05:50:45.302125: step: 1620/530, loss: 0.035264208912849426 2023-01-24 05:50:46.357786: step: 1624/530, loss: 0.040786709636449814 2023-01-24 05:50:47.423796: step: 1628/530, loss: 0.013235140591859818 2023-01-24 05:50:48.482300: step: 1632/530, loss: 0.003664294956251979 2023-01-24 05:50:49.518750: step: 1636/530, loss: 0.010146270506083965 2023-01-24 05:50:50.566339: step: 1640/530, loss: 0.01120872050523758 2023-01-24 05:50:51.611983: step: 1644/530, loss: 0.0021815954241901636 2023-01-24 05:50:52.666271: step: 1648/530, loss: 0.0029521456453949213 2023-01-24 05:50:53.707816: step: 1652/530, loss: 0.0017736885929480195 2023-01-24 05:50:54.739238: step: 1656/530, loss: 0.01834573969244957 2023-01-24 05:50:55.798702: step: 1660/530, loss: 0.011319626122713089 2023-01-24 05:50:56.853048: step: 1664/530, loss: 0.016198961064219475 2023-01-24 05:50:57.902403: step: 1668/530, loss: 0.056787099689245224 2023-01-24 05:50:58.944434: step: 1672/530, loss: 0.045961495488882065 2023-01-24 05:50:59.981222: step: 1676/530, loss: 0.0072120968252420425 2023-01-24 05:51:01.047378: step: 1680/530, loss: 0.023251408711075783 2023-01-24 05:51:02.105183: step: 1684/530, loss: 0.03631749376654625 2023-01-24 05:51:03.150971: step: 1688/530, loss: 0.007739008869975805 2023-01-24 05:51:04.194088: step: 1692/530, loss: 0.011212572455406189 2023-01-24 05:51:05.229839: step: 1696/530, loss: 0.0021334963385015726 2023-01-24 05:51:06.287342: step: 1700/530, loss: 0.00017072352056857198 2023-01-24 05:51:07.349232: step: 1704/530, loss: 0.0054739732295274734 2023-01-24 05:51:08.383397: step: 1708/530, loss: 0.010552710853517056 2023-01-24 05:51:09.434605: step: 1712/530, loss: 0.008474929258227348 2023-01-24 05:51:10.485518: step: 1716/530, loss: 0.13012246787548065 2023-01-24 05:51:11.532472: step: 1720/530, loss: 0.02956259623169899 2023-01-24 05:51:12.576509: step: 1724/530, loss: 0.0059948209673166275 2023-01-24 05:51:13.625030: step: 1728/530, loss: 0.017709113657474518 2023-01-24 05:51:14.675793: step: 1732/530, loss: 0.0005050949403084815 2023-01-24 05:51:15.725954: step: 1736/530, loss: 0.004136632662266493 2023-01-24 05:51:16.792458: step: 1740/530, loss: 0.008426767773926258 2023-01-24 05:51:17.846333: step: 1744/530, loss: 0.016573533415794373 2023-01-24 05:51:18.889049: step: 1748/530, loss: 0.00579869793727994 2023-01-24 05:51:19.928406: step: 1752/530, loss: 0.005031159613281488 2023-01-24 05:51:20.987228: step: 1756/530, loss: 0.003828752087429166 2023-01-24 05:51:22.043914: step: 1760/530, loss: 0.010850084945559502 2023-01-24 05:51:23.090864: step: 1764/530, loss: 0.010462482459843159 2023-01-24 05:51:24.140438: step: 1768/530, loss: 0.005388755816966295 2023-01-24 05:51:25.168050: step: 1772/530, loss: 0.005045648198574781 2023-01-24 05:51:26.210488: step: 1776/530, loss: 0.03065331280231476 2023-01-24 05:51:27.265299: step: 1780/530, loss: 0.015230027958750725 2023-01-24 05:51:28.300585: step: 1784/530, loss: 0.009330620057880878 2023-01-24 05:51:29.356149: step: 1788/530, loss: 0.01424208004027605 2023-01-24 05:51:30.391476: step: 1792/530, loss: 0.0177735835313797 2023-01-24 05:51:31.421406: step: 1796/530, loss: 0.0021712735760957003 2023-01-24 05:51:32.466304: step: 1800/530, loss: 0.02098984457552433 2023-01-24 05:51:33.512218: step: 1804/530, loss: 0.007077093701809645 2023-01-24 05:51:34.578384: step: 1808/530, loss: 0.014779459685087204 2023-01-24 05:51:35.616827: step: 1812/530, loss: 0.009713179431855679 2023-01-24 05:51:36.650396: step: 1816/530, loss: 0.007239634171128273 2023-01-24 05:51:37.692211: step: 1820/530, loss: 0.016949862241744995 2023-01-24 05:51:38.742440: step: 1824/530, loss: 0.006182401441037655 2023-01-24 05:51:39.792853: step: 1828/530, loss: 0.00745818205177784 2023-01-24 05:51:40.824065: step: 1832/530, loss: 0.005689422599971294 2023-01-24 05:51:41.874158: step: 1836/530, loss: 0.013964063487946987 2023-01-24 05:51:42.916804: step: 1840/530, loss: 0.013131942600011826 2023-01-24 05:51:43.967549: step: 1844/530, loss: 0.08743832260370255 2023-01-24 05:51:44.994385: step: 1848/530, loss: 0.04414644464850426 2023-01-24 05:51:46.055374: step: 1852/530, loss: 0.026749644428491592 2023-01-24 05:51:47.088182: step: 1856/530, loss: 0.009580439887940884 2023-01-24 05:51:48.135280: step: 1860/530, loss: 0.005677979905158281 2023-01-24 05:51:49.182842: step: 1864/530, loss: 0.03229353204369545 2023-01-24 05:51:50.219683: step: 1868/530, loss: 0.04599224776029587 2023-01-24 05:51:51.244472: step: 1872/530, loss: 0.011477844789624214 2023-01-24 05:51:52.298045: step: 1876/530, loss: 0.009884202852845192 2023-01-24 05:51:53.348131: step: 1880/530, loss: 0.05241717770695686 2023-01-24 05:51:54.413494: step: 1884/530, loss: 0.010632255114614964 2023-01-24 05:51:55.453053: step: 1888/530, loss: 0.024795083329081535 2023-01-24 05:51:56.478909: step: 1892/530, loss: 0.026442566886544228 2023-01-24 05:51:57.525766: step: 1896/530, loss: 0.01335377898067236 2023-01-24 05:51:58.553411: step: 1900/530, loss: 0.008220052346587181 2023-01-24 05:51:59.600086: step: 1904/530, loss: 0.0382801778614521 2023-01-24 05:52:00.647117: step: 1908/530, loss: 0.021652933210134506 2023-01-24 05:52:01.724312: step: 1912/530, loss: 0.007596184033900499 2023-01-24 05:52:02.787326: step: 1916/530, loss: 0.022892331704497337 2023-01-24 05:52:03.810633: step: 1920/530, loss: 0.02290131151676178 2023-01-24 05:52:04.848482: step: 1924/530, loss: 0.009573090821504593 2023-01-24 05:52:05.888181: step: 1928/530, loss: 0.01821368932723999 2023-01-24 05:52:06.941822: step: 1932/530, loss: 0.006589924450963736 2023-01-24 05:52:07.993193: step: 1936/530, loss: 0.009054798632860184 2023-01-24 05:52:09.047873: step: 1940/530, loss: 0.008845238015055656 2023-01-24 05:52:10.085817: step: 1944/530, loss: 0.012344438582658768 2023-01-24 05:52:11.126110: step: 1948/530, loss: 0.0037157577462494373 2023-01-24 05:52:12.184869: step: 1952/530, loss: 0.04312935099005699 2023-01-24 05:52:13.213408: step: 1956/530, loss: 0.011651946231722832 2023-01-24 05:52:14.245839: step: 1960/530, loss: 0.008804849348962307 2023-01-24 05:52:15.292987: step: 1964/530, loss: 0.006081140600144863 2023-01-24 05:52:16.330315: step: 1968/530, loss: 0.01485342625528574 2023-01-24 05:52:17.383858: step: 1972/530, loss: 0.05511125922203064 2023-01-24 05:52:18.419523: step: 1976/530, loss: 0.0005198437720537186 2023-01-24 05:52:19.465853: step: 1980/530, loss: 0.012522531673312187 2023-01-24 05:52:20.510243: step: 1984/530, loss: 0.005106591619551182 2023-01-24 05:52:21.556027: step: 1988/530, loss: 0.011177177540957928 2023-01-24 05:52:22.611669: step: 1992/530, loss: 0.10730155557394028 2023-01-24 05:52:23.661401: step: 1996/530, loss: 0.0010632263729348779 2023-01-24 05:52:24.725682: step: 2000/530, loss: 0.01684959977865219 2023-01-24 05:52:25.787084: step: 2004/530, loss: 0.009729632176458836 2023-01-24 05:52:26.832928: step: 2008/530, loss: 0.0021659997291862965 2023-01-24 05:52:27.867572: step: 2012/530, loss: 0.0 2023-01-24 05:52:28.916457: step: 2016/530, loss: 0.006851190701127052 2023-01-24 05:52:29.954817: step: 2020/530, loss: 0.008856294676661491 2023-01-24 05:52:30.995366: step: 2024/530, loss: 0.035453442484140396 2023-01-24 05:52:32.045856: step: 2028/530, loss: 0.004786839243024588 2023-01-24 05:52:33.082914: step: 2032/530, loss: 0.004009741358458996 2023-01-24 05:52:34.122389: step: 2036/530, loss: 0.0008362511289305985 2023-01-24 05:52:35.158096: step: 2040/530, loss: 0.006732499692589045 2023-01-24 05:52:36.217977: step: 2044/530, loss: 0.0007510983268730342 2023-01-24 05:52:37.259233: step: 2048/530, loss: 0.0034757957328110933 2023-01-24 05:52:38.295920: step: 2052/530, loss: 0.03197331726551056 2023-01-24 05:52:39.341481: step: 2056/530, loss: 0.020527182146906853 2023-01-24 05:52:40.381073: step: 2060/530, loss: 0.014108306728303432 2023-01-24 05:52:41.421843: step: 2064/530, loss: 0.00789572298526764 2023-01-24 05:52:42.448167: step: 2068/530, loss: 0.005245354492217302 2023-01-24 05:52:43.472731: step: 2072/530, loss: 0.02112613432109356 2023-01-24 05:52:44.526438: step: 2076/530, loss: 0.018814364448189735 2023-01-24 05:52:45.578121: step: 2080/530, loss: 0.02076384611427784 2023-01-24 05:52:46.646299: step: 2084/530, loss: 0.0627404972910881 2023-01-24 05:52:47.685785: step: 2088/530, loss: 0.005093692801892757 2023-01-24 05:52:48.745168: step: 2092/530, loss: 0.0432882159948349 2023-01-24 05:52:49.790819: step: 2096/530, loss: 0.035880811512470245 2023-01-24 05:52:50.838722: step: 2100/530, loss: 0.00565405422821641 2023-01-24 05:52:51.874465: step: 2104/530, loss: 0.051265835762023926 2023-01-24 05:52:52.909303: step: 2108/530, loss: 0.0059537808410823345 2023-01-24 05:52:53.948787: step: 2112/530, loss: 0.006259667221456766 2023-01-24 05:52:54.983533: step: 2116/530, loss: 0.0066326819360256195 2023-01-24 05:52:56.024403: step: 2120/530, loss: 0.026345986872911453 ================================================== Loss: 0.015 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.36950383771929823, 'r': 0.319722485768501, 'f1': 0.3428153611393693}, 'combined': 0.2526007924184826, 'stategy': 1, 'epoch': 4} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37742601309099055, 'r': 0.3923426661819029, 'f1': 0.38473981145192454}, 'combined': 0.2982193753837884, 'stategy': 1, 'epoch': 4} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3811305607769424, 'r': 0.32978280021686096, 'f1': 0.3536023107106525}, 'combined': 0.26054907104995445, 'stategy': 1, 'epoch': 4} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36785471839114864, 'r': 0.36616420957501283, 'f1': 0.36700751728937253}, 'combined': 0.2844747263199921, 'stategy': 1, 'epoch': 4} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3753322107351712, 'r': 0.3290388640600552, 'f1': 0.35066426968584247}, 'combined': 0.2583841987158839, 'stategy': 1, 'epoch': 4} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3599395568707655, 'r': 0.3609320372665489, 'f1': 0.360435113855902}, 'combined': 0.27938032748639297, 'stategy': 1, 'epoch': 4} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 4} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.475, 'r': 0.41304347826086957, 'f1': 0.44186046511627913}, 'combined': 0.22093023255813957, 'stategy': 1, 'epoch': 4} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 4} New best chinese model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.36950383771929823, 'r': 0.319722485768501, 'f1': 0.3428153611393693}, 'combined': 0.2526007924184826, 'stategy': 1, 'epoch': 4} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37742601309099055, 'r': 0.3923426661819029, 'f1': 0.38473981145192454}, 'combined': 0.2982193753837884, 'stategy': 1, 'epoch': 4} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 4} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38236684276980326, 'r': 0.33520584698225636, 'f1': 0.35723656493356754}, 'combined': 0.2632269425826287, 'stategy': 1, 'epoch': 1} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3561820350737081, 'r': 0.35978314020772534, 'f1': 0.35797353136351645}, 'combined': 0.27747230660712763, 'stategy': 1, 'epoch': 1} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 1} ****************************** Epoch: 5 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 05:55:29.472245: step: 4/530, loss: 0.005588268395513296 2023-01-24 05:55:30.498800: step: 8/530, loss: 0.06199086457490921 2023-01-24 05:55:31.531975: step: 12/530, loss: 0.008542483672499657 2023-01-24 05:55:32.572037: step: 16/530, loss: 0.012168132700026035 2023-01-24 05:55:33.632978: step: 20/530, loss: 0.00337317306548357 2023-01-24 05:55:34.684379: step: 24/530, loss: 0.0333375446498394 2023-01-24 05:55:35.712397: step: 28/530, loss: 0.007256587501615286 2023-01-24 05:55:36.745216: step: 32/530, loss: 0.00467006815597415 2023-01-24 05:55:37.779795: step: 36/530, loss: 0.020394522696733475 2023-01-24 05:55:38.815334: step: 40/530, loss: 0.00021476308756973594 2023-01-24 05:55:39.863666: step: 44/530, loss: 0.003353406907990575 2023-01-24 05:55:40.899360: step: 48/530, loss: 0.005317258648574352 2023-01-24 05:55:41.927516: step: 52/530, loss: 0.00396682508289814 2023-01-24 05:55:42.971935: step: 56/530, loss: 0.0380081981420517 2023-01-24 05:55:44.011897: step: 60/530, loss: 0.011497588828206062 2023-01-24 05:55:45.059260: step: 64/530, loss: 0.07676336914300919 2023-01-24 05:55:46.103537: step: 68/530, loss: 0.002930128015577793 2023-01-24 05:55:47.137283: step: 72/530, loss: 0.0007320598815567791 2023-01-24 05:55:48.163127: step: 76/530, loss: 0.002627731766551733 2023-01-24 05:55:49.208690: step: 80/530, loss: 0.009351525455713272 2023-01-24 05:55:50.249320: step: 84/530, loss: 0.05400629714131355 2023-01-24 05:55:51.308095: step: 88/530, loss: 0.006733783986419439 2023-01-24 05:55:52.351012: step: 92/530, loss: 0.00025184068363159895 2023-01-24 05:55:53.396419: step: 96/530, loss: 0.003704732283949852 2023-01-24 05:55:54.440244: step: 100/530, loss: 0.012821323238313198 2023-01-24 05:55:55.477931: step: 104/530, loss: 0.021979887038469315 2023-01-24 05:55:56.519897: step: 108/530, loss: 0.1744893342256546 2023-01-24 05:55:57.549720: step: 112/530, loss: 0.010326141491532326 2023-01-24 05:55:58.585010: step: 116/530, loss: 0.001342359697446227 2023-01-24 05:55:59.624951: step: 120/530, loss: 0.00981202907860279 2023-01-24 05:56:00.656203: step: 124/530, loss: 0.009443918243050575 2023-01-24 05:56:01.702093: step: 128/530, loss: 0.004539586137980223 2023-01-24 05:56:02.738198: step: 132/530, loss: 0.003658464876934886 2023-01-24 05:56:03.771944: step: 136/530, loss: 0.012751545757055283 2023-01-24 05:56:04.825231: step: 140/530, loss: 0.01059018261730671 2023-01-24 05:56:05.877445: step: 144/530, loss: 0.008634681813418865 2023-01-24 05:56:06.899520: step: 148/530, loss: 0.004486961755901575 2023-01-24 05:56:07.940139: step: 152/530, loss: 0.0006435240502469242 2023-01-24 05:56:08.972877: step: 156/530, loss: 0.005888973828405142 2023-01-24 05:56:09.998468: step: 160/530, loss: 0.009699084796011448 2023-01-24 05:56:11.064041: step: 164/530, loss: 0.007755785249173641 2023-01-24 05:56:12.102945: step: 168/530, loss: 0.0071268281899392605 2023-01-24 05:56:13.144225: step: 172/530, loss: 0.024319598451256752 2023-01-24 05:56:14.186602: step: 176/530, loss: 0.01250580232590437 2023-01-24 05:56:15.238800: step: 180/530, loss: 0.010109507478773594 2023-01-24 05:56:16.282831: step: 184/530, loss: 0.009292527101933956 2023-01-24 05:56:17.315911: step: 188/530, loss: 0.007427418604493141 2023-01-24 05:56:18.344067: step: 192/530, loss: 0.0013856547884643078 2023-01-24 05:56:19.393404: step: 196/530, loss: 0.018948283046483994 2023-01-24 05:56:20.423025: step: 200/530, loss: 0.01557439286261797 2023-01-24 05:56:21.448630: step: 204/530, loss: 0.007975871674716473 2023-01-24 05:56:22.488281: step: 208/530, loss: 0.004301536828279495 2023-01-24 05:56:23.525867: step: 212/530, loss: 0.009251746349036694 2023-01-24 05:56:24.557162: step: 216/530, loss: 0.0 2023-01-24 05:56:25.616326: step: 220/530, loss: 0.0011706381337717175 2023-01-24 05:56:26.654598: step: 224/530, loss: 0.009251845069229603 2023-01-24 05:56:27.701079: step: 228/530, loss: 0.038894303143024445 2023-01-24 05:56:28.737619: step: 232/530, loss: 0.00913916900753975 2023-01-24 05:56:29.771539: step: 236/530, loss: 0.001993473619222641 2023-01-24 05:56:30.815453: step: 240/530, loss: 0.025272438302636147 2023-01-24 05:56:31.850372: step: 244/530, loss: 0.012085416354238987 2023-01-24 05:56:32.890700: step: 248/530, loss: 0.07184196263551712 2023-01-24 05:56:33.954732: step: 252/530, loss: 0.00636153481900692 2023-01-24 05:56:34.999190: step: 256/530, loss: 0.013592966832220554 2023-01-24 05:56:36.064309: step: 260/530, loss: 0.0817423090338707 2023-01-24 05:56:37.142653: step: 264/530, loss: 0.0049986811354756355 2023-01-24 05:56:38.204843: step: 268/530, loss: 0.0133290383964777 2023-01-24 05:56:39.244899: step: 272/530, loss: 0.010724496096372604 2023-01-24 05:56:40.298433: step: 276/530, loss: 0.006141698453575373 2023-01-24 05:56:41.355742: step: 280/530, loss: 0.02279144525527954 2023-01-24 05:56:42.415062: step: 284/530, loss: 0.02106567658483982 2023-01-24 05:56:43.475750: step: 288/530, loss: 0.0033782399259507656 2023-01-24 05:56:44.531332: step: 292/530, loss: 0.002073576208204031 2023-01-24 05:56:45.585651: step: 296/530, loss: 0.017554903402924538 2023-01-24 05:56:46.643075: step: 300/530, loss: 0.002421154174953699 2023-01-24 05:56:47.681472: step: 304/530, loss: 0.008731690235435963 2023-01-24 05:56:48.742715: step: 308/530, loss: 0.005585075821727514 2023-01-24 05:56:49.809321: step: 312/530, loss: 0.007909399457275867 2023-01-24 05:56:50.852714: step: 316/530, loss: 0.01444508507847786 2023-01-24 05:56:51.888975: step: 320/530, loss: 0.0014222756726667285 2023-01-24 05:56:52.922989: step: 324/530, loss: 0.0058175381273031235 2023-01-24 05:56:53.993722: step: 328/530, loss: 0.008278501220047474 2023-01-24 05:56:55.024921: step: 332/530, loss: 0.006105876062065363 2023-01-24 05:56:56.064496: step: 336/530, loss: 0.014510361477732658 2023-01-24 05:56:57.151069: step: 340/530, loss: 0.009033264592289925 2023-01-24 05:56:58.211445: step: 344/530, loss: 0.016659408807754517 2023-01-24 05:56:59.264020: step: 348/530, loss: 0.014676532708108425 2023-01-24 05:57:00.308491: step: 352/530, loss: 0.01533645112067461 2023-01-24 05:57:01.362469: step: 356/530, loss: 0.005074299406260252 2023-01-24 05:57:02.419330: step: 360/530, loss: 0.008287280797958374 2023-01-24 05:57:03.478516: step: 364/530, loss: 0.007156094536185265 2023-01-24 05:57:04.524105: step: 368/530, loss: 0.0060427263379096985 2023-01-24 05:57:05.582539: step: 372/530, loss: 0.00333373062312603 2023-01-24 05:57:06.624384: step: 376/530, loss: 0.03617725521326065 2023-01-24 05:57:07.690420: step: 380/530, loss: 0.06736189126968384 2023-01-24 05:57:08.745799: step: 384/530, loss: 0.01101057231426239 2023-01-24 05:57:09.799784: step: 388/530, loss: 0.005865860264748335 2023-01-24 05:57:10.865675: step: 392/530, loss: 0.019206885248422623 2023-01-24 05:57:11.912665: step: 396/530, loss: 0.027501532807946205 2023-01-24 05:57:12.952062: step: 400/530, loss: 0.004797319415956736 2023-01-24 05:57:13.996989: step: 404/530, loss: 0.027632728219032288 2023-01-24 05:57:15.046639: step: 408/530, loss: 0.005168435163795948 2023-01-24 05:57:16.076644: step: 412/530, loss: 0.0024470994248986244 2023-01-24 05:57:17.138955: step: 416/530, loss: 0.008314166218042374 2023-01-24 05:57:18.184676: step: 420/530, loss: 0.011156322434544563 2023-01-24 05:57:19.230047: step: 424/530, loss: 0.00198349473066628 2023-01-24 05:57:20.288193: step: 428/530, loss: 0.013873168267309666 2023-01-24 05:57:21.339940: step: 432/530, loss: 0.002291059121489525 2023-01-24 05:57:22.395873: step: 436/530, loss: 0.0072277989238500595 2023-01-24 05:57:23.447039: step: 440/530, loss: 0.004856232553720474 2023-01-24 05:57:24.494314: step: 444/530, loss: 0.005774457938969135 2023-01-24 05:57:25.551228: step: 448/530, loss: 0.006547051481902599 2023-01-24 05:57:26.599760: step: 452/530, loss: 0.01283668540418148 2023-01-24 05:57:27.659734: step: 456/530, loss: 0.02289484441280365 2023-01-24 05:57:28.707980: step: 460/530, loss: 0.014524105936288834 2023-01-24 05:57:29.750960: step: 464/530, loss: 0.01727128215134144 2023-01-24 05:57:30.811076: step: 468/530, loss: 0.007598747964948416 2023-01-24 05:57:31.856592: step: 472/530, loss: 0.043174732476472855 2023-01-24 05:57:32.928037: step: 476/530, loss: 0.018201831728219986 2023-01-24 05:57:33.978651: step: 480/530, loss: 0.007098087575286627 2023-01-24 05:57:35.020688: step: 484/530, loss: 0.004643871448934078 2023-01-24 05:57:36.073006: step: 488/530, loss: 0.022589458152651787 2023-01-24 05:57:37.116041: step: 492/530, loss: 0.01867409609258175 2023-01-24 05:57:38.163169: step: 496/530, loss: 0.003510940819978714 2023-01-24 05:57:39.208136: step: 500/530, loss: 0.0043696747161448 2023-01-24 05:57:40.255561: step: 504/530, loss: 0.007139483001083136 2023-01-24 05:57:41.330757: step: 508/530, loss: 0.006248056888580322 2023-01-24 05:57:42.376154: step: 512/530, loss: 0.006899184547364712 2023-01-24 05:57:43.419915: step: 516/530, loss: 0.008954247459769249 2023-01-24 05:57:44.468803: step: 520/530, loss: 0.03826233372092247 2023-01-24 05:57:45.509071: step: 524/530, loss: 0.004296408034861088 2023-01-24 05:57:46.540255: step: 528/530, loss: 0.026388704776763916 2023-01-24 05:57:47.582691: step: 532/530, loss: 0.007237255573272705 2023-01-24 05:57:48.637013: step: 536/530, loss: 0.012714683078229427 2023-01-24 05:57:49.692827: step: 540/530, loss: 0.009270096197724342 2023-01-24 05:57:50.754444: step: 544/530, loss: 0.010957039892673492 2023-01-24 05:57:51.813002: step: 548/530, loss: 0.046413011848926544 2023-01-24 05:57:52.855141: step: 552/530, loss: 0.0012702905805781484 2023-01-24 05:57:53.913327: step: 556/530, loss: 0.01454729214310646 2023-01-24 05:57:54.955889: step: 560/530, loss: 0.0012946755159646273 2023-01-24 05:57:55.998459: step: 564/530, loss: 0.004580217879265547 2023-01-24 05:57:57.036575: step: 568/530, loss: 0.007749276235699654 2023-01-24 05:57:58.072541: step: 572/530, loss: 0.0048573557287454605 2023-01-24 05:57:59.112697: step: 576/530, loss: 0.00838461983948946 2023-01-24 05:58:00.138308: step: 580/530, loss: 4.731139415525831e-05 2023-01-24 05:58:01.176541: step: 584/530, loss: 0.008801799267530441 2023-01-24 05:58:02.220973: step: 588/530, loss: 0.005033318884670734 2023-01-24 05:58:03.258910: step: 592/530, loss: 0.006699038669466972 2023-01-24 05:58:04.300428: step: 596/530, loss: 0.010545856319367886 2023-01-24 05:58:05.348345: step: 600/530, loss: 0.009249220602214336 2023-01-24 05:58:06.385607: step: 604/530, loss: 0.005822946783155203 2023-01-24 05:58:07.416649: step: 608/530, loss: 0.004310784861445427 2023-01-24 05:58:08.462183: step: 612/530, loss: 1.7877981008496135e-05 2023-01-24 05:58:09.497175: step: 616/530, loss: 0.0038097696378827095 2023-01-24 05:58:10.551758: step: 620/530, loss: 0.005796156357973814 2023-01-24 05:58:11.620972: step: 624/530, loss: 0.006661856546998024 2023-01-24 05:58:12.689910: step: 628/530, loss: 0.0018134411657229066 2023-01-24 05:58:13.742411: step: 632/530, loss: 0.004046429414302111 2023-01-24 05:58:14.777514: step: 636/530, loss: 0.021363284438848495 2023-01-24 05:58:15.833222: step: 640/530, loss: 0.011556833051145077 2023-01-24 05:58:16.889809: step: 644/530, loss: 0.012669372372329235 2023-01-24 05:58:17.948841: step: 648/530, loss: 0.01908951997756958 2023-01-24 05:58:18.980295: step: 652/530, loss: 0.003526262938976288 2023-01-24 05:58:20.024879: step: 656/530, loss: 0.009629894979298115 2023-01-24 05:58:21.057911: step: 660/530, loss: 0.0016331829829141498 2023-01-24 05:58:22.105579: step: 664/530, loss: 0.01964084431529045 2023-01-24 05:58:23.142974: step: 668/530, loss: 0.004161123652011156 2023-01-24 05:58:24.175558: step: 672/530, loss: 0.011294153518974781 2023-01-24 05:58:25.207221: step: 676/530, loss: 0.0018205394735559821 2023-01-24 05:58:26.241056: step: 680/530, loss: 0.007117633707821369 2023-01-24 05:58:27.301186: step: 684/530, loss: 0.010359746403992176 2023-01-24 05:58:28.330271: step: 688/530, loss: 0.006559242028743029 2023-01-24 05:58:29.361949: step: 692/530, loss: 0.00043034047121182084 2023-01-24 05:58:30.417405: step: 696/530, loss: 0.0070377835072577 2023-01-24 05:58:31.457942: step: 700/530, loss: 0.003006778424605727 2023-01-24 05:58:32.517067: step: 704/530, loss: 0.021097030490636826 2023-01-24 05:58:33.560887: step: 708/530, loss: 0.005191988777369261 2023-01-24 05:58:34.599191: step: 712/530, loss: 0.005960002541542053 2023-01-24 05:58:35.639418: step: 716/530, loss: 0.006902558263391256 2023-01-24 05:58:36.694733: step: 720/530, loss: 0.010176354087889194 2023-01-24 05:58:37.730010: step: 724/530, loss: 0.002411438850685954 2023-01-24 05:58:38.796578: step: 728/530, loss: 0.004508199170231819 2023-01-24 05:58:39.834616: step: 732/530, loss: 0.006601941771805286 2023-01-24 05:58:40.892977: step: 736/530, loss: 0.006622927263379097 2023-01-24 05:58:41.957320: step: 740/530, loss: 0.01019946951419115 2023-01-24 05:58:42.986211: step: 744/530, loss: 0.001228116569109261 2023-01-24 05:58:44.044065: step: 748/530, loss: 0.00554271275177598 2023-01-24 05:58:45.084522: step: 752/530, loss: 0.006356098689138889 2023-01-24 05:58:46.128422: step: 756/530, loss: 0.009608251973986626 2023-01-24 05:58:47.167946: step: 760/530, loss: 0.009014172479510307 2023-01-24 05:58:48.199472: step: 764/530, loss: 0.005637074820697308 2023-01-24 05:58:49.234040: step: 768/530, loss: 0.014369937591254711 2023-01-24 05:58:50.271990: step: 772/530, loss: 0.008542876690626144 2023-01-24 05:58:51.323742: step: 776/530, loss: 0.009192418307065964 2023-01-24 05:58:52.361908: step: 780/530, loss: 0.0009707133867777884 2023-01-24 05:58:53.398099: step: 784/530, loss: 0.005935297347605228 2023-01-24 05:58:54.458474: step: 788/530, loss: 0.013970510102808475 2023-01-24 05:58:55.511222: step: 792/530, loss: 0.024999402463436127 2023-01-24 05:58:56.553646: step: 796/530, loss: 0.004415830131620169 2023-01-24 05:58:57.605115: step: 800/530, loss: 0.01320775505155325 2023-01-24 05:58:58.653431: step: 804/530, loss: 0.00629342021420598 2023-01-24 05:58:59.707127: step: 808/530, loss: 0.00999950710684061 2023-01-24 05:59:00.761371: step: 812/530, loss: 0.010659722611308098 2023-01-24 05:59:01.801683: step: 816/530, loss: 0.008501281030476093 2023-01-24 05:59:02.845642: step: 820/530, loss: 0.0007197453523986042 2023-01-24 05:59:03.899412: step: 824/530, loss: 0.01655275747179985 2023-01-24 05:59:04.924235: step: 828/530, loss: 5.6251541536767036e-05 2023-01-24 05:59:05.977344: step: 832/530, loss: 0.0009268919238820672 2023-01-24 05:59:07.041407: step: 836/530, loss: 0.004103783052414656 2023-01-24 05:59:08.087464: step: 840/530, loss: 0.004988683853298426 2023-01-24 05:59:09.120114: step: 844/530, loss: 0.012605680152773857 2023-01-24 05:59:10.162587: step: 848/530, loss: 0.006974476855248213 2023-01-24 05:59:11.206446: step: 852/530, loss: 0.005091514904052019 2023-01-24 05:59:12.259415: step: 856/530, loss: 0.0014694997807964683 2023-01-24 05:59:13.309091: step: 860/530, loss: 0.0010220871772617102 2023-01-24 05:59:14.376467: step: 864/530, loss: 0.001836717943660915 2023-01-24 05:59:15.435595: step: 868/530, loss: 0.005687267053872347 2023-01-24 05:59:16.494621: step: 872/530, loss: 0.004915875382721424 2023-01-24 05:59:17.544266: step: 876/530, loss: 0.019141381606459618 2023-01-24 05:59:18.580396: step: 880/530, loss: 1.2647478797589429e-05 2023-01-24 05:59:19.618478: step: 884/530, loss: 0.022044172510504723 2023-01-24 05:59:20.662534: step: 888/530, loss: 0.010193722322583199 2023-01-24 05:59:21.712991: step: 892/530, loss: 0.00859873741865158 2023-01-24 05:59:22.741303: step: 896/530, loss: 0.02680361270904541 2023-01-24 05:59:23.769393: step: 900/530, loss: 0.0014909657184034586 2023-01-24 05:59:24.805922: step: 904/530, loss: 0.017367621883749962 2023-01-24 05:59:25.848754: step: 908/530, loss: 0.005413647275418043 2023-01-24 05:59:26.896824: step: 912/530, loss: 0.01309147384017706 2023-01-24 05:59:27.970056: step: 916/530, loss: 0.010298328474164009 2023-01-24 05:59:29.007042: step: 920/530, loss: 0.0014911723555997014 2023-01-24 05:59:30.035455: step: 924/530, loss: 0.00562900910153985 2023-01-24 05:59:31.084664: step: 928/530, loss: 0.00012551721010822803 2023-01-24 05:59:32.123863: step: 932/530, loss: 0.016936399042606354 2023-01-24 05:59:33.178741: step: 936/530, loss: 0.017997879534959793 2023-01-24 05:59:34.231533: step: 940/530, loss: 0.011630039662122726 2023-01-24 05:59:35.264558: step: 944/530, loss: 0.004711678251624107 2023-01-24 05:59:36.317921: step: 948/530, loss: 0.008336941711604595 2023-01-24 05:59:37.368256: step: 952/530, loss: 0.02768378145992756 2023-01-24 05:59:38.407939: step: 956/530, loss: 0.016323048621416092 2023-01-24 05:59:39.457117: step: 960/530, loss: 0.014767490327358246 2023-01-24 05:59:40.497629: step: 964/530, loss: 0.017576850950717926 2023-01-24 05:59:41.559412: step: 968/530, loss: 0.0017638560384511948 2023-01-24 05:59:42.635159: step: 972/530, loss: 0.03149247169494629 2023-01-24 05:59:43.684222: step: 976/530, loss: 0.08389350771903992 2023-01-24 05:59:44.766063: step: 980/530, loss: 0.012167435139417648 2023-01-24 05:59:45.803084: step: 984/530, loss: 0.01404179260134697 2023-01-24 05:59:46.848844: step: 988/530, loss: 0.003598138689994812 2023-01-24 05:59:47.888362: step: 992/530, loss: 0.007787288166582584 2023-01-24 05:59:48.934329: step: 996/530, loss: 0.04942134767770767 2023-01-24 05:59:49.992121: step: 1000/530, loss: 0.037217091768980026 2023-01-24 05:59:51.045652: step: 1004/530, loss: 0.00025469358661212027 2023-01-24 05:59:52.096425: step: 1008/530, loss: 0.011966563761234283 2023-01-24 05:59:53.150572: step: 1012/530, loss: 0.0011575728422030807 2023-01-24 05:59:54.189613: step: 1016/530, loss: 0.04056147113442421 2023-01-24 05:59:55.242727: step: 1020/530, loss: 0.0110407043248415 2023-01-24 05:59:56.272746: step: 1024/530, loss: 0.01687813177704811 2023-01-24 05:59:57.336754: step: 1028/530, loss: 0.028553498908877373 2023-01-24 05:59:58.400888: step: 1032/530, loss: 0.008772153407335281 2023-01-24 05:59:59.458419: step: 1036/530, loss: 0.02754429168999195 2023-01-24 06:00:00.502106: step: 1040/530, loss: 0.012440082617104053 2023-01-24 06:00:01.558751: step: 1044/530, loss: 0.013174206018447876 2023-01-24 06:00:02.600955: step: 1048/530, loss: 0.01911246031522751 2023-01-24 06:00:03.650633: step: 1052/530, loss: 0.0011527083115652204 2023-01-24 06:00:04.695665: step: 1056/530, loss: 0.016724998131394386 2023-01-24 06:00:05.746947: step: 1060/530, loss: 0.005059492774307728 2023-01-24 06:00:06.783165: step: 1064/530, loss: 0.005888041108846664 2023-01-24 06:00:07.824641: step: 1068/530, loss: 0.011758263222873211 2023-01-24 06:00:08.877048: step: 1072/530, loss: 6.988779932726175e-05 2023-01-24 06:00:09.913529: step: 1076/530, loss: 0.012905214913189411 2023-01-24 06:00:10.963547: step: 1080/530, loss: 0.004845108836889267 2023-01-24 06:00:12.014739: step: 1084/530, loss: 0.002205712255090475 2023-01-24 06:00:13.043351: step: 1088/530, loss: 0.0022706834133714437 2023-01-24 06:00:14.083654: step: 1092/530, loss: 0.015068558044731617 2023-01-24 06:00:15.113560: step: 1096/530, loss: 0.054232239723205566 2023-01-24 06:00:16.163974: step: 1100/530, loss: 0.004397891461849213 2023-01-24 06:00:17.214907: step: 1104/530, loss: 0.008655865676701069 2023-01-24 06:00:18.252854: step: 1108/530, loss: 0.004208332393318415 2023-01-24 06:00:19.300254: step: 1112/530, loss: 0.04608648642897606 2023-01-24 06:00:20.328490: step: 1116/530, loss: 0.006368137430399656 2023-01-24 06:00:21.374918: step: 1120/530, loss: 0.0024866051971912384 2023-01-24 06:00:22.424338: step: 1124/530, loss: 0.010059923864901066 2023-01-24 06:00:23.462416: step: 1128/530, loss: 0.017094725742936134 2023-01-24 06:00:24.495329: step: 1132/530, loss: 0.009986259043216705 2023-01-24 06:00:25.524604: step: 1136/530, loss: 0.01738540641963482 2023-01-24 06:00:26.565360: step: 1140/530, loss: 0.014111127704381943 2023-01-24 06:00:27.623962: step: 1144/530, loss: 0.007241981569677591 2023-01-24 06:00:28.665097: step: 1148/530, loss: 0.04822762683033943 2023-01-24 06:00:29.720200: step: 1152/530, loss: 0.006277620326727629 2023-01-24 06:00:30.778288: step: 1156/530, loss: 0.0023210307117551565 2023-01-24 06:00:31.858345: step: 1160/530, loss: 0.04634594917297363 2023-01-24 06:00:32.920731: step: 1164/530, loss: 0.005923795979470015 2023-01-24 06:00:33.958053: step: 1168/530, loss: 0.011370973661541939 2023-01-24 06:00:35.008183: step: 1172/530, loss: 0.02970983274281025 2023-01-24 06:00:36.049795: step: 1176/530, loss: 0.0075255706906318665 2023-01-24 06:00:37.097001: step: 1180/530, loss: 0.0018460537539795041 2023-01-24 06:00:38.128316: step: 1184/530, loss: 0.003375509986653924 2023-01-24 06:00:39.197511: step: 1188/530, loss: 0.002060431521385908 2023-01-24 06:00:40.223459: step: 1192/530, loss: 0.004417150281369686 2023-01-24 06:00:41.264979: step: 1196/530, loss: 0.010483695194125175 2023-01-24 06:00:42.304424: step: 1200/530, loss: 0.014702011831104755 2023-01-24 06:00:43.359618: step: 1204/530, loss: 0.003159887855872512 2023-01-24 06:00:44.413411: step: 1208/530, loss: 0.008196812123060226 2023-01-24 06:00:45.442891: step: 1212/530, loss: 0.006565215531736612 2023-01-24 06:00:46.481921: step: 1216/530, loss: 0.01153595745563507 2023-01-24 06:00:47.533273: step: 1220/530, loss: 0.0017138427356258035 2023-01-24 06:00:48.561504: step: 1224/530, loss: 0.008832437917590141 2023-01-24 06:00:49.602065: step: 1228/530, loss: 0.0037844006437808275 2023-01-24 06:00:50.642686: step: 1232/530, loss: 0.016488144174218178 2023-01-24 06:00:51.714534: step: 1236/530, loss: 0.028776640072464943 2023-01-24 06:00:52.766106: step: 1240/530, loss: 0.004934842698276043 2023-01-24 06:00:53.785224: step: 1244/530, loss: 0.0015925107290968299 2023-01-24 06:00:54.828523: step: 1248/530, loss: 0.0024560329038649797 2023-01-24 06:00:55.875540: step: 1252/530, loss: 0.006669624708592892 2023-01-24 06:00:56.924659: step: 1256/530, loss: 0.002642344683408737 2023-01-24 06:00:57.990925: step: 1260/530, loss: 0.012166638858616352 2023-01-24 06:00:59.032310: step: 1264/530, loss: 0.002556038787588477 2023-01-24 06:01:00.089939: step: 1268/530, loss: 0.0019084386294707656 2023-01-24 06:01:01.126824: step: 1272/530, loss: 0.02241872251033783 2023-01-24 06:01:02.176985: step: 1276/530, loss: 0.005768246483057737 2023-01-24 06:01:03.239625: step: 1280/530, loss: 0.00721336342394352 2023-01-24 06:01:04.277531: step: 1284/530, loss: 0.0032619929406791925 2023-01-24 06:01:05.317610: step: 1288/530, loss: 0.002321878680959344 2023-01-24 06:01:06.357628: step: 1292/530, loss: 0.0 2023-01-24 06:01:07.420671: step: 1296/530, loss: 0.003975667990744114 2023-01-24 06:01:08.474781: step: 1300/530, loss: 0.0027384948916733265 2023-01-24 06:01:09.525614: step: 1304/530, loss: 0.009381299838423729 2023-01-24 06:01:10.573455: step: 1308/530, loss: 0.00651626056060195 2023-01-24 06:01:11.609544: step: 1312/530, loss: 0.01557151135057211 2023-01-24 06:01:12.656081: step: 1316/530, loss: 0.03151615336537361 2023-01-24 06:01:13.690926: step: 1320/530, loss: 0.004775182344019413 2023-01-24 06:01:14.735335: step: 1324/530, loss: 0.0051331715658307076 2023-01-24 06:01:15.790900: step: 1328/530, loss: 0.015781784430146217 2023-01-24 06:01:16.818639: step: 1332/530, loss: 0.006004722323268652 2023-01-24 06:01:17.863422: step: 1336/530, loss: 0.012165858410298824 2023-01-24 06:01:18.899028: step: 1340/530, loss: 0.0021781730465590954 2023-01-24 06:01:19.958625: step: 1344/530, loss: 0.017394790425896645 2023-01-24 06:01:20.999025: step: 1348/530, loss: 0.004634325858205557 2023-01-24 06:01:22.055308: step: 1352/530, loss: 0.004140722565352917 2023-01-24 06:01:23.118199: step: 1356/530, loss: 0.007242133375257254 2023-01-24 06:01:24.152396: step: 1360/530, loss: 0.0038441636133939028 2023-01-24 06:01:25.192082: step: 1364/530, loss: 0.00365601503290236 2023-01-24 06:01:26.216195: step: 1368/530, loss: 0.008653477765619755 2023-01-24 06:01:27.274714: step: 1372/530, loss: 0.06473550200462341 2023-01-24 06:01:28.325016: step: 1376/530, loss: 0.012365452945232391 2023-01-24 06:01:29.380400: step: 1380/530, loss: 0.01687469333410263 2023-01-24 06:01:30.421781: step: 1384/530, loss: 0.013735839165747166 2023-01-24 06:01:31.452531: step: 1388/530, loss: 0.002074249554425478 2023-01-24 06:01:32.495873: step: 1392/530, loss: 0.0066183325834572315 2023-01-24 06:01:33.541610: step: 1396/530, loss: 0.003992049489170313 2023-01-24 06:01:34.595182: step: 1400/530, loss: 0.01779647171497345 2023-01-24 06:01:35.649169: step: 1404/530, loss: 0.005528097972273827 2023-01-24 06:01:36.729242: step: 1408/530, loss: 0.007138720713555813 2023-01-24 06:01:37.778239: step: 1412/530, loss: 0.011370713822543621 2023-01-24 06:01:38.826857: step: 1416/530, loss: 0.013343335129320621 2023-01-24 06:01:39.874398: step: 1420/530, loss: 0.003445129841566086 2023-01-24 06:01:40.914641: step: 1424/530, loss: 0.03647959977388382 2023-01-24 06:01:41.970949: step: 1428/530, loss: 0.0046344357542693615 2023-01-24 06:01:43.009226: step: 1432/530, loss: 0.012319570407271385 2023-01-24 06:01:44.050114: step: 1436/530, loss: 0.006243827287107706 2023-01-24 06:01:45.096020: step: 1440/530, loss: 0.014569567516446114 2023-01-24 06:01:46.143928: step: 1444/530, loss: 0.038104668259620667 2023-01-24 06:01:47.170736: step: 1448/530, loss: 0.0027446846943348646 2023-01-24 06:01:48.213391: step: 1452/530, loss: 0.037536486983299255 2023-01-24 06:01:49.256779: step: 1456/530, loss: 0.0038887758273631334 2023-01-24 06:01:50.289883: step: 1460/530, loss: 0.005944808013737202 2023-01-24 06:01:51.331968: step: 1464/530, loss: 0.006518770940601826 2023-01-24 06:01:52.374606: step: 1468/530, loss: 0.006378414575010538 2023-01-24 06:01:53.417667: step: 1472/530, loss: 0.00516114104539156 2023-01-24 06:01:54.452460: step: 1476/530, loss: 0.00238236621953547 2023-01-24 06:01:55.493632: step: 1480/530, loss: 0.007914666086435318 2023-01-24 06:01:56.555655: step: 1484/530, loss: 0.021690787747502327 2023-01-24 06:01:57.600150: step: 1488/530, loss: 0.03436211124062538 2023-01-24 06:01:58.643752: step: 1492/530, loss: 0.00542786531150341 2023-01-24 06:01:59.699588: step: 1496/530, loss: 0.0016266766469925642 2023-01-24 06:02:00.742783: step: 1500/530, loss: 0.004417261108756065 2023-01-24 06:02:01.799758: step: 1504/530, loss: 0.010348916985094547 2023-01-24 06:02:02.837723: step: 1508/530, loss: 0.0024823001585900784 2023-01-24 06:02:03.865757: step: 1512/530, loss: 0.0027275504544377327 2023-01-24 06:02:04.906300: step: 1516/530, loss: 0.024256065487861633 2023-01-24 06:02:05.951177: step: 1520/530, loss: 0.006303762551397085 2023-01-24 06:02:06.998080: step: 1524/530, loss: 0.0005122361471876502 2023-01-24 06:02:08.038730: step: 1528/530, loss: 0.005714477971196175 2023-01-24 06:02:09.069770: step: 1532/530, loss: 0.0032499264925718307 2023-01-24 06:02:10.117607: step: 1536/530, loss: 0.0031902496702969074 2023-01-24 06:02:11.155365: step: 1540/530, loss: 0.006088098045438528 2023-01-24 06:02:12.193467: step: 1544/530, loss: 0.041882455348968506 2023-01-24 06:02:13.240605: step: 1548/530, loss: 0.012648779898881912 2023-01-24 06:02:14.266747: step: 1552/530, loss: 0.0029303147457540035 2023-01-24 06:02:15.300298: step: 1556/530, loss: 0.0025913789868354797 2023-01-24 06:02:16.345573: step: 1560/530, loss: 0.010696973651647568 2023-01-24 06:02:17.386961: step: 1564/530, loss: 0.013189993798732758 2023-01-24 06:02:18.438795: step: 1568/530, loss: 0.003158735577017069 2023-01-24 06:02:19.478717: step: 1572/530, loss: 0.010850224643945694 2023-01-24 06:02:20.521637: step: 1576/530, loss: 0.0022604234982281923 2023-01-24 06:02:21.562020: step: 1580/530, loss: 0.01447734422981739 2023-01-24 06:02:22.595690: step: 1584/530, loss: 0.002383883111178875 2023-01-24 06:02:23.653666: step: 1588/530, loss: 0.005349942948669195 2023-01-24 06:02:24.715231: step: 1592/530, loss: 0.010400950908660889 2023-01-24 06:02:25.791463: step: 1596/530, loss: 0.009962107054889202 2023-01-24 06:02:26.808246: step: 1600/530, loss: 0.0005176945705898106 2023-01-24 06:02:27.859540: step: 1604/530, loss: 0.003487328765913844 2023-01-24 06:02:28.902363: step: 1608/530, loss: 0.01664735935628414 2023-01-24 06:02:29.934582: step: 1612/530, loss: 0.00046591219143010676 2023-01-24 06:02:31.007916: step: 1616/530, loss: 0.022153649479150772 2023-01-24 06:02:32.050597: step: 1620/530, loss: 0.001370233716443181 2023-01-24 06:02:33.100098: step: 1624/530, loss: 0.013568615540862083 2023-01-24 06:02:34.163504: step: 1628/530, loss: 0.010257410816848278 2023-01-24 06:02:35.208003: step: 1632/530, loss: 0.0013606279389932752 2023-01-24 06:02:36.263382: step: 1636/530, loss: 0.010526888072490692 2023-01-24 06:02:37.320979: step: 1640/530, loss: 0.0003021125157829374 2023-01-24 06:02:38.376434: step: 1644/530, loss: 0.03822477161884308 2023-01-24 06:02:39.415702: step: 1648/530, loss: 0.0069490112364292145 2023-01-24 06:02:40.451730: step: 1652/530, loss: 0.008463256992399693 2023-01-24 06:02:41.512028: step: 1656/530, loss: 0.002760227071121335 2023-01-24 06:02:42.540921: step: 1660/530, loss: 0.003952574450522661 2023-01-24 06:02:43.589614: step: 1664/530, loss: 0.019917337223887444 2023-01-24 06:02:44.627824: step: 1668/530, loss: 0.0009388299658894539 2023-01-24 06:02:45.681225: step: 1672/530, loss: 0.0026818157639354467 2023-01-24 06:02:46.729611: step: 1676/530, loss: 0.0008446202846243978 2023-01-24 06:02:47.773913: step: 1680/530, loss: 0.003061462426558137 2023-01-24 06:02:48.832925: step: 1684/530, loss: 0.01259323488920927 2023-01-24 06:02:49.887762: step: 1688/530, loss: 0.003192199394106865 2023-01-24 06:02:50.922203: step: 1692/530, loss: 0.0030326182022690773 2023-01-24 06:02:51.958790: step: 1696/530, loss: 0.0023902729153633118 2023-01-24 06:02:53.009713: step: 1700/530, loss: 0.010590974241495132 2023-01-24 06:02:54.062421: step: 1704/530, loss: 0.005997471511363983 2023-01-24 06:02:55.108538: step: 1708/530, loss: 0.0042737917974591255 2023-01-24 06:02:56.147789: step: 1712/530, loss: 0.0019460093462839723 2023-01-24 06:02:57.199841: step: 1716/530, loss: 0.009023701772093773 2023-01-24 06:02:58.231646: step: 1720/530, loss: 0.03829607367515564 2023-01-24 06:02:59.287170: step: 1724/530, loss: 0.001464914996176958 2023-01-24 06:03:00.329153: step: 1728/530, loss: 0.011218001134693623 2023-01-24 06:03:01.380390: step: 1732/530, loss: 0.006468515843153 2023-01-24 06:03:02.414224: step: 1736/530, loss: 0.05774828791618347 2023-01-24 06:03:03.469664: step: 1740/530, loss: 0.004463072866201401 2023-01-24 06:03:04.509953: step: 1744/530, loss: 0.004707530606538057 2023-01-24 06:03:05.551267: step: 1748/530, loss: 0.00423012301325798 2023-01-24 06:03:06.588211: step: 1752/530, loss: 0.0026463803369551897 2023-01-24 06:03:07.622599: step: 1756/530, loss: 0.0012509971857070923 2023-01-24 06:03:08.655016: step: 1760/530, loss: 0.03683941438794136 2023-01-24 06:03:09.703548: step: 1764/530, loss: 0.004583033733069897 2023-01-24 06:03:10.759850: step: 1768/530, loss: 0.001848480082117021 2023-01-24 06:03:11.801777: step: 1772/530, loss: 0.005092152394354343 2023-01-24 06:03:12.867820: step: 1776/530, loss: 0.010181999765336514 2023-01-24 06:03:13.903311: step: 1780/530, loss: 0.004218610934913158 2023-01-24 06:03:14.940286: step: 1784/530, loss: 0.0066188001073896885 2023-01-24 06:03:16.010038: step: 1788/530, loss: 0.006293498445302248 2023-01-24 06:03:17.066383: step: 1792/530, loss: 0.029996046796441078 2023-01-24 06:03:18.124070: step: 1796/530, loss: 0.006235219072550535 2023-01-24 06:03:19.153953: step: 1800/530, loss: 0.0007102636736817658 2023-01-24 06:03:20.216131: step: 1804/530, loss: 0.01009336393326521 2023-01-24 06:03:21.254493: step: 1808/530, loss: 0.019660072401165962 2023-01-24 06:03:22.287139: step: 1812/530, loss: 0.0034724606666713953 2023-01-24 06:03:23.343655: step: 1816/530, loss: 4.8215253627859056e-05 2023-01-24 06:03:24.369830: step: 1820/530, loss: 0.0020423235837370157 2023-01-24 06:03:25.431228: step: 1824/530, loss: 0.0020411359146237373 2023-01-24 06:03:26.487802: step: 1828/530, loss: 0.0008384475950151682 2023-01-24 06:03:27.533035: step: 1832/530, loss: 0.007453765720129013 2023-01-24 06:03:28.574669: step: 1836/530, loss: 0.005854646675288677 2023-01-24 06:03:29.627886: step: 1840/530, loss: 0.01420413888990879 2023-01-24 06:03:30.661740: step: 1844/530, loss: 0.005356969777494669 2023-01-24 06:03:31.700702: step: 1848/530, loss: 0.004413146525621414 2023-01-24 06:03:32.756625: step: 1852/530, loss: 0.0024649128317832947 2023-01-24 06:03:33.815941: step: 1856/530, loss: 0.01569589413702488 2023-01-24 06:03:34.860879: step: 1860/530, loss: 0.005170603282749653 2023-01-24 06:03:35.931964: step: 1864/530, loss: 0.015741726383566856 2023-01-24 06:03:36.990776: step: 1868/530, loss: 0.003222364466637373 2023-01-24 06:03:38.047879: step: 1872/530, loss: 0.004273899830877781 2023-01-24 06:03:39.099578: step: 1876/530, loss: 0.005244630854576826 2023-01-24 06:03:40.153267: step: 1880/530, loss: 0.005790162831544876 2023-01-24 06:03:41.202992: step: 1884/530, loss: 0.004424300044775009 2023-01-24 06:03:42.244882: step: 1888/530, loss: 0.0076529355719685555 2023-01-24 06:03:43.291359: step: 1892/530, loss: 0.004454405978322029 2023-01-24 06:03:44.340795: step: 1896/530, loss: 0.0012347509618848562 2023-01-24 06:03:45.415079: step: 1900/530, loss: 0.004442939534783363 2023-01-24 06:03:46.444480: step: 1904/530, loss: 0.007836198434233665 2023-01-24 06:03:47.475317: step: 1908/530, loss: 0.006599419750273228 2023-01-24 06:03:48.543320: step: 1912/530, loss: 0.005424900911748409 2023-01-24 06:03:49.603373: step: 1916/530, loss: 0.023368019610643387 2023-01-24 06:03:50.639775: step: 1920/530, loss: 0.0005079061957076192 2023-01-24 06:03:51.683761: step: 1924/530, loss: 0.002876706188544631 2023-01-24 06:03:52.724908: step: 1928/530, loss: 0.002839681226760149 2023-01-24 06:03:53.758200: step: 1932/530, loss: 0.002800461370497942 2023-01-24 06:03:54.803388: step: 1936/530, loss: 0.0345260426402092 2023-01-24 06:03:55.837626: step: 1940/530, loss: 0.0011219825828447938 2023-01-24 06:03:56.871247: step: 1944/530, loss: 0.03704563155770302 2023-01-24 06:03:57.919889: step: 1948/530, loss: 0.0020183371379971504 2023-01-24 06:03:58.984025: step: 1952/530, loss: 0.007695924025028944 2023-01-24 06:04:00.038151: step: 1956/530, loss: 0.00744060892611742 2023-01-24 06:04:01.080950: step: 1960/530, loss: 0.006299425847828388 2023-01-24 06:04:02.123637: step: 1964/530, loss: 0.009902258403599262 2023-01-24 06:04:03.185328: step: 1968/530, loss: 0.030299803242087364 2023-01-24 06:04:04.228549: step: 1972/530, loss: 0.021792281419038773 2023-01-24 06:04:05.270662: step: 1976/530, loss: 0.009079894982278347 2023-01-24 06:04:06.312994: step: 1980/530, loss: 0.016156412661075592 2023-01-24 06:04:07.366370: step: 1984/530, loss: 0.0008829004946164787 2023-01-24 06:04:08.404852: step: 1988/530, loss: 0.009219007566571236 2023-01-24 06:04:09.447538: step: 1992/530, loss: 0.004383533261716366 2023-01-24 06:04:10.492135: step: 1996/530, loss: 0.004133886191993952 2023-01-24 06:04:11.531129: step: 2000/530, loss: 0.012615744024515152 2023-01-24 06:04:12.570681: step: 2004/530, loss: 0.0044347625225782394 2023-01-24 06:04:13.613284: step: 2008/530, loss: 0.00016376172425225377 2023-01-24 06:04:14.660106: step: 2012/530, loss: 0.0031638555228710175 2023-01-24 06:04:15.706781: step: 2016/530, loss: 0.0008808086859062314 2023-01-24 06:04:16.747636: step: 2020/530, loss: 0.0026555319782346487 2023-01-24 06:04:17.781180: step: 2024/530, loss: 0.01694948598742485 2023-01-24 06:04:18.823404: step: 2028/530, loss: 0.0021222829818725586 2023-01-24 06:04:19.873269: step: 2032/530, loss: 0.042453326284885406 2023-01-24 06:04:20.916838: step: 2036/530, loss: 2.66447068497655e-06 2023-01-24 06:04:21.952778: step: 2040/530, loss: 0.008571631275117397 2023-01-24 06:04:22.974747: step: 2044/530, loss: 0.004397754091769457 2023-01-24 06:04:24.018330: step: 2048/530, loss: 0.001480049453675747 2023-01-24 06:04:25.056800: step: 2052/530, loss: 0.004592315759509802 2023-01-24 06:04:26.098219: step: 2056/530, loss: 0.013568039983510971 2023-01-24 06:04:27.143906: step: 2060/530, loss: 0.005409645847976208 2023-01-24 06:04:28.187294: step: 2064/530, loss: 0.01585240475833416 2023-01-24 06:04:29.239973: step: 2068/530, loss: 0.005477391183376312 2023-01-24 06:04:30.279502: step: 2072/530, loss: 0.008745000697672367 2023-01-24 06:04:31.313172: step: 2076/530, loss: 0.0028602932579815388 2023-01-24 06:04:32.363946: step: 2080/530, loss: 0.027682442218065262 2023-01-24 06:04:33.419986: step: 2084/530, loss: 0.0026634125970304012 2023-01-24 06:04:34.473526: step: 2088/530, loss: 0.0068257697857916355 2023-01-24 06:04:35.522012: step: 2092/530, loss: 0.12185706198215485 2023-01-24 06:04:36.579048: step: 2096/530, loss: 0.0046238708309829235 2023-01-24 06:04:37.634994: step: 2100/530, loss: 0.011242169886827469 2023-01-24 06:04:38.671945: step: 2104/530, loss: 0.038506343960762024 2023-01-24 06:04:39.748463: step: 2108/530, loss: 0.002894774777814746 2023-01-24 06:04:40.803418: step: 2112/530, loss: 0.0052803680300712585 2023-01-24 06:04:41.844323: step: 2116/530, loss: 0.005777029786258936 2023-01-24 06:04:42.872622: step: 2120/530, loss: 0.001339518348686397 ================================================== Loss: 0.011 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37424715909090905, 'r': 0.3124644212523719, 'f1': 0.34057652533609095}, 'combined': 0.2509511239318565, 'stategy': 1, 'epoch': 5} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3799095807023327, 'r': 0.3907342102995499, 'f1': 0.3852458729550614}, 'combined': 0.2986116335823921, 'stategy': 1, 'epoch': 5} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.39336880300065236, 'r': 0.3269365004066143, 'f1': 0.3570891931902295}, 'combined': 0.26311835287701124, 'stategy': 1, 'epoch': 5} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3691424037724075, 'r': 0.361338841927954, 'f1': 0.3651989410289029}, 'combined': 0.28307286338125487, 'stategy': 1, 'epoch': 5} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38848653548019935, 'r': 0.329513247361763, 'f1': 0.35657799047155875}, 'combined': 0.2627416771895696, 'stategy': 1, 'epoch': 5} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36596083711111593, 'r': 0.3602426990312548, 'f1': 0.3630792557165402}, 'combined': 0.28142985371329915, 'stategy': 1, 'epoch': 5} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 5} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5, 'r': 0.41304347826086957, 'f1': 0.45238095238095233}, 'combined': 0.22619047619047616, 'stategy': 1, 'epoch': 5} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 5} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.36950383771929823, 'r': 0.319722485768501, 'f1': 0.3428153611393693}, 'combined': 0.2526007924184826, 'stategy': 1, 'epoch': 4} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37742601309099055, 'r': 0.3923426661819029, 'f1': 0.38473981145192454}, 'combined': 0.2982193753837884, 'stategy': 1, 'epoch': 4} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 4} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38236684276980326, 'r': 0.33520584698225636, 'f1': 0.35723656493356754}, 'combined': 0.2632269425826287, 'stategy': 1, 'epoch': 1} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3561820350737081, 'r': 0.35978314020772534, 'f1': 0.35797353136351645}, 'combined': 0.27747230660712763, 'stategy': 1, 'epoch': 1} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 1} ****************************** Epoch: 6 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 06:07:02.319351: step: 4/530, loss: 0.002410094253718853 2023-01-24 06:07:03.374497: step: 8/530, loss: 0.007437431253492832 2023-01-24 06:07:04.426980: step: 12/530, loss: 0.00877330731600523 2023-01-24 06:07:05.476255: step: 16/530, loss: 0.01219247281551361 2023-01-24 06:07:06.518900: step: 20/530, loss: 0.010418952442705631 2023-01-24 06:07:07.576923: step: 24/530, loss: 0.00411903066560626 2023-01-24 06:07:08.612371: step: 28/530, loss: 0.003494005184620619 2023-01-24 06:07:09.649759: step: 32/530, loss: 0.01221332885324955 2023-01-24 06:07:10.693494: step: 36/530, loss: 0.0071880570612847805 2023-01-24 06:07:11.728665: step: 40/530, loss: 0.015654858201742172 2023-01-24 06:07:12.784927: step: 44/530, loss: 0.01211537141352892 2023-01-24 06:07:13.821602: step: 48/530, loss: 0.003388779703527689 2023-01-24 06:07:14.865623: step: 52/530, loss: 0.006029969546943903 2023-01-24 06:07:15.899010: step: 56/530, loss: 0.00984850525856018 2023-01-24 06:07:16.922930: step: 60/530, loss: 0.0013922890648245811 2023-01-24 06:07:17.960570: step: 64/530, loss: 0.005875272210687399 2023-01-24 06:07:18.993929: step: 68/530, loss: 0.006032685283571482 2023-01-24 06:07:20.028425: step: 72/530, loss: 0.0074692657217383385 2023-01-24 06:07:21.060829: step: 76/530, loss: 0.001431178068742156 2023-01-24 06:07:22.108199: step: 80/530, loss: 0.0010363295441493392 2023-01-24 06:07:23.152071: step: 84/530, loss: 0.0036098435521125793 2023-01-24 06:07:24.184646: step: 88/530, loss: 0.004584179725497961 2023-01-24 06:07:25.233226: step: 92/530, loss: 0.0020966327283531427 2023-01-24 06:07:26.290786: step: 96/530, loss: 0.019692474976181984 2023-01-24 06:07:27.340541: step: 100/530, loss: 0.003456499893218279 2023-01-24 06:07:28.392508: step: 104/530, loss: 0.028512200340628624 2023-01-24 06:07:29.426291: step: 108/530, loss: 0.005234116688370705 2023-01-24 06:07:30.457230: step: 112/530, loss: 0.021136388182640076 2023-01-24 06:07:31.524205: step: 116/530, loss: 0.003945980221033096 2023-01-24 06:07:32.574951: step: 120/530, loss: 0.02525639906525612 2023-01-24 06:07:33.638276: step: 124/530, loss: 0.007580672390758991 2023-01-24 06:07:34.707832: step: 128/530, loss: 0.0042554219253361225 2023-01-24 06:07:35.747528: step: 132/530, loss: 0.0026932593900710344 2023-01-24 06:07:36.797047: step: 136/530, loss: 0.015149188227951527 2023-01-24 06:07:37.843605: step: 140/530, loss: 0.009992536157369614 2023-01-24 06:07:38.888964: step: 144/530, loss: 0.05954030901193619 2023-01-24 06:07:39.933067: step: 148/530, loss: 0.004324452951550484 2023-01-24 06:07:40.960940: step: 152/530, loss: 0.0016933104488998652 2023-01-24 06:07:42.009307: step: 156/530, loss: 0.017377691343426704 2023-01-24 06:07:43.065804: step: 160/530, loss: 0.013133893720805645 2023-01-24 06:07:44.108637: step: 164/530, loss: 0.010859663598239422 2023-01-24 06:07:45.147019: step: 168/530, loss: 0.006150545086711645 2023-01-24 06:07:46.189632: step: 172/530, loss: 0.002983695827424526 2023-01-24 06:07:47.227776: step: 176/530, loss: 0.003486424218863249 2023-01-24 06:07:48.277721: step: 180/530, loss: 0.007634737063199282 2023-01-24 06:07:49.313024: step: 184/530, loss: 0.0019673083443194628 2023-01-24 06:07:50.359417: step: 188/530, loss: 0.037448983639478683 2023-01-24 06:07:51.395784: step: 192/530, loss: 0.005233213305473328 2023-01-24 06:07:52.459137: step: 196/530, loss: 0.008048838004469872 2023-01-24 06:07:53.498352: step: 200/530, loss: 0.009631250984966755 2023-01-24 06:07:54.565637: step: 204/530, loss: 0.0036192014813423157 2023-01-24 06:07:55.591276: step: 208/530, loss: 0.00941761676222086 2023-01-24 06:07:56.648035: step: 212/530, loss: 0.007438240107148886 2023-01-24 06:07:57.707617: step: 216/530, loss: 0.009174337610602379 2023-01-24 06:07:58.759152: step: 220/530, loss: 0.012814212590456009 2023-01-24 06:07:59.806290: step: 224/530, loss: 0.003169468604028225 2023-01-24 06:08:00.868780: step: 228/530, loss: 0.01477832067757845 2023-01-24 06:08:01.917725: step: 232/530, loss: 0.004762791097164154 2023-01-24 06:08:02.976926: step: 236/530, loss: 0.0009118078742176294 2023-01-24 06:08:04.022340: step: 240/530, loss: 0.0076090204529464245 2023-01-24 06:08:05.047575: step: 244/530, loss: 0.01418292336165905 2023-01-24 06:08:06.093705: step: 248/530, loss: 0.002979577984660864 2023-01-24 06:08:07.127472: step: 252/530, loss: 0.016973827034235 2023-01-24 06:08:08.173851: step: 256/530, loss: 0.03841639310121536 2023-01-24 06:08:09.217495: step: 260/530, loss: 0.005691807251423597 2023-01-24 06:08:10.262797: step: 264/530, loss: 0.012516610324382782 2023-01-24 06:08:11.306468: step: 268/530, loss: 0.004631086718291044 2023-01-24 06:08:12.352556: step: 272/530, loss: 0.00608882075175643 2023-01-24 06:08:13.398401: step: 276/530, loss: 0.007790985982865095 2023-01-24 06:08:14.427388: step: 280/530, loss: 0.0038460693322122097 2023-01-24 06:08:15.482227: step: 284/530, loss: 0.010678712278604507 2023-01-24 06:08:16.528193: step: 288/530, loss: 0.006827929522842169 2023-01-24 06:08:17.566136: step: 292/530, loss: 0.009913576766848564 2023-01-24 06:08:18.622623: step: 296/530, loss: 0.007829931564629078 2023-01-24 06:08:19.674791: step: 300/530, loss: 0.007564726285636425 2023-01-24 06:08:20.724379: step: 304/530, loss: 0.0016680812695994973 2023-01-24 06:08:21.770788: step: 308/530, loss: 0.0019515500171110034 2023-01-24 06:08:22.821769: step: 312/530, loss: 0.006295766215771437 2023-01-24 06:08:23.873491: step: 316/530, loss: 0.014552712440490723 2023-01-24 06:08:24.936168: step: 320/530, loss: 0.015734106302261353 2023-01-24 06:08:25.985316: step: 324/530, loss: 0.029018845409154892 2023-01-24 06:08:27.035921: step: 328/530, loss: 0.002421098994091153 2023-01-24 06:08:28.072872: step: 332/530, loss: 0.007607277948409319 2023-01-24 06:08:29.145659: step: 336/530, loss: 0.008062227629125118 2023-01-24 06:08:30.191104: step: 340/530, loss: 0.002171614672988653 2023-01-24 06:08:31.239646: step: 344/530, loss: 0.005242005456238985 2023-01-24 06:08:32.311703: step: 348/530, loss: 0.03092706948518753 2023-01-24 06:08:33.346019: step: 352/530, loss: 0.0011545714223757386 2023-01-24 06:08:34.395208: step: 356/530, loss: 0.014324848540127277 2023-01-24 06:08:35.452666: step: 360/530, loss: 0.0010595325147733092 2023-01-24 06:08:36.528922: step: 364/530, loss: 0.00783079955726862 2023-01-24 06:08:37.588963: step: 368/530, loss: 0.02011287398636341 2023-01-24 06:08:38.632755: step: 372/530, loss: 0.008472003042697906 2023-01-24 06:08:39.691731: step: 376/530, loss: 0.004476419184356928 2023-01-24 06:08:40.743632: step: 380/530, loss: 0.002901660744100809 2023-01-24 06:08:41.790304: step: 384/530, loss: 0.004274390172213316 2023-01-24 06:08:42.838827: step: 388/530, loss: 0.007560750935226679 2023-01-24 06:08:43.899526: step: 392/530, loss: 0.008412742987275124 2023-01-24 06:08:44.934461: step: 396/530, loss: 0.002534314524382353 2023-01-24 06:08:45.981398: step: 400/530, loss: 0.0003153608995489776 2023-01-24 06:08:47.046981: step: 404/530, loss: 0.011063888669013977 2023-01-24 06:08:48.092053: step: 408/530, loss: 0.01040762010961771 2023-01-24 06:08:49.131516: step: 412/530, loss: 0.0013059860793873668 2023-01-24 06:08:50.165503: step: 416/530, loss: 0.002887838752940297 2023-01-24 06:08:51.226237: step: 420/530, loss: 0.003689179429784417 2023-01-24 06:08:52.287218: step: 424/530, loss: 0.006608184892684221 2023-01-24 06:08:53.345840: step: 428/530, loss: 0.0027508896309882402 2023-01-24 06:08:54.400484: step: 432/530, loss: 0.03888503462076187 2023-01-24 06:08:55.444460: step: 436/530, loss: 0.011268495582044125 2023-01-24 06:08:56.492484: step: 440/530, loss: 0.007574399467557669 2023-01-24 06:08:57.536916: step: 444/530, loss: 0.004419418517500162 2023-01-24 06:08:58.595324: step: 448/530, loss: 0.00045379874063655734 2023-01-24 06:08:59.635631: step: 452/530, loss: 0.0008488036692142487 2023-01-24 06:09:00.685587: step: 456/530, loss: 0.020364968106150627 2023-01-24 06:09:01.739134: step: 460/530, loss: 0.003826733212918043 2023-01-24 06:09:02.787799: step: 464/530, loss: 0.010594396851956844 2023-01-24 06:09:03.835291: step: 468/530, loss: 0.004512263927608728 2023-01-24 06:09:04.871040: step: 472/530, loss: 0.009800147265195847 2023-01-24 06:09:05.935616: step: 476/530, loss: 0.047890421003103256 2023-01-24 06:09:07.001210: step: 480/530, loss: 0.009888233616948128 2023-01-24 06:09:08.056315: step: 484/530, loss: 0.006917847320437431 2023-01-24 06:09:09.108113: step: 488/530, loss: 0.0050926003605127335 2023-01-24 06:09:10.143268: step: 492/530, loss: 0.0029797812458127737 2023-01-24 06:09:11.164694: step: 496/530, loss: 0.013459056615829468 2023-01-24 06:09:12.204903: step: 500/530, loss: 0.025662623345851898 2023-01-24 06:09:13.247645: step: 504/530, loss: 0.0174722783267498 2023-01-24 06:09:14.305629: step: 508/530, loss: 0.010713571682572365 2023-01-24 06:09:15.354577: step: 512/530, loss: 0.0031614790204912424 2023-01-24 06:09:16.406702: step: 516/530, loss: 0.005334513261914253 2023-01-24 06:09:17.451100: step: 520/530, loss: 0.003554454306140542 2023-01-24 06:09:18.502734: step: 524/530, loss: 0.015352113172411919 2023-01-24 06:09:19.546465: step: 528/530, loss: 0.01889767497777939 2023-01-24 06:09:20.590101: step: 532/530, loss: 0.023547524586319923 2023-01-24 06:09:21.622146: step: 536/530, loss: 0.022570954635739326 2023-01-24 06:09:22.669979: step: 540/530, loss: 0.002468713792040944 2023-01-24 06:09:23.719142: step: 544/530, loss: 0.0029661296866834164 2023-01-24 06:09:24.745163: step: 548/530, loss: 0.0069870189763605595 2023-01-24 06:09:25.789408: step: 552/530, loss: 0.012515907175838947 2023-01-24 06:09:26.835653: step: 556/530, loss: 0.006003242917358875 2023-01-24 06:09:27.867704: step: 560/530, loss: 0.006347401533275843 2023-01-24 06:09:28.914796: step: 564/530, loss: 0.004825224634259939 2023-01-24 06:09:29.959529: step: 568/530, loss: 0.010376404970884323 2023-01-24 06:09:31.014087: step: 572/530, loss: 0.00442598108202219 2023-01-24 06:09:32.047347: step: 576/530, loss: 0.0035153068602085114 2023-01-24 06:09:33.106779: step: 580/530, loss: 0.001959670102223754 2023-01-24 06:09:34.155620: step: 584/530, loss: 0.0016146284760907292 2023-01-24 06:09:35.200323: step: 588/530, loss: 0.03220200538635254 2023-01-24 06:09:36.250181: step: 592/530, loss: 0.006691142916679382 2023-01-24 06:09:37.301907: step: 596/530, loss: 0.007411698345094919 2023-01-24 06:09:38.347362: step: 600/530, loss: 0.022594882175326347 2023-01-24 06:09:39.387983: step: 604/530, loss: 0.019872277975082397 2023-01-24 06:09:40.430669: step: 608/530, loss: 0.004766772501170635 2023-01-24 06:09:41.487714: step: 612/530, loss: 0.001640079659409821 2023-01-24 06:09:42.533882: step: 616/530, loss: 0.026924069970846176 2023-01-24 06:09:43.581003: step: 620/530, loss: 0.004269296769052744 2023-01-24 06:09:44.605004: step: 624/530, loss: 0.032938603311777115 2023-01-24 06:09:45.670658: step: 628/530, loss: 0.07112736999988556 2023-01-24 06:09:46.718757: step: 632/530, loss: 0.002609388902783394 2023-01-24 06:09:47.771294: step: 636/530, loss: 0.005671422462910414 2023-01-24 06:09:48.799656: step: 640/530, loss: 0.010422873310744762 2023-01-24 06:09:49.834516: step: 644/530, loss: 0.004011990502476692 2023-01-24 06:09:50.867199: step: 648/530, loss: 0.004823459777981043 2023-01-24 06:09:51.903571: step: 652/530, loss: 0.0007633664645254612 2023-01-24 06:09:52.955976: step: 656/530, loss: 0.005875679198652506 2023-01-24 06:09:54.005848: step: 660/530, loss: 0.00778320524841547 2023-01-24 06:09:55.044036: step: 664/530, loss: 0.007265261374413967 2023-01-24 06:09:56.077258: step: 668/530, loss: 0.016020778566598892 2023-01-24 06:09:57.108183: step: 672/530, loss: 0.00456432206556201 2023-01-24 06:09:58.139039: step: 676/530, loss: 0.004717620089650154 2023-01-24 06:09:59.197253: step: 680/530, loss: 0.004241175018250942 2023-01-24 06:10:00.233034: step: 684/530, loss: 0.0016837397124618292 2023-01-24 06:10:01.273414: step: 688/530, loss: 0.0077882069163024426 2023-01-24 06:10:02.317655: step: 692/530, loss: 0.004180263262242079 2023-01-24 06:10:03.391427: step: 696/530, loss: 0.0011722301132977009 2023-01-24 06:10:04.434451: step: 700/530, loss: 0.003927664831280708 2023-01-24 06:10:05.475600: step: 704/530, loss: 0.003746821777895093 2023-01-24 06:10:06.531519: step: 708/530, loss: 0.010402302257716656 2023-01-24 06:10:07.574890: step: 712/530, loss: 0.003486238420009613 2023-01-24 06:10:08.615261: step: 716/530, loss: 0.007428276818245649 2023-01-24 06:10:09.674648: step: 720/530, loss: 0.0062630134634673595 2023-01-24 06:10:10.702465: step: 724/530, loss: 0.006969220004975796 2023-01-24 06:10:11.744727: step: 728/530, loss: 0.0075798118487000465 2023-01-24 06:10:12.808521: step: 732/530, loss: 0.004669481422752142 2023-01-24 06:10:13.866098: step: 736/530, loss: 0.003979456145316362 2023-01-24 06:10:14.901816: step: 740/530, loss: 0.0 2023-01-24 06:10:15.965147: step: 744/530, loss: 0.008986570872366428 2023-01-24 06:10:17.008736: step: 748/530, loss: 0.00022098649060353637 2023-01-24 06:10:18.050264: step: 752/530, loss: 0.014801819808781147 2023-01-24 06:10:19.092463: step: 756/530, loss: 0.00024320901138707995 2023-01-24 06:10:20.125327: step: 760/530, loss: 0.010732698254287243 2023-01-24 06:10:21.166424: step: 764/530, loss: 0.0075147259049117565 2023-01-24 06:10:22.202852: step: 768/530, loss: 0.005018957890570164 2023-01-24 06:10:23.233365: step: 772/530, loss: 0.013307273387908936 2023-01-24 06:10:24.284085: step: 776/530, loss: 0.008007578551769257 2023-01-24 06:10:25.342701: step: 780/530, loss: 0.009756868705153465 2023-01-24 06:10:26.408427: step: 784/530, loss: 0.008467484265565872 2023-01-24 06:10:27.442858: step: 788/530, loss: 0.004501370247453451 2023-01-24 06:10:28.491427: step: 792/530, loss: 0.003742700908333063 2023-01-24 06:10:29.526103: step: 796/530, loss: 0.012340862303972244 2023-01-24 06:10:30.570143: step: 800/530, loss: 0.016069967299699783 2023-01-24 06:10:31.611138: step: 804/530, loss: 0.02661287970840931 2023-01-24 06:10:32.660229: step: 808/530, loss: 0.004242150112986565 2023-01-24 06:10:33.731257: step: 812/530, loss: 0.00043672951869666576 2023-01-24 06:10:34.770951: step: 816/530, loss: 0.004944864194840193 2023-01-24 06:10:35.824166: step: 820/530, loss: 0.002860134234651923 2023-01-24 06:10:36.874857: step: 824/530, loss: 0.010515425354242325 2023-01-24 06:10:37.916308: step: 828/530, loss: 0.006130465306341648 2023-01-24 06:10:38.948529: step: 832/530, loss: 0.006505517289042473 2023-01-24 06:10:40.006937: step: 836/530, loss: 0.005574814509600401 2023-01-24 06:10:41.053466: step: 840/530, loss: 0.0022138457279652357 2023-01-24 06:10:42.094992: step: 844/530, loss: 0.001904115080833435 2023-01-24 06:10:43.133464: step: 848/530, loss: 0.009070370346307755 2023-01-24 06:10:44.163782: step: 852/530, loss: 0.0078091854229569435 2023-01-24 06:10:45.193460: step: 856/530, loss: 0.006255922839045525 2023-01-24 06:10:46.255361: step: 860/530, loss: 0.004079470876604319 2023-01-24 06:10:47.295261: step: 864/530, loss: 0.024813443422317505 2023-01-24 06:10:48.328056: step: 868/530, loss: 0.009829799644649029 2023-01-24 06:10:49.355145: step: 872/530, loss: 0.0006468616193160415 2023-01-24 06:10:50.403046: step: 876/530, loss: 0.010373394005000591 2023-01-24 06:10:51.446741: step: 880/530, loss: 0.0077370535582304 2023-01-24 06:10:52.500995: step: 884/530, loss: 0.009096537716686726 2023-01-24 06:10:53.564278: step: 888/530, loss: 0.006196631584316492 2023-01-24 06:10:54.603129: step: 892/530, loss: 0.013388208113610744 2023-01-24 06:10:55.650858: step: 896/530, loss: 0.00273515866138041 2023-01-24 06:10:56.703240: step: 900/530, loss: 0.037651825696229935 2023-01-24 06:10:57.754755: step: 904/530, loss: 0.001838191761635244 2023-01-24 06:10:58.803925: step: 908/530, loss: 0.01699456200003624 2023-01-24 06:10:59.851809: step: 912/530, loss: 0.019773347303271294 2023-01-24 06:11:00.897330: step: 916/530, loss: 0.005390337202697992 2023-01-24 06:11:01.954938: step: 920/530, loss: 0.003894219407811761 2023-01-24 06:11:03.005190: step: 924/530, loss: 0.002449760679155588 2023-01-24 06:11:04.058358: step: 928/530, loss: 0.006844779476523399 2023-01-24 06:11:05.103811: step: 932/530, loss: 0.0027226568199694157 2023-01-24 06:11:06.155444: step: 936/530, loss: 0.0017901048995554447 2023-01-24 06:11:07.208007: step: 940/530, loss: 0.0005953708314336836 2023-01-24 06:11:08.277063: step: 944/530, loss: 0.006889801938086748 2023-01-24 06:11:09.327809: step: 948/530, loss: 0.009537424892187119 2023-01-24 06:11:10.383272: step: 952/530, loss: 0.0047201733104884624 2023-01-24 06:11:11.436216: step: 956/530, loss: 0.002545745112001896 2023-01-24 06:11:12.484364: step: 960/530, loss: 0.0071816653944551945 2023-01-24 06:11:13.534593: step: 964/530, loss: 0.0063903070986270905 2023-01-24 06:11:14.572288: step: 968/530, loss: 0.007996964268386364 2023-01-24 06:11:15.622219: step: 972/530, loss: 0.020088938996195793 2023-01-24 06:11:16.671139: step: 976/530, loss: 0.026697447523474693 2023-01-24 06:11:17.715657: step: 980/530, loss: 0.0035822000354528427 2023-01-24 06:11:18.772548: step: 984/530, loss: 0.05621730536222458 2023-01-24 06:11:19.822949: step: 988/530, loss: 0.0037705895956605673 2023-01-24 06:11:20.868727: step: 992/530, loss: 0.007121534086763859 2023-01-24 06:11:21.912798: step: 996/530, loss: 0.010187803767621517 2023-01-24 06:11:22.952449: step: 1000/530, loss: 0.004600352607667446 2023-01-24 06:11:23.994286: step: 1004/530, loss: 0.00710757402703166 2023-01-24 06:11:25.040272: step: 1008/530, loss: 0.013693444430828094 2023-01-24 06:11:26.087019: step: 1012/530, loss: 0.006806944962590933 2023-01-24 06:11:27.131250: step: 1016/530, loss: 0.005661698989570141 2023-01-24 06:11:28.169012: step: 1020/530, loss: 0.021601727232336998 2023-01-24 06:11:29.205727: step: 1024/530, loss: 0.0143333300948143 2023-01-24 06:11:30.250073: step: 1028/530, loss: 0.0030909921042621136 2023-01-24 06:11:31.287959: step: 1032/530, loss: 0.025878949090838432 2023-01-24 06:11:32.363178: step: 1036/530, loss: 0.022994389757514 2023-01-24 06:11:33.404754: step: 1040/530, loss: 0.007277947384864092 2023-01-24 06:11:34.435647: step: 1044/530, loss: 0.0001771945389918983 2023-01-24 06:11:35.480989: step: 1048/530, loss: 0.025386063382029533 2023-01-24 06:11:36.520526: step: 1052/530, loss: 0.013307204470038414 2023-01-24 06:11:37.576542: step: 1056/530, loss: 0.0018151187105104327 2023-01-24 06:11:38.613106: step: 1060/530, loss: 0.004172686021775007 2023-01-24 06:11:39.645193: step: 1064/530, loss: 0.008838359266519547 2023-01-24 06:11:40.685284: step: 1068/530, loss: 0.01083298772573471 2023-01-24 06:11:41.724924: step: 1072/530, loss: 0.023340122774243355 2023-01-24 06:11:42.752915: step: 1076/530, loss: 0.01825847290456295 2023-01-24 06:11:43.806036: step: 1080/530, loss: 0.005503007210791111 2023-01-24 06:11:44.852563: step: 1084/530, loss: 0.009955443441867828 2023-01-24 06:11:45.885537: step: 1088/530, loss: 0.004059256985783577 2023-01-24 06:11:46.917518: step: 1092/530, loss: 0.012757353484630585 2023-01-24 06:11:47.969923: step: 1096/530, loss: 0.019996175542473793 2023-01-24 06:11:49.006941: step: 1100/530, loss: 0.012939047068357468 2023-01-24 06:11:50.052185: step: 1104/530, loss: 0.0037144487723708153 2023-01-24 06:11:51.096003: step: 1108/530, loss: 0.008983484469354153 2023-01-24 06:11:52.155679: step: 1112/530, loss: 0.0027749284636229277 2023-01-24 06:11:53.194272: step: 1116/530, loss: 0.0632312148809433 2023-01-24 06:11:54.226899: step: 1120/530, loss: 0.010624143294990063 2023-01-24 06:11:55.263880: step: 1124/530, loss: 0.002980514196678996 2023-01-24 06:11:56.313861: step: 1128/530, loss: 0.029609989374876022 2023-01-24 06:11:57.359538: step: 1132/530, loss: 0.013118281029164791 2023-01-24 06:11:58.411109: step: 1136/530, loss: 0.0006186221726238728 2023-01-24 06:11:59.461791: step: 1140/530, loss: 0.00036158814327791333 2023-01-24 06:12:00.497544: step: 1144/530, loss: 0.00920632854104042 2023-01-24 06:12:01.534350: step: 1148/530, loss: 0.020401351153850555 2023-01-24 06:12:02.569048: step: 1152/530, loss: 0.0003302432014606893 2023-01-24 06:12:03.647307: step: 1156/530, loss: 0.021824853494763374 2023-01-24 06:12:04.695668: step: 1160/530, loss: 0.012219293043017387 2023-01-24 06:12:05.734939: step: 1164/530, loss: 0.013180164620280266 2023-01-24 06:12:06.776663: step: 1168/530, loss: 0.0035963330883532763 2023-01-24 06:12:07.814370: step: 1172/530, loss: 0.002271289238706231 2023-01-24 06:12:08.844069: step: 1176/530, loss: 0.02488148957490921 2023-01-24 06:12:09.882601: step: 1180/530, loss: 0.002901423256844282 2023-01-24 06:12:10.952480: step: 1184/530, loss: 0.0026070319581776857 2023-01-24 06:12:11.996075: step: 1188/530, loss: 0.0025322569999843836 2023-01-24 06:12:13.032395: step: 1192/530, loss: 0.0012351305922493339 2023-01-24 06:12:14.072334: step: 1196/530, loss: 0.011039367876946926 2023-01-24 06:12:15.113865: step: 1200/530, loss: 0.009021017700433731 2023-01-24 06:12:16.143800: step: 1204/530, loss: 0.002864608308300376 2023-01-24 06:12:17.194594: step: 1208/530, loss: 0.014229614287614822 2023-01-24 06:12:18.240426: step: 1212/530, loss: 0.02456767112016678 2023-01-24 06:12:19.284796: step: 1216/530, loss: 0.01543382741510868 2023-01-24 06:12:20.326092: step: 1220/530, loss: 0.004292861558496952 2023-01-24 06:12:21.364173: step: 1224/530, loss: 0.007197290658950806 2023-01-24 06:12:22.404509: step: 1228/530, loss: 0.01018136739730835 2023-01-24 06:12:23.446031: step: 1232/530, loss: 0.002991825109347701 2023-01-24 06:12:24.481755: step: 1236/530, loss: 0.022423578426241875 2023-01-24 06:12:25.531473: step: 1240/530, loss: 0.002303708577528596 2023-01-24 06:12:26.573560: step: 1244/530, loss: 0.021710142493247986 2023-01-24 06:12:27.638517: step: 1248/530, loss: 0.009048247709870338 2023-01-24 06:12:28.680155: step: 1252/530, loss: 0.035389285534620285 2023-01-24 06:12:29.730997: step: 1256/530, loss: 0.010742432437837124 2023-01-24 06:12:30.770973: step: 1260/530, loss: 0.010142643935978413 2023-01-24 06:12:31.806330: step: 1264/530, loss: 0.022211836650967598 2023-01-24 06:12:32.851780: step: 1268/530, loss: 0.007839965634047985 2023-01-24 06:12:33.890882: step: 1272/530, loss: 0.02114162966609001 2023-01-24 06:12:34.923338: step: 1276/530, loss: 0.013651162385940552 2023-01-24 06:12:35.964399: step: 1280/530, loss: 0.005986716598272324 2023-01-24 06:12:37.011473: step: 1284/530, loss: 0.017527097836136818 2023-01-24 06:12:38.048885: step: 1288/530, loss: 0.004508642479777336 2023-01-24 06:12:39.088631: step: 1292/530, loss: 0.04023851826786995 2023-01-24 06:12:40.117536: step: 1296/530, loss: 0.006751182954758406 2023-01-24 06:12:41.172995: step: 1300/530, loss: 0.016403554007411003 2023-01-24 06:12:42.224493: step: 1304/530, loss: 0.0015220451168715954 2023-01-24 06:12:43.268125: step: 1308/530, loss: 0.004788473714143038 2023-01-24 06:12:44.319193: step: 1312/530, loss: 0.010849830694496632 2023-01-24 06:12:45.362818: step: 1316/530, loss: 0.004726604092866182 2023-01-24 06:12:46.401537: step: 1320/530, loss: 0.026048095896840096 2023-01-24 06:12:47.454647: step: 1324/530, loss: 0.02229171432554722 2023-01-24 06:12:48.504084: step: 1328/530, loss: 0.0006768946768715978 2023-01-24 06:12:49.535864: step: 1332/530, loss: 0.0069791232235729694 2023-01-24 06:12:50.579634: step: 1336/530, loss: 0.0015911575173959136 2023-01-24 06:12:51.626733: step: 1340/530, loss: 0.0032544168643653393 2023-01-24 06:12:52.662376: step: 1344/530, loss: 0.005280646961182356 2023-01-24 06:12:53.705739: step: 1348/530, loss: 0.00202184752561152 2023-01-24 06:12:54.749097: step: 1352/530, loss: 0.0004644987639039755 2023-01-24 06:12:55.794619: step: 1356/530, loss: 0.010267892852425575 2023-01-24 06:12:56.844608: step: 1360/530, loss: 0.003436907660216093 2023-01-24 06:12:57.892701: step: 1364/530, loss: 0.00423907907679677 2023-01-24 06:12:58.938251: step: 1368/530, loss: 0.019025731831789017 2023-01-24 06:12:59.980352: step: 1372/530, loss: 0.00795195996761322 2023-01-24 06:13:01.018202: step: 1376/530, loss: 3.6636803997680545e-05 2023-01-24 06:13:02.081892: step: 1380/530, loss: 0.004467297345399857 2023-01-24 06:13:03.138022: step: 1384/530, loss: 0.00039880044641904533 2023-01-24 06:13:04.204148: step: 1388/530, loss: 0.0064514027908444405 2023-01-24 06:13:05.240155: step: 1392/530, loss: 0.0030811401084065437 2023-01-24 06:13:06.296284: step: 1396/530, loss: 0.004701836965978146 2023-01-24 06:13:07.336228: step: 1400/530, loss: 0.0043533421121537685 2023-01-24 06:13:08.376591: step: 1404/530, loss: 0.01922466792166233 2023-01-24 06:13:09.412041: step: 1408/530, loss: 0.006513860542327166 2023-01-24 06:13:10.456654: step: 1412/530, loss: 0.057321395725011826 2023-01-24 06:13:11.510976: step: 1416/530, loss: 0.0027382546104490757 2023-01-24 06:13:12.575027: step: 1420/530, loss: 0.018424641340970993 2023-01-24 06:13:13.606668: step: 1424/530, loss: 0.004779089242219925 2023-01-24 06:13:14.645238: step: 1428/530, loss: 0.002440408570691943 2023-01-24 06:13:15.677018: step: 1432/530, loss: 0.01081522461026907 2023-01-24 06:13:16.715305: step: 1436/530, loss: 0.0016349562210962176 2023-01-24 06:13:17.747547: step: 1440/530, loss: 0.018720485270023346 2023-01-24 06:13:18.799687: step: 1444/530, loss: 0.009044265374541283 2023-01-24 06:13:19.848995: step: 1448/530, loss: 0.011946936137974262 2023-01-24 06:13:20.896100: step: 1452/530, loss: 0.0019487175159156322 2023-01-24 06:13:21.942811: step: 1456/530, loss: 0.05007105693221092 2023-01-24 06:13:22.981664: step: 1460/530, loss: 0.02294820360839367 2023-01-24 06:13:24.034040: step: 1464/530, loss: 0.016945742070674896 2023-01-24 06:13:25.068251: step: 1468/530, loss: 0.004874739795923233 2023-01-24 06:13:26.125853: step: 1472/530, loss: 0.00848757941275835 2023-01-24 06:13:27.172123: step: 1476/530, loss: 0.005451865494251251 2023-01-24 06:13:28.201751: step: 1480/530, loss: 0.002858688123524189 2023-01-24 06:13:29.254839: step: 1484/530, loss: 0.009365770034492016 2023-01-24 06:13:30.296908: step: 1488/530, loss: 0.01442341972142458 2023-01-24 06:13:31.327232: step: 1492/530, loss: 0.00444852514192462 2023-01-24 06:13:32.356536: step: 1496/530, loss: 0.0044186906889081 2023-01-24 06:13:33.390259: step: 1500/530, loss: 0.002757208188995719 2023-01-24 06:13:34.459485: step: 1504/530, loss: 0.009161938913166523 2023-01-24 06:13:35.490704: step: 1508/530, loss: 0.006433708593249321 2023-01-24 06:13:36.538888: step: 1512/530, loss: 0.011822265572845936 2023-01-24 06:13:37.584203: step: 1516/530, loss: 0.01151095051318407 2023-01-24 06:13:38.631243: step: 1520/530, loss: 0.004070369992405176 2023-01-24 06:13:39.683999: step: 1524/530, loss: 0.002289979485794902 2023-01-24 06:13:40.727422: step: 1528/530, loss: 0.0016516131581738591 2023-01-24 06:13:41.764052: step: 1532/530, loss: 0.0033080594148486853 2023-01-24 06:13:42.819479: step: 1536/530, loss: 0.015890631824731827 2023-01-24 06:13:43.875242: step: 1540/530, loss: 0.0019086874090135098 2023-01-24 06:13:44.935073: step: 1544/530, loss: 0.02645191363990307 2023-01-24 06:13:45.977466: step: 1548/530, loss: 0.005352192558348179 2023-01-24 06:13:47.012642: step: 1552/530, loss: 0.0018773925257846713 2023-01-24 06:13:48.047881: step: 1556/530, loss: 0.004711862187832594 2023-01-24 06:13:49.087884: step: 1560/530, loss: 0.007976806722581387 2023-01-24 06:13:50.128722: step: 1564/530, loss: 0.009661748073995113 2023-01-24 06:13:51.195312: step: 1568/530, loss: 0.006966938264667988 2023-01-24 06:13:52.228250: step: 1572/530, loss: 0.005844578146934509 2023-01-24 06:13:53.279355: step: 1576/530, loss: 0.02175166830420494 2023-01-24 06:13:54.330071: step: 1580/530, loss: 0.010553802363574505 2023-01-24 06:13:55.386580: step: 1584/530, loss: 0.018760759383440018 2023-01-24 06:13:56.429721: step: 1588/530, loss: 0.008100664243102074 2023-01-24 06:13:57.470369: step: 1592/530, loss: 0.002234217943623662 2023-01-24 06:13:58.515005: step: 1596/530, loss: 0.006893356796354055 2023-01-24 06:13:59.559233: step: 1600/530, loss: 0.006318795960396528 2023-01-24 06:14:00.600503: step: 1604/530, loss: 0.00822544563561678 2023-01-24 06:14:01.633450: step: 1608/530, loss: 0.008038416504859924 2023-01-24 06:14:02.691985: step: 1612/530, loss: 0.01708037406206131 2023-01-24 06:14:03.735852: step: 1616/530, loss: 0.006844771560281515 2023-01-24 06:14:04.765951: step: 1620/530, loss: 0.05640245974063873 2023-01-24 06:14:05.819058: step: 1624/530, loss: 0.011180452071130276 2023-01-24 06:14:06.860733: step: 1628/530, loss: 0.041737161576747894 2023-01-24 06:14:07.909220: step: 1632/530, loss: 0.004179058596491814 2023-01-24 06:14:08.946885: step: 1636/530, loss: 0.004697559867054224 2023-01-24 06:14:10.009227: step: 1640/530, loss: 0.04130321368575096 2023-01-24 06:14:11.066207: step: 1644/530, loss: 0.01205145101994276 2023-01-24 06:14:12.100189: step: 1648/530, loss: 0.01519062276929617 2023-01-24 06:14:13.161742: step: 1652/530, loss: 0.006274986546486616 2023-01-24 06:14:14.202890: step: 1656/530, loss: 0.02690383791923523 2023-01-24 06:14:15.235136: step: 1660/530, loss: 0.0022225563880056143 2023-01-24 06:14:16.284568: step: 1664/530, loss: 0.012799485586583614 2023-01-24 06:14:17.315766: step: 1668/530, loss: 0.013212735764682293 2023-01-24 06:14:18.347369: step: 1672/530, loss: 0.04080083221197128 2023-01-24 06:14:19.393040: step: 1676/530, loss: 0.005913273897022009 2023-01-24 06:14:20.448541: step: 1680/530, loss: 0.015069507993757725 2023-01-24 06:14:21.485129: step: 1684/530, loss: 0.004546095617115498 2023-01-24 06:14:22.516115: step: 1688/530, loss: 0.007551766466349363 2023-01-24 06:14:23.553221: step: 1692/530, loss: 0.010521274991333485 2023-01-24 06:14:24.593799: step: 1696/530, loss: 0.006171573884785175 2023-01-24 06:14:25.641490: step: 1700/530, loss: 0.03709413856267929 2023-01-24 06:14:26.676250: step: 1704/530, loss: 0.0009492139797657728 2023-01-24 06:14:27.724448: step: 1708/530, loss: 0.005416674539446831 2023-01-24 06:14:28.757405: step: 1712/530, loss: 0.0021202301140874624 2023-01-24 06:14:29.793717: step: 1716/530, loss: 0.0019722450524568558 2023-01-24 06:14:30.835280: step: 1720/530, loss: 0.014917327091097832 2023-01-24 06:14:31.877374: step: 1724/530, loss: 0.008332163095474243 2023-01-24 06:14:32.949978: step: 1728/530, loss: 0.009225474670529366 2023-01-24 06:14:33.997875: step: 1732/530, loss: 0.001848805695772171 2023-01-24 06:14:35.037747: step: 1736/530, loss: 0.013050920329988003 2023-01-24 06:14:36.085616: step: 1740/530, loss: 0.0025201637763530016 2023-01-24 06:14:37.140781: step: 1744/530, loss: 0.004326107446104288 2023-01-24 06:14:38.188625: step: 1748/530, loss: 0.005695197265595198 2023-01-24 06:14:39.242299: step: 1752/530, loss: 0.012486633844673634 2023-01-24 06:14:40.295891: step: 1756/530, loss: 0.006287648808211088 2023-01-24 06:14:41.339163: step: 1760/530, loss: 0.019704468548297882 2023-01-24 06:14:42.374165: step: 1764/530, loss: 0.005859240423887968 2023-01-24 06:14:43.422450: step: 1768/530, loss: 0.0019336638506501913 2023-01-24 06:14:44.480643: step: 1772/530, loss: 0.005709787365049124 2023-01-24 06:14:45.536525: step: 1776/530, loss: 0.003635913133621216 2023-01-24 06:14:46.591363: step: 1780/530, loss: 0.005575036630034447 2023-01-24 06:14:47.638066: step: 1784/530, loss: 0.0020982197020202875 2023-01-24 06:14:48.664070: step: 1788/530, loss: 0.02108420990407467 2023-01-24 06:14:49.709685: step: 1792/530, loss: 0.005897968076169491 2023-01-24 06:14:50.740405: step: 1796/530, loss: 0.006525702774524689 2023-01-24 06:14:51.786074: step: 1800/530, loss: 0.00445253262296319 2023-01-24 06:14:52.841608: step: 1804/530, loss: 0.013924259692430496 2023-01-24 06:14:53.888697: step: 1808/530, loss: 0.04297326132655144 2023-01-24 06:14:54.926917: step: 1812/530, loss: 0.004864335525780916 2023-01-24 06:14:55.964681: step: 1816/530, loss: 0.012600874528288841 2023-01-24 06:14:57.010898: step: 1820/530, loss: 0.011261162348091602 2023-01-24 06:14:58.074625: step: 1824/530, loss: 0.01003257930278778 2023-01-24 06:14:59.138280: step: 1828/530, loss: 0.007177611812949181 2023-01-24 06:15:00.192577: step: 1832/530, loss: 0.005457644816488028 2023-01-24 06:15:01.229888: step: 1836/530, loss: 0.010346289724111557 2023-01-24 06:15:02.292289: step: 1840/530, loss: 0.02937886118888855 2023-01-24 06:15:03.336468: step: 1844/530, loss: 0.009209373965859413 2023-01-24 06:15:04.392159: step: 1848/530, loss: 0.009007374756038189 2023-01-24 06:15:05.419497: step: 1852/530, loss: 0.010204768739640713 2023-01-24 06:15:06.461307: step: 1856/530, loss: 0.005483309272676706 2023-01-24 06:15:07.489912: step: 1860/530, loss: 0.0017381259240210056 2023-01-24 06:15:08.550138: step: 1864/530, loss: 0.0029665653128176928 2023-01-24 06:15:09.589866: step: 1868/530, loss: 0.0047257947735488415 2023-01-24 06:15:10.628010: step: 1872/530, loss: 0.003776599420234561 2023-01-24 06:15:11.683223: step: 1876/530, loss: 0.008062978275120258 2023-01-24 06:15:12.730016: step: 1880/530, loss: 0.008315728977322578 2023-01-24 06:15:13.768868: step: 1884/530, loss: 0.0033979981672018766 2023-01-24 06:15:14.815690: step: 1888/530, loss: 0.010533134452998638 2023-01-24 06:15:15.857833: step: 1892/530, loss: 0.019899064674973488 2023-01-24 06:15:16.898459: step: 1896/530, loss: 0.0027368925511837006 2023-01-24 06:15:17.940665: step: 1900/530, loss: 0.04092983528971672 2023-01-24 06:15:19.000391: step: 1904/530, loss: 0.00851442664861679 2023-01-24 06:15:20.040328: step: 1908/530, loss: 0.02917405776679516 2023-01-24 06:15:21.073226: step: 1912/530, loss: 0.01269491482526064 2023-01-24 06:15:22.125134: step: 1916/530, loss: 0.007485529407858849 2023-01-24 06:15:23.200572: step: 1920/530, loss: 0.004053287208080292 2023-01-24 06:15:24.251419: step: 1924/530, loss: 0.0034167389385402203 2023-01-24 06:15:25.292144: step: 1928/530, loss: 0.00985283125191927 2023-01-24 06:15:26.337982: step: 1932/530, loss: 0.004041532054543495 2023-01-24 06:15:27.371256: step: 1936/530, loss: 0.007994909770786762 2023-01-24 06:15:28.414670: step: 1940/530, loss: 0.06089195981621742 2023-01-24 06:15:29.454422: step: 1944/530, loss: 0.004458821844309568 2023-01-24 06:15:30.478905: step: 1948/530, loss: 0.004738977644592524 2023-01-24 06:15:31.522302: step: 1952/530, loss: 0.01475786603987217 2023-01-24 06:15:32.576584: step: 1956/530, loss: 0.024411706253886223 2023-01-24 06:15:33.634720: step: 1960/530, loss: 0.011239174753427505 2023-01-24 06:15:34.694255: step: 1964/530, loss: 0.031950339674949646 2023-01-24 06:15:35.744288: step: 1968/530, loss: 0.031904272735118866 2023-01-24 06:15:36.777906: step: 1972/530, loss: 0.003503339132294059 2023-01-24 06:15:37.831717: step: 1976/530, loss: 0.0022566267289221287 2023-01-24 06:15:38.881102: step: 1980/530, loss: 0.022635025903582573 2023-01-24 06:15:39.927359: step: 1984/530, loss: 0.014758494682610035 2023-01-24 06:15:40.986900: step: 1988/530, loss: 0.002663377206772566 2023-01-24 06:15:42.044002: step: 1992/530, loss: 0.004463164601475 2023-01-24 06:15:43.094955: step: 1996/530, loss: 0.005761934909969568 2023-01-24 06:15:44.139041: step: 2000/530, loss: 0.006272409576922655 2023-01-24 06:15:45.186524: step: 2004/530, loss: 0.0031166779808700085 2023-01-24 06:15:46.238911: step: 2008/530, loss: 0.012926271185278893 2023-01-24 06:15:47.277042: step: 2012/530, loss: 0.01276963111013174 2023-01-24 06:15:48.316654: step: 2016/530, loss: 0.002114873146638274 2023-01-24 06:15:49.350621: step: 2020/530, loss: 0.011003976687788963 2023-01-24 06:15:50.405882: step: 2024/530, loss: 0.0037110212724655867 2023-01-24 06:15:51.450348: step: 2028/530, loss: 0.04115549474954605 2023-01-24 06:15:52.494779: step: 2032/530, loss: 0.0006640140782110393 2023-01-24 06:15:53.540747: step: 2036/530, loss: 0.0007594458875246346 2023-01-24 06:15:54.583789: step: 2040/530, loss: 0.003376855980604887 2023-01-24 06:15:55.629286: step: 2044/530, loss: 0.012279235757887363 2023-01-24 06:15:56.727935: step: 2048/530, loss: 0.00034014126867987216 2023-01-24 06:15:57.781358: step: 2052/530, loss: 0.000714337860699743 2023-01-24 06:15:58.822260: step: 2056/530, loss: 0.0021405701991170645 2023-01-24 06:15:59.867810: step: 2060/530, loss: 0.005742653273046017 2023-01-24 06:16:00.918123: step: 2064/530, loss: 0.0018683884991332889 2023-01-24 06:16:01.999570: step: 2068/530, loss: 0.0021885179448872805 2023-01-24 06:16:03.031134: step: 2072/530, loss: 0.001408782321959734 2023-01-24 06:16:04.087934: step: 2076/530, loss: 0.001911174738779664 2023-01-24 06:16:05.136543: step: 2080/530, loss: 0.00855308212339878 2023-01-24 06:16:06.180678: step: 2084/530, loss: 0.010563374496996403 2023-01-24 06:16:07.230776: step: 2088/530, loss: 0.004736981354653835 2023-01-24 06:16:08.276042: step: 2092/530, loss: 0.0024413892533630133 2023-01-24 06:16:09.331847: step: 2096/530, loss: 0.0101556908339262 2023-01-24 06:16:10.368963: step: 2100/530, loss: 0.00508415512740612 2023-01-24 06:16:11.437955: step: 2104/530, loss: 0.004340960178524256 2023-01-24 06:16:12.473573: step: 2108/530, loss: 0.010126103647053242 2023-01-24 06:16:13.520334: step: 2112/530, loss: 0.024528298527002335 2023-01-24 06:16:14.556834: step: 2116/530, loss: 0.00544694671407342 2023-01-24 06:16:15.608155: step: 2120/530, loss: 0.007919400930404663 ================================================== Loss: 0.010 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37704166666666666, 'r': 0.32195208728652747, 'f1': 0.3473259979529171}, 'combined': 0.25592441954425466, 'stategy': 1, 'epoch': 6} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37621134584593835, 'r': 0.3907342102995499, 'f1': 0.3833352757492428}, 'combined': 0.29713069220754706, 'stategy': 1, 'epoch': 6} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3901686065051021, 'r': 0.3316803334236921, 'f1': 0.3585549450549451}, 'combined': 0.26419838056680167, 'stategy': 1, 'epoch': 6} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.372921689895649, 'r': 0.369151341927954, 'f1': 0.37102693766061334}, 'combined': 0.2875902578996142, 'stategy': 1, 'epoch': 6} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38162687387231753, 'r': 0.33093639726688634, 'f1': 0.3544786206496933}, 'combined': 0.2611947731103003, 'stategy': 1, 'epoch': 6} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36231071373713714, 'r': 0.36231071373713714, 'f1': 0.3623107137371372}, 'combined': 0.280834141748403, 'stategy': 1, 'epoch': 6} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 6} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5, 'r': 0.41304347826086957, 'f1': 0.45238095238095233}, 'combined': 0.22619047619047616, 'stategy': 1, 'epoch': 6} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 6} New best chinese model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37704166666666666, 'r': 0.32195208728652747, 'f1': 0.3473259979529171}, 'combined': 0.25592441954425466, 'stategy': 1, 'epoch': 6} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37621134584593835, 'r': 0.3907342102995499, 'f1': 0.3833352757492428}, 'combined': 0.29713069220754706, 'stategy': 1, 'epoch': 6} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 6} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38236684276980326, 'r': 0.33520584698225636, 'f1': 0.35723656493356754}, 'combined': 0.2632269425826287, 'stategy': 1, 'epoch': 1} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3561820350737081, 'r': 0.35978314020772534, 'f1': 0.35797353136351645}, 'combined': 0.27747230660712763, 'stategy': 1, 'epoch': 1} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 1} ****************************** Epoch: 7 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 06:18:45.534154: step: 4/530, loss: 0.011587036773562431 2023-01-24 06:18:46.596285: step: 8/530, loss: 0.008058561012148857 2023-01-24 06:18:47.644099: step: 12/530, loss: 0.009622877463698387 2023-01-24 06:18:48.672627: step: 16/530, loss: 0.00474189966917038 2023-01-24 06:18:49.698202: step: 20/530, loss: 0.017884546890854836 2023-01-24 06:18:50.737025: step: 24/530, loss: 0.012270621955394745 2023-01-24 06:18:51.780404: step: 28/530, loss: 0.024582723155617714 2023-01-24 06:18:52.816111: step: 32/530, loss: 0.0006849112687632442 2023-01-24 06:18:53.861932: step: 36/530, loss: 0.012950761243700981 2023-01-24 06:18:54.911544: step: 40/530, loss: 0.00873364694416523 2023-01-24 06:18:55.941508: step: 44/530, loss: 0.0024029721971601248 2023-01-24 06:18:56.983256: step: 48/530, loss: 5.633518594549969e-05 2023-01-24 06:18:58.032404: step: 52/530, loss: 0.002093082293868065 2023-01-24 06:18:59.072284: step: 56/530, loss: 0.003843276994302869 2023-01-24 06:19:00.109846: step: 60/530, loss: 0.003618384012952447 2023-01-24 06:19:01.152046: step: 64/530, loss: 0.03478454798460007 2023-01-24 06:19:02.196425: step: 68/530, loss: 0.008315201848745346 2023-01-24 06:19:03.251491: step: 72/530, loss: 0.002127622254192829 2023-01-24 06:19:04.306681: step: 76/530, loss: 0.006504325661808252 2023-01-24 06:19:05.340455: step: 80/530, loss: 0.0010370308300480247 2023-01-24 06:19:06.376952: step: 84/530, loss: 0.005459685809910297 2023-01-24 06:19:07.423524: step: 88/530, loss: 0.010153745301067829 2023-01-24 06:19:08.457598: step: 92/530, loss: 0.008685597218573093 2023-01-24 06:19:09.505977: step: 96/530, loss: 0.0016931957798078656 2023-01-24 06:19:10.545429: step: 100/530, loss: 0.0009202314540743828 2023-01-24 06:19:11.577916: step: 104/530, loss: 0.009704441763460636 2023-01-24 06:19:12.619857: step: 108/530, loss: 0.02716992050409317 2023-01-24 06:19:13.670318: step: 112/530, loss: 0.0056611159816384315 2023-01-24 06:19:14.702129: step: 116/530, loss: 0.0019131782464683056 2023-01-24 06:19:15.742587: step: 120/530, loss: 0.008631687611341476 2023-01-24 06:19:16.788051: step: 124/530, loss: 0.00399860879406333 2023-01-24 06:19:17.830876: step: 128/530, loss: 0.005334592889994383 2023-01-24 06:19:18.865127: step: 132/530, loss: 0.014294576831161976 2023-01-24 06:19:19.912578: step: 136/530, loss: 0.017037982121109962 2023-01-24 06:19:20.957568: step: 140/530, loss: 0.00272139860317111 2023-01-24 06:19:21.998000: step: 144/530, loss: 0.03012244403362274 2023-01-24 06:19:23.059209: step: 148/530, loss: 0.001278023119084537 2023-01-24 06:19:24.105297: step: 152/530, loss: 0.0034183640964329243 2023-01-24 06:19:25.150581: step: 156/530, loss: 0.0046643540263175964 2023-01-24 06:19:26.196183: step: 160/530, loss: 0.007372661028057337 2023-01-24 06:19:27.239841: step: 164/530, loss: 0.0008810541476123035 2023-01-24 06:19:28.282649: step: 168/530, loss: 0.009536619298160076 2023-01-24 06:19:29.335324: step: 172/530, loss: 0.002241946989670396 2023-01-24 06:19:30.372307: step: 176/530, loss: 0.003911525011062622 2023-01-24 06:19:31.412154: step: 180/530, loss: 0.0025393657851964235 2023-01-24 06:19:32.458826: step: 184/530, loss: 0.004790137056261301 2023-01-24 06:19:33.490635: step: 188/530, loss: 0.00042702045175246894 2023-01-24 06:19:34.539214: step: 192/530, loss: 0.004295692313462496 2023-01-24 06:19:35.581768: step: 196/530, loss: 0.0034668322186917067 2023-01-24 06:19:36.622040: step: 200/530, loss: 0.01009513158351183 2023-01-24 06:19:37.650331: step: 204/530, loss: 0.006042029242962599 2023-01-24 06:19:38.699094: step: 208/530, loss: 0.015337937511503696 2023-01-24 06:19:39.736756: step: 212/530, loss: 0.0026511764153838158 2023-01-24 06:19:40.791985: step: 216/530, loss: 0.003912328276783228 2023-01-24 06:19:41.830865: step: 220/530, loss: 0.0022922749631106853 2023-01-24 06:19:42.879382: step: 224/530, loss: 0.012015871703624725 2023-01-24 06:19:43.931677: step: 228/530, loss: 0.00681014871224761 2023-01-24 06:19:44.986790: step: 232/530, loss: 0.0022635767236351967 2023-01-24 06:19:46.029484: step: 236/530, loss: 0.014557711780071259 2023-01-24 06:19:47.080633: step: 240/530, loss: 0.005466057453304529 2023-01-24 06:19:48.127347: step: 244/530, loss: 0.0012775585055351257 2023-01-24 06:19:49.171343: step: 248/530, loss: 0.01565469801425934 2023-01-24 06:19:50.229969: step: 252/530, loss: 0.004362897947430611 2023-01-24 06:19:51.312412: step: 256/530, loss: 0.02090446650981903 2023-01-24 06:19:52.353558: step: 260/530, loss: 0.011011134833097458 2023-01-24 06:19:53.401336: step: 264/530, loss: 0.0014319868059828877 2023-01-24 06:19:54.458631: step: 268/530, loss: 0.006045954301953316 2023-01-24 06:19:55.497561: step: 272/530, loss: 0.0225754976272583 2023-01-24 06:19:56.544460: step: 276/530, loss: 0.0027312817983329296 2023-01-24 06:19:57.592199: step: 280/530, loss: 0.0006080306484363973 2023-01-24 06:19:58.628757: step: 284/530, loss: 0.0031787727493792772 2023-01-24 06:19:59.678293: step: 288/530, loss: 6.515099084936082e-05 2023-01-24 06:20:00.729821: step: 292/530, loss: 0.00177150743547827 2023-01-24 06:20:01.808220: step: 296/530, loss: 0.0148751987144351 2023-01-24 06:20:02.861455: step: 300/530, loss: 0.026419559493660927 2023-01-24 06:20:03.916953: step: 304/530, loss: 0.0022575596813112497 2023-01-24 06:20:04.973569: step: 308/530, loss: 0.005201238207519054 2023-01-24 06:20:06.029367: step: 312/530, loss: 0.0711824893951416 2023-01-24 06:20:07.073988: step: 316/530, loss: 0.005875852424651384 2023-01-24 06:20:08.112881: step: 320/530, loss: 0.0016077982727438211 2023-01-24 06:20:09.151109: step: 324/530, loss: 0.002177596092224121 2023-01-24 06:20:10.203154: step: 328/530, loss: 0.0152108334004879 2023-01-24 06:20:11.235279: step: 332/530, loss: 0.001335029024630785 2023-01-24 06:20:12.274868: step: 336/530, loss: 0.00045931493514217436 2023-01-24 06:20:13.321061: step: 340/530, loss: 0.002613889053463936 2023-01-24 06:20:14.364401: step: 344/530, loss: 0.0006383536383509636 2023-01-24 06:20:15.406334: step: 348/530, loss: 0.0064877974800765514 2023-01-24 06:20:16.450380: step: 352/530, loss: 0.0014528051251545548 2023-01-24 06:20:17.505469: step: 356/530, loss: 0.007218583486974239 2023-01-24 06:20:18.543393: step: 360/530, loss: 0.002755946945399046 2023-01-24 06:20:19.592519: step: 364/530, loss: 0.003286286722868681 2023-01-24 06:20:20.619513: step: 368/530, loss: 0.00666410569101572 2023-01-24 06:20:21.646710: step: 372/530, loss: 0.0016173524782061577 2023-01-24 06:20:22.762148: step: 376/530, loss: 0.008841770701110363 2023-01-24 06:20:23.820590: step: 380/530, loss: 0.0210097823292017 2023-01-24 06:20:24.882511: step: 384/530, loss: 0.0037013778928667307 2023-01-24 06:20:25.934221: step: 388/530, loss: 0.058689914643764496 2023-01-24 06:20:26.985031: step: 392/530, loss: 0.01135192159563303 2023-01-24 06:20:28.045638: step: 396/530, loss: 0.0011508228490129113 2023-01-24 06:20:29.078690: step: 400/530, loss: 0.013402036391198635 2023-01-24 06:20:30.129722: step: 404/530, loss: 0.00433835806325078 2023-01-24 06:20:31.181611: step: 408/530, loss: 0.005923935677856207 2023-01-24 06:20:32.229222: step: 412/530, loss: 0.0013145239790901542 2023-01-24 06:20:33.275601: step: 416/530, loss: 0.014649472199380398 2023-01-24 06:20:34.330521: step: 420/530, loss: 0.002501662587746978 2023-01-24 06:20:35.363183: step: 424/530, loss: 0.00226204888895154 2023-01-24 06:20:36.402492: step: 428/530, loss: 0.005570810753852129 2023-01-24 06:20:37.450124: step: 432/530, loss: 0.0018400277476757765 2023-01-24 06:20:38.504221: step: 436/530, loss: 0.0057077002711594105 2023-01-24 06:20:39.548654: step: 440/530, loss: 0.0029061168897897005 2023-01-24 06:20:40.626339: step: 444/530, loss: 0.004631864372640848 2023-01-24 06:20:41.677792: step: 448/530, loss: 0.013594035059213638 2023-01-24 06:20:42.720290: step: 452/530, loss: 0.006473762448877096 2023-01-24 06:20:43.770809: step: 456/530, loss: 0.024219676852226257 2023-01-24 06:20:44.815338: step: 460/530, loss: 0.01045110821723938 2023-01-24 06:20:45.872568: step: 464/530, loss: 0.0012683115201070905 2023-01-24 06:20:46.915317: step: 468/530, loss: 0.027867794036865234 2023-01-24 06:20:47.962951: step: 472/530, loss: 0.01294589415192604 2023-01-24 06:20:49.014513: step: 476/530, loss: 0.009049591608345509 2023-01-24 06:20:50.056586: step: 480/530, loss: 0.0025234143249690533 2023-01-24 06:20:51.113305: step: 484/530, loss: 0.0033417821396142244 2023-01-24 06:20:52.174272: step: 488/530, loss: 0.014079265296459198 2023-01-24 06:20:53.207316: step: 492/530, loss: 0.0033510210923850536 2023-01-24 06:20:54.263880: step: 496/530, loss: 0.0005681717302650213 2023-01-24 06:20:55.292426: step: 500/530, loss: 0.011738928966224194 2023-01-24 06:20:56.344336: step: 504/530, loss: 0.0186759103089571 2023-01-24 06:20:57.396663: step: 508/530, loss: 0.003980475943535566 2023-01-24 06:20:58.433876: step: 512/530, loss: 0.008400819264352322 2023-01-24 06:20:59.482359: step: 516/530, loss: 0.007605388760566711 2023-01-24 06:21:00.545060: step: 520/530, loss: 0.009616143070161343 2023-01-24 06:21:01.591064: step: 524/530, loss: 0.003983595408499241 2023-01-24 06:21:02.645598: step: 528/530, loss: 0.006217450834810734 2023-01-24 06:21:03.702915: step: 532/530, loss: 0.00698980875313282 2023-01-24 06:21:04.749013: step: 536/530, loss: 0.010664377361536026 2023-01-24 06:21:05.793238: step: 540/530, loss: 0.0032485490664839745 2023-01-24 06:21:06.862983: step: 544/530, loss: 0.022555796429514885 2023-01-24 06:21:07.921085: step: 548/530, loss: 0.01435762643814087 2023-01-24 06:21:08.966718: step: 552/530, loss: 0.004576300270855427 2023-01-24 06:21:10.017544: step: 556/530, loss: 0.002943630563095212 2023-01-24 06:21:11.071708: step: 560/530, loss: 0.002787049161270261 2023-01-24 06:21:12.118309: step: 564/530, loss: 0.007462665904313326 2023-01-24 06:21:13.168326: step: 568/530, loss: 0.011899206787347794 2023-01-24 06:21:14.234052: step: 572/530, loss: 0.0024678679183125496 2023-01-24 06:21:15.272101: step: 576/530, loss: 0.003009113483130932 2023-01-24 06:21:16.310854: step: 580/530, loss: 0.011800347827374935 2023-01-24 06:21:17.348533: step: 584/530, loss: 0.014704861678183079 2023-01-24 06:21:18.384510: step: 588/530, loss: 1.7893730728246737e-06 2023-01-24 06:21:19.438894: step: 592/530, loss: 0.019476916640996933 2023-01-24 06:21:20.486527: step: 596/530, loss: 0.00475380988791585 2023-01-24 06:21:21.529615: step: 600/530, loss: 0.010056141763925552 2023-01-24 06:21:22.573712: step: 604/530, loss: 0.016903912648558617 2023-01-24 06:21:23.625290: step: 608/530, loss: 0.018231775611639023 2023-01-24 06:21:24.679456: step: 612/530, loss: 0.012347852811217308 2023-01-24 06:21:25.718137: step: 616/530, loss: 0.005395600106567144 2023-01-24 06:21:26.752985: step: 620/530, loss: 0.004717149306088686 2023-01-24 06:21:27.802376: step: 624/530, loss: 0.12797679007053375 2023-01-24 06:21:28.845092: step: 628/530, loss: 0.00015378544048871845 2023-01-24 06:21:29.892454: step: 632/530, loss: 0.03753596544265747 2023-01-24 06:21:30.919343: step: 636/530, loss: 0.0038369777612388134 2023-01-24 06:21:31.959161: step: 640/530, loss: 0.002048106398433447 2023-01-24 06:21:33.006582: step: 644/530, loss: 0.0035770984832197428 2023-01-24 06:21:34.061818: step: 648/530, loss: 0.004911252297461033 2023-01-24 06:21:35.119303: step: 652/530, loss: 0.014666815288364887 2023-01-24 06:21:36.162012: step: 656/530, loss: 0.026117080822587013 2023-01-24 06:21:37.194012: step: 660/530, loss: 0.00010257835674565285 2023-01-24 06:21:38.238038: step: 664/530, loss: 0.0025673743803054094 2023-01-24 06:21:39.273653: step: 668/530, loss: 0.0013420850737020373 2023-01-24 06:21:40.308239: step: 672/530, loss: 0.014642364345490932 2023-01-24 06:21:41.347699: step: 676/530, loss: 0.00024920047144405544 2023-01-24 06:21:42.392406: step: 680/530, loss: 0.0008633178658783436 2023-01-24 06:21:43.448934: step: 684/530, loss: 0.024829626083374023 2023-01-24 06:21:44.499085: step: 688/530, loss: 0.0017917653312906623 2023-01-24 06:21:45.547719: step: 692/530, loss: 0.014723587781190872 2023-01-24 06:21:46.592733: step: 696/530, loss: 0.007423742208629847 2023-01-24 06:21:47.633577: step: 700/530, loss: 0.006035512313246727 2023-01-24 06:21:48.685013: step: 704/530, loss: 0.013542910106480122 2023-01-24 06:21:49.728499: step: 708/530, loss: 0.005212020128965378 2023-01-24 06:21:50.769846: step: 712/530, loss: 0.006673903204500675 2023-01-24 06:21:51.801588: step: 716/530, loss: 0.005888357292860746 2023-01-24 06:21:52.822832: step: 720/530, loss: 0.001742396503686905 2023-01-24 06:21:53.886178: step: 724/530, loss: 0.009401286020874977 2023-01-24 06:21:54.938379: step: 728/530, loss: 0.01121896505355835 2023-01-24 06:21:55.975843: step: 732/530, loss: 0.0128102358430624 2023-01-24 06:21:57.007881: step: 736/530, loss: 0.005448071751743555 2023-01-24 06:21:58.049024: step: 740/530, loss: 0.00313611445017159 2023-01-24 06:21:59.088769: step: 744/530, loss: 0.006634856108576059 2023-01-24 06:22:00.125374: step: 748/530, loss: 0.010065586306154728 2023-01-24 06:22:01.191396: step: 752/530, loss: 0.004102368839085102 2023-01-24 06:22:02.232283: step: 756/530, loss: 0.01233601663261652 2023-01-24 06:22:03.278461: step: 760/530, loss: 0.011272737756371498 2023-01-24 06:22:04.317935: step: 764/530, loss: 0.05126696825027466 2023-01-24 06:22:05.348884: step: 768/530, loss: 0.0011142394505441189 2023-01-24 06:22:06.390090: step: 772/530, loss: 0.010090713389217854 2023-01-24 06:22:07.444935: step: 776/530, loss: 0.0035307412035763264 2023-01-24 06:22:08.495298: step: 780/530, loss: 0.002695351606234908 2023-01-24 06:22:09.534313: step: 784/530, loss: 0.006723582744598389 2023-01-24 06:22:10.581990: step: 788/530, loss: 0.00822901539504528 2023-01-24 06:22:11.637777: step: 792/530, loss: 0.055528152734041214 2023-01-24 06:22:12.689541: step: 796/530, loss: 0.03605087473988533 2023-01-24 06:22:13.743135: step: 800/530, loss: 0.042120590806007385 2023-01-24 06:22:14.792273: step: 804/530, loss: 0.017894096672534943 2023-01-24 06:22:15.826709: step: 808/530, loss: 0.0023750171530991793 2023-01-24 06:22:16.877601: step: 812/530, loss: 0.004050438292324543 2023-01-24 06:22:17.929321: step: 816/530, loss: 0.006625940091907978 2023-01-24 06:22:18.962666: step: 820/530, loss: 0.006925683468580246 2023-01-24 06:22:19.997795: step: 824/530, loss: 0.001783377374522388 2023-01-24 06:22:21.049617: step: 828/530, loss: 0.0013652881607413292 2023-01-24 06:22:22.091828: step: 832/530, loss: 0.02358374185860157 2023-01-24 06:22:23.133070: step: 836/530, loss: 0.00915016420185566 2023-01-24 06:22:24.174176: step: 840/530, loss: 0.021526407450437546 2023-01-24 06:22:25.211548: step: 844/530, loss: 0.0072245243936777115 2023-01-24 06:22:26.245770: step: 848/530, loss: 0.011357876472175121 2023-01-24 06:22:27.300610: step: 852/530, loss: 0.004106700886040926 2023-01-24 06:22:28.341707: step: 856/530, loss: 0.0035375088918954134 2023-01-24 06:22:29.390696: step: 860/530, loss: 0.00566155556589365 2023-01-24 06:22:30.422875: step: 864/530, loss: 0.003982520196586847 2023-01-24 06:22:31.460183: step: 868/530, loss: 0.013738138601183891 2023-01-24 06:22:32.492954: step: 872/530, loss: 0.0007419064058922231 2023-01-24 06:22:33.541329: step: 876/530, loss: 0.0013948254054412246 2023-01-24 06:22:34.602343: step: 880/530, loss: 0.03332987427711487 2023-01-24 06:22:35.640922: step: 884/530, loss: 0.0021401913836598396 2023-01-24 06:22:36.692574: step: 888/530, loss: 0.005231750663369894 2023-01-24 06:22:37.733555: step: 892/530, loss: 0.003046355675905943 2023-01-24 06:22:38.762491: step: 896/530, loss: 0.024647263810038567 2023-01-24 06:22:39.805397: step: 900/530, loss: 0.002115655457600951 2023-01-24 06:22:40.849930: step: 904/530, loss: 0.008259736001491547 2023-01-24 06:22:41.895521: step: 908/530, loss: 0.011261925101280212 2023-01-24 06:22:42.939794: step: 912/530, loss: 0.0063118175603449345 2023-01-24 06:22:43.985875: step: 916/530, loss: 0.002154545858502388 2023-01-24 06:22:45.030729: step: 920/530, loss: 0.013554207980632782 2023-01-24 06:22:46.076866: step: 924/530, loss: 0.007091938052326441 2023-01-24 06:22:47.126149: step: 928/530, loss: 0.0002836388011928648 2023-01-24 06:22:48.179273: step: 932/530, loss: 0.0044651515781879425 2023-01-24 06:22:49.226472: step: 936/530, loss: 0.00012386986054480076 2023-01-24 06:22:50.256361: step: 940/530, loss: 0.0012076901039108634 2023-01-24 06:22:51.297168: step: 944/530, loss: 0.022072333842515945 2023-01-24 06:22:52.348509: step: 948/530, loss: 0.00045723607763648033 2023-01-24 06:22:53.386880: step: 952/530, loss: 0.0022414680570364 2023-01-24 06:22:54.414023: step: 956/530, loss: 0.0011253998382017016 2023-01-24 06:22:55.465060: step: 960/530, loss: 0.0028189762961119413 2023-01-24 06:22:56.522373: step: 964/530, loss: 0.007082141470164061 2023-01-24 06:22:57.570205: step: 968/530, loss: 0.0015966114588081837 2023-01-24 06:22:58.620648: step: 972/530, loss: 0.0062012518756091595 2023-01-24 06:22:59.660094: step: 976/530, loss: 0.003764570225030184 2023-01-24 06:23:00.706515: step: 980/530, loss: 0.005828135646879673 2023-01-24 06:23:01.776575: step: 984/530, loss: 0.0010315744439139962 2023-01-24 06:23:02.809536: step: 988/530, loss: 0.005860264878720045 2023-01-24 06:23:03.876296: step: 992/530, loss: 0.022004127502441406 2023-01-24 06:23:04.913999: step: 996/530, loss: 0.033604830503463745 2023-01-24 06:23:05.955922: step: 1000/530, loss: 0.002532367594540119 2023-01-24 06:23:06.998973: step: 1004/530, loss: 0.017336059361696243 2023-01-24 06:23:08.029367: step: 1008/530, loss: 0.00043345935409888625 2023-01-24 06:23:09.070185: step: 1012/530, loss: 0.009619265794754028 2023-01-24 06:23:10.130402: step: 1016/530, loss: 0.0039932867512106895 2023-01-24 06:23:11.199419: step: 1020/530, loss: 0.0015555518912151456 2023-01-24 06:23:12.238706: step: 1024/530, loss: 0.010970303788781166 2023-01-24 06:23:13.270518: step: 1028/530, loss: 0.014511861838400364 2023-01-24 06:23:14.310245: step: 1032/530, loss: 0.0016790189547464252 2023-01-24 06:23:15.367524: step: 1036/530, loss: 0.0051798587664961815 2023-01-24 06:23:16.400224: step: 1040/530, loss: 0.006959626916795969 2023-01-24 06:23:17.458797: step: 1044/530, loss: 0.007949652150273323 2023-01-24 06:23:18.497503: step: 1048/530, loss: 0.009618671610951424 2023-01-24 06:23:19.539917: step: 1052/530, loss: 0.0061713093891739845 2023-01-24 06:23:20.591400: step: 1056/530, loss: 0.0021594311110675335 2023-01-24 06:23:21.627986: step: 1060/530, loss: 0.006789663806557655 2023-01-24 06:23:22.677604: step: 1064/530, loss: 0.0050207884050905704 2023-01-24 06:23:23.708612: step: 1068/530, loss: 0.009896758943796158 2023-01-24 06:23:24.751665: step: 1072/530, loss: 0.001345921540632844 2023-01-24 06:23:25.771224: step: 1076/530, loss: 0.004463690798729658 2023-01-24 06:23:26.828894: step: 1080/530, loss: 0.008156121708452702 2023-01-24 06:23:27.889640: step: 1084/530, loss: 0.0011514750076457858 2023-01-24 06:23:28.922951: step: 1088/530, loss: 0.012830271385610104 2023-01-24 06:23:29.969657: step: 1092/530, loss: 0.004054079297930002 2023-01-24 06:23:31.005923: step: 1096/530, loss: 0.00606739055365324 2023-01-24 06:23:32.047242: step: 1100/530, loss: 0.0023006938863545656 2023-01-24 06:23:33.086665: step: 1104/530, loss: 0.003015143098309636 2023-01-24 06:23:34.128390: step: 1108/530, loss: 0.0005504557047970593 2023-01-24 06:23:35.186310: step: 1112/530, loss: 0.009094920940697193 2023-01-24 06:23:36.244294: step: 1116/530, loss: 0.00686934357509017 2023-01-24 06:23:37.300321: step: 1120/530, loss: 0.009619171731173992 2023-01-24 06:23:38.345445: step: 1124/530, loss: 0.00299668125808239 2023-01-24 06:23:39.386503: step: 1128/530, loss: 0.0014781909994781017 2023-01-24 06:23:40.441967: step: 1132/530, loss: 0.0006976496079005301 2023-01-24 06:23:41.480856: step: 1136/530, loss: 0.033183954656124115 2023-01-24 06:23:42.518364: step: 1140/530, loss: 0.0017599496059119701 2023-01-24 06:23:43.579206: step: 1144/530, loss: 0.004342691972851753 2023-01-24 06:23:44.612541: step: 1148/530, loss: 0.0027980192098766565 2023-01-24 06:23:45.644714: step: 1152/530, loss: 0.0007540630758740008 2023-01-24 06:23:46.688463: step: 1156/530, loss: 0.005419062450528145 2023-01-24 06:23:47.735356: step: 1160/530, loss: 0.0004526493139564991 2023-01-24 06:23:48.792411: step: 1164/530, loss: 0.007975961081683636 2023-01-24 06:23:49.833545: step: 1168/530, loss: 0.005577439442276955 2023-01-24 06:23:50.895921: step: 1172/530, loss: 0.008031746372580528 2023-01-24 06:23:51.953368: step: 1176/530, loss: 0.006097746547311544 2023-01-24 06:23:52.992293: step: 1180/530, loss: 0.0027745519764721394 2023-01-24 06:23:54.034987: step: 1184/530, loss: 0.0011434364132583141 2023-01-24 06:23:55.071224: step: 1188/530, loss: 0.008492808789014816 2023-01-24 06:23:56.107306: step: 1192/530, loss: 0.020877238363027573 2023-01-24 06:23:57.166032: step: 1196/530, loss: 0.0038514393381774426 2023-01-24 06:23:58.192102: step: 1200/530, loss: 0.0017219502478837967 2023-01-24 06:23:59.250430: step: 1204/530, loss: 0.02591611258685589 2023-01-24 06:24:00.279316: step: 1208/530, loss: 0.0024388241581618786 2023-01-24 06:24:01.331029: step: 1212/530, loss: 0.008103693835437298 2023-01-24 06:24:02.378846: step: 1216/530, loss: 0.0017703513149172068 2023-01-24 06:24:03.429491: step: 1220/530, loss: 0.008272632025182247 2023-01-24 06:24:04.488512: step: 1224/530, loss: 0.0572965033352375 2023-01-24 06:24:05.525349: step: 1228/530, loss: 0.0006666359840892255 2023-01-24 06:24:06.578655: step: 1232/530, loss: 0.004535286221653223 2023-01-24 06:24:07.642096: step: 1236/530, loss: 0.01695200987160206 2023-01-24 06:24:08.675442: step: 1240/530, loss: 0.00516910944133997 2023-01-24 06:24:09.721648: step: 1244/530, loss: 0.011784598231315613 2023-01-24 06:24:10.760814: step: 1248/530, loss: 0.004188059363514185 2023-01-24 06:24:11.810430: step: 1252/530, loss: 0.0030765607953071594 2023-01-24 06:24:12.850056: step: 1256/530, loss: 0.009448111057281494 2023-01-24 06:24:13.902935: step: 1260/530, loss: 0.009654028341174126 2023-01-24 06:24:14.951998: step: 1264/530, loss: 0.0035153296776115894 2023-01-24 06:24:16.009316: step: 1268/530, loss: 0.020746583119034767 2023-01-24 06:24:17.059986: step: 1272/530, loss: 0.01471230573952198 2023-01-24 06:24:18.111514: step: 1276/530, loss: 0.04179929941892624 2023-01-24 06:24:19.151121: step: 1280/530, loss: 0.01124724093824625 2023-01-24 06:24:20.212152: step: 1284/530, loss: 0.012675424106419086 2023-01-24 06:24:21.269910: step: 1288/530, loss: 0.03778376057744026 2023-01-24 06:24:22.342100: step: 1292/530, loss: 0.009309976361691952 2023-01-24 06:24:23.425860: step: 1296/530, loss: 0.0157157015055418 2023-01-24 06:24:24.469778: step: 1300/530, loss: 0.004673982039093971 2023-01-24 06:24:25.513303: step: 1304/530, loss: 0.015413263812661171 2023-01-24 06:24:26.590621: step: 1308/530, loss: 0.03117533028125763 2023-01-24 06:24:27.634682: step: 1312/530, loss: 0.009356277994811535 2023-01-24 06:24:28.670812: step: 1316/530, loss: 0.0004866087401751429 2023-01-24 06:24:29.707220: step: 1320/530, loss: 0.00893944501876831 2023-01-24 06:24:30.751183: step: 1324/530, loss: 0.00032654768438078463 2023-01-24 06:24:31.799891: step: 1328/530, loss: 0.003849738510325551 2023-01-24 06:24:32.840434: step: 1332/530, loss: 0.0030810150783509016 2023-01-24 06:24:33.886271: step: 1336/530, loss: 0.002669693436473608 2023-01-24 06:24:34.928065: step: 1340/530, loss: 0.007426968310028315 2023-01-24 06:24:35.986067: step: 1344/530, loss: 0.00268171401694417 2023-01-24 06:24:37.038887: step: 1348/530, loss: 0.005337265320122242 2023-01-24 06:24:38.087523: step: 1352/530, loss: 0.006659374572336674 2023-01-24 06:24:39.140444: step: 1356/530, loss: 0.008167142979800701 2023-01-24 06:24:40.176222: step: 1360/530, loss: 0.003705062670633197 2023-01-24 06:24:41.217884: step: 1364/530, loss: 1.6634365238132887e-05 2023-01-24 06:24:42.253101: step: 1368/530, loss: 0.00021377854864113033 2023-01-24 06:24:43.280768: step: 1372/530, loss: 0.0007707129116170108 2023-01-24 06:24:44.329868: step: 1376/530, loss: 0.00490058958530426 2023-01-24 06:24:45.385319: step: 1380/530, loss: 0.004877751227468252 2023-01-24 06:24:46.427984: step: 1384/530, loss: 0.005202609114348888 2023-01-24 06:24:47.459435: step: 1388/530, loss: 0.004492300562560558 2023-01-24 06:24:48.498649: step: 1392/530, loss: 0.01172257773578167 2023-01-24 06:24:49.560118: step: 1396/530, loss: 0.0003633679007180035 2023-01-24 06:24:50.602937: step: 1400/530, loss: 0.004841018933802843 2023-01-24 06:24:51.651087: step: 1404/530, loss: 0.0068899798206985 2023-01-24 06:24:52.712939: step: 1408/530, loss: 0.00931174959987402 2023-01-24 06:24:53.770932: step: 1412/530, loss: 0.0010873842984437943 2023-01-24 06:24:54.811980: step: 1416/530, loss: 0.0012167481472715735 2023-01-24 06:24:55.847481: step: 1420/530, loss: 0.002931437687948346 2023-01-24 06:24:56.876127: step: 1424/530, loss: 0.010780932381749153 2023-01-24 06:24:57.928885: step: 1428/530, loss: 0.01095562893897295 2023-01-24 06:24:58.975031: step: 1432/530, loss: 0.005082893185317516 2023-01-24 06:25:00.037135: step: 1436/530, loss: 0.027777351438999176 2023-01-24 06:25:01.062328: step: 1440/530, loss: 0.008518178015947342 2023-01-24 06:25:02.102070: step: 1444/530, loss: 0.008129827678203583 2023-01-24 06:25:03.152150: step: 1448/530, loss: 0.00014765679952688515 2023-01-24 06:25:04.222827: step: 1452/530, loss: 0.003138082567602396 2023-01-24 06:25:05.277138: step: 1456/530, loss: 0.0010229966137558222 2023-01-24 06:25:06.330988: step: 1460/530, loss: 0.0009907567873597145 2023-01-24 06:25:07.394158: step: 1464/530, loss: 0.039192862808704376 2023-01-24 06:25:08.448294: step: 1468/530, loss: 0.003133070422336459 2023-01-24 06:25:09.507233: step: 1472/530, loss: 0.006975098047405481 2023-01-24 06:25:10.531403: step: 1476/530, loss: 0.005560264922678471 2023-01-24 06:25:11.583549: step: 1480/530, loss: 0.002051321789622307 2023-01-24 06:25:12.608337: step: 1484/530, loss: 0.007071810774505138 2023-01-24 06:25:13.655447: step: 1488/530, loss: 0.003039976581931114 2023-01-24 06:25:14.716927: step: 1492/530, loss: 0.0081557035446167 2023-01-24 06:25:15.760428: step: 1496/530, loss: 0.0017127173487097025 2023-01-24 06:25:16.807300: step: 1500/530, loss: 0.004103124141693115 2023-01-24 06:25:17.874017: step: 1504/530, loss: 0.0076441168785095215 2023-01-24 06:25:18.922625: step: 1508/530, loss: 0.003528046887367964 2023-01-24 06:25:19.953141: step: 1512/530, loss: 0.00017241571913473308 2023-01-24 06:25:21.001126: step: 1516/530, loss: 0.03309021145105362 2023-01-24 06:25:22.051353: step: 1520/530, loss: 0.0021175690926611423 2023-01-24 06:25:23.092651: step: 1524/530, loss: 5.452296682051383e-05 2023-01-24 06:25:24.141902: step: 1528/530, loss: 0.005031760782003403 2023-01-24 06:25:25.178776: step: 1532/530, loss: 0.009345093742012978 2023-01-24 06:25:26.203426: step: 1536/530, loss: 0.00022777014237362891 2023-01-24 06:25:27.242179: step: 1540/530, loss: 0.00560781778767705 2023-01-24 06:25:28.284006: step: 1544/530, loss: 0.003189577255398035 2023-01-24 06:25:29.328120: step: 1548/530, loss: 0.034571677446365356 2023-01-24 06:25:30.388369: step: 1552/530, loss: 0.010642732493579388 2023-01-24 06:25:31.416828: step: 1556/530, loss: 0.010461527854204178 2023-01-24 06:25:32.450965: step: 1560/530, loss: 0.006962204352021217 2023-01-24 06:25:33.483861: step: 1564/530, loss: 0.00022156462364364415 2023-01-24 06:25:34.553945: step: 1568/530, loss: 0.01962459459900856 2023-01-24 06:25:35.603123: step: 1572/530, loss: 0.024988656863570213 2023-01-24 06:25:36.671027: step: 1576/530, loss: 0.0006200416246429086 2023-01-24 06:25:37.712973: step: 1580/530, loss: 0.001931198756210506 2023-01-24 06:25:38.785837: step: 1584/530, loss: 0.0051574138924479485 2023-01-24 06:25:39.851662: step: 1588/530, loss: 0.002465372672304511 2023-01-24 06:25:40.915311: step: 1592/530, loss: 0.005042010452598333 2023-01-24 06:25:41.963490: step: 1596/530, loss: 0.001665488351136446 2023-01-24 06:25:43.007392: step: 1600/530, loss: 0.0028303733561187983 2023-01-24 06:25:44.037580: step: 1604/530, loss: 0.0056994580663740635 2023-01-24 06:25:45.066819: step: 1608/530, loss: 0.022639593109488487 2023-01-24 06:25:46.112751: step: 1612/530, loss: 0.011843492276966572 2023-01-24 06:25:47.157539: step: 1616/530, loss: 0.005340182688087225 2023-01-24 06:25:48.203022: step: 1620/530, loss: 0.013917685486376286 2023-01-24 06:25:49.246426: step: 1624/530, loss: 0.0009470715885981917 2023-01-24 06:25:50.327258: step: 1628/530, loss: 0.004929047543555498 2023-01-24 06:25:51.354883: step: 1632/530, loss: 0.003021953394636512 2023-01-24 06:25:52.410202: step: 1636/530, loss: 0.007950888946652412 2023-01-24 06:25:53.461000: step: 1640/530, loss: 0.012573221698403358 2023-01-24 06:25:54.498929: step: 1644/530, loss: 0.002465897938236594 2023-01-24 06:25:55.539864: step: 1648/530, loss: 0.004494422115385532 2023-01-24 06:25:56.576364: step: 1652/530, loss: 0.009269678965210915 2023-01-24 06:25:57.634669: step: 1656/530, loss: 0.007741387467831373 2023-01-24 06:25:58.691285: step: 1660/530, loss: 0.0027917560655623674 2023-01-24 06:25:59.731427: step: 1664/530, loss: 0.010698728263378143 2023-01-24 06:26:00.776181: step: 1668/530, loss: 0.033907629549503326 2023-01-24 06:26:01.813481: step: 1672/530, loss: 0.00538603775203228 2023-01-24 06:26:02.849448: step: 1676/530, loss: 0.013717618770897388 2023-01-24 06:26:03.899849: step: 1680/530, loss: 0.04286370426416397 2023-01-24 06:26:04.939695: step: 1684/530, loss: 0.001058622496202588 2023-01-24 06:26:05.992373: step: 1688/530, loss: 0.007325112819671631 2023-01-24 06:26:07.029979: step: 1692/530, loss: 0.001125282607972622 2023-01-24 06:26:08.090456: step: 1696/530, loss: 0.02404114417731762 2023-01-24 06:26:09.125171: step: 1700/530, loss: 0.009457694366574287 2023-01-24 06:26:10.170677: step: 1704/530, loss: 0.0050507597625255585 2023-01-24 06:26:11.209246: step: 1708/530, loss: 0.011520587839186192 2023-01-24 06:26:12.242564: step: 1712/530, loss: 0.005167321301996708 2023-01-24 06:26:13.278592: step: 1716/530, loss: 0.000495509710162878 2023-01-24 06:26:14.324211: step: 1720/530, loss: 0.04686035215854645 2023-01-24 06:26:15.349032: step: 1724/530, loss: 0.004802131559699774 2023-01-24 06:26:16.393244: step: 1728/530, loss: 0.027188561856746674 2023-01-24 06:26:17.435576: step: 1732/530, loss: 0.0045398324728012085 2023-01-24 06:26:18.491531: step: 1736/530, loss: 0.00954074040055275 2023-01-24 06:26:19.560121: step: 1740/530, loss: 0.02895531803369522 2023-01-24 06:26:20.595140: step: 1744/530, loss: 0.007887580431997776 2023-01-24 06:26:21.634160: step: 1748/530, loss: 0.006940619088709354 2023-01-24 06:26:22.683136: step: 1752/530, loss: 0.014873044565320015 2023-01-24 06:26:23.734519: step: 1756/530, loss: 0.013985712081193924 2023-01-24 06:26:24.783089: step: 1760/530, loss: 0.0066060591489076614 2023-01-24 06:26:25.832389: step: 1764/530, loss: 0.0035264333710074425 2023-01-24 06:26:26.871192: step: 1768/530, loss: 0.007560395170003176 2023-01-24 06:26:27.906070: step: 1772/530, loss: 0.003613527398556471 2023-01-24 06:26:28.944406: step: 1776/530, loss: 0.008606057614088058 2023-01-24 06:26:29.979217: step: 1780/530, loss: 0.005605859681963921 2023-01-24 06:26:31.022510: step: 1784/530, loss: 0.009676764719188213 2023-01-24 06:26:32.059852: step: 1788/530, loss: 0.0035846084356307983 2023-01-24 06:26:33.104945: step: 1792/530, loss: 0.02194957062602043 2023-01-24 06:26:34.129734: step: 1796/530, loss: 0.0011832561576738954 2023-01-24 06:26:35.174224: step: 1800/530, loss: 0.005594130605459213 2023-01-24 06:26:36.211026: step: 1804/530, loss: 0.0002772388979792595 2023-01-24 06:26:37.255670: step: 1808/530, loss: 0.012176196090877056 2023-01-24 06:26:38.291371: step: 1812/530, loss: 0.012571971863508224 2023-01-24 06:26:39.329953: step: 1816/530, loss: 0.0014177965931594372 2023-01-24 06:26:40.373642: step: 1820/530, loss: 0.009228182956576347 2023-01-24 06:26:41.412906: step: 1824/530, loss: 0.0022225137799978256 2023-01-24 06:26:42.455320: step: 1828/530, loss: 0.004359425976872444 2023-01-24 06:26:43.479401: step: 1832/530, loss: 0.0091276029124856 2023-01-24 06:26:44.527777: step: 1836/530, loss: 0.0047169518657028675 2023-01-24 06:26:45.577394: step: 1840/530, loss: 0.006618256215006113 2023-01-24 06:26:46.634256: step: 1844/530, loss: 0.010478464886546135 2023-01-24 06:26:47.681618: step: 1848/530, loss: 0.011988803744316101 2023-01-24 06:26:48.716321: step: 1852/530, loss: 0.0010404754430055618 2023-01-24 06:26:49.746350: step: 1856/530, loss: 0.00516689196228981 2023-01-24 06:26:50.783900: step: 1860/530, loss: 0.008548935875296593 2023-01-24 06:26:51.823101: step: 1864/530, loss: 0.0006177427130751312 2023-01-24 06:26:52.884433: step: 1868/530, loss: 0.009331200271844864 2023-01-24 06:26:53.909630: step: 1872/530, loss: 0.013278198428452015 2023-01-24 06:26:54.976257: step: 1876/530, loss: 0.0013035439187660813 2023-01-24 06:26:56.021159: step: 1880/530, loss: 0.004163411911576986 2023-01-24 06:26:57.080758: step: 1884/530, loss: 0.0009789917385205626 2023-01-24 06:26:58.137301: step: 1888/530, loss: 0.005735444836318493 2023-01-24 06:26:59.178193: step: 1892/530, loss: 0.016716675832867622 2023-01-24 06:27:00.210050: step: 1896/530, loss: 0.010332795791327953 2023-01-24 06:27:01.247923: step: 1900/530, loss: 0.0139173474162817 2023-01-24 06:27:02.289518: step: 1904/530, loss: 0.0194231066852808 2023-01-24 06:27:03.316901: step: 1908/530, loss: 0.009279022924602032 2023-01-24 06:27:04.369394: step: 1912/530, loss: 0.0007891654968261719 2023-01-24 06:27:05.414604: step: 1916/530, loss: 0.012249928899109364 2023-01-24 06:27:06.440905: step: 1920/530, loss: 0.002090978669002652 2023-01-24 06:27:07.475340: step: 1924/530, loss: 0.014435498043894768 2023-01-24 06:27:08.526157: step: 1928/530, loss: 0.03690756484866142 2023-01-24 06:27:09.572382: step: 1932/530, loss: 0.012080319225788116 2023-01-24 06:27:10.609031: step: 1936/530, loss: 0.001113247824832797 2023-01-24 06:27:11.663674: step: 1940/530, loss: 0.017281649634242058 2023-01-24 06:27:12.712200: step: 1944/530, loss: 0.0026332216802984476 2023-01-24 06:27:13.758175: step: 1948/530, loss: 0.00022906468075234443 2023-01-24 06:27:14.801266: step: 1952/530, loss: 0.02236367017030716 2023-01-24 06:27:15.831270: step: 1956/530, loss: 0.009231156669557095 2023-01-24 06:27:16.891514: step: 1960/530, loss: 0.0034171987790614367 2023-01-24 06:27:17.953685: step: 1964/530, loss: 0.003969093319028616 2023-01-24 06:27:18.994989: step: 1968/530, loss: 0.012047340162098408 2023-01-24 06:27:20.033617: step: 1972/530, loss: 0.0021097136195749044 2023-01-24 06:27:21.075241: step: 1976/530, loss: 0.009480580687522888 2023-01-24 06:27:22.115783: step: 1980/530, loss: 0.0002342582738492638 2023-01-24 06:27:23.145649: step: 1984/530, loss: 0.0166630819439888 2023-01-24 06:27:24.199117: step: 1988/530, loss: 0.002624457934871316 2023-01-24 06:27:25.234592: step: 1992/530, loss: 0.004591317847371101 2023-01-24 06:27:26.260962: step: 1996/530, loss: 0.011766986921429634 2023-01-24 06:27:27.304274: step: 2000/530, loss: 0.009464697912335396 2023-01-24 06:27:28.347782: step: 2004/530, loss: 0.013496533036231995 2023-01-24 06:27:29.386229: step: 2008/530, loss: 0.0018837039824575186 2023-01-24 06:27:30.428880: step: 2012/530, loss: 0.0042829993180930614 2023-01-24 06:27:31.465771: step: 2016/530, loss: 0.009306607767939568 2023-01-24 06:27:32.500490: step: 2020/530, loss: 0.012653127312660217 2023-01-24 06:27:33.530034: step: 2024/530, loss: 0.007929597981274128 2023-01-24 06:27:34.579195: step: 2028/530, loss: 0.00470797810703516 2023-01-24 06:27:35.620540: step: 2032/530, loss: 0.0014896313659846783 2023-01-24 06:27:36.664984: step: 2036/530, loss: 0.007710399106144905 2023-01-24 06:27:37.717166: step: 2040/530, loss: 0.0028835029806941748 2023-01-24 06:27:38.757718: step: 2044/530, loss: 0.0026091367471963167 2023-01-24 06:27:39.816772: step: 2048/530, loss: 0.005126492120325565 2023-01-24 06:27:40.847498: step: 2052/530, loss: 0.055129051208496094 2023-01-24 06:27:41.887538: step: 2056/530, loss: 0.01895103231072426 2023-01-24 06:27:42.921971: step: 2060/530, loss: 0.0013110397849231958 2023-01-24 06:27:43.962664: step: 2064/530, loss: 0.003503028303384781 2023-01-24 06:27:45.002521: step: 2068/530, loss: 0.00581095227971673 2023-01-24 06:27:46.040070: step: 2072/530, loss: 0.00411786325275898 2023-01-24 06:27:47.078992: step: 2076/530, loss: 0.005775300785899162 2023-01-24 06:27:48.109746: step: 2080/530, loss: 0.017651807516813278 2023-01-24 06:27:49.145658: step: 2084/530, loss: 0.005945092067122459 2023-01-24 06:27:50.195712: step: 2088/530, loss: 0.017199594527482986 2023-01-24 06:27:51.239086: step: 2092/530, loss: 0.001704596565105021 2023-01-24 06:27:52.291372: step: 2096/530, loss: 0.010168765671551228 2023-01-24 06:27:53.336590: step: 2100/530, loss: 0.0018051320221275091 2023-01-24 06:27:54.369676: step: 2104/530, loss: 0.014632332138717175 2023-01-24 06:27:55.410971: step: 2108/530, loss: 0.011417794041335583 2023-01-24 06:27:56.441204: step: 2112/530, loss: 0.0013669944601133466 2023-01-24 06:27:57.467982: step: 2116/530, loss: 0.0018338194349780679 2023-01-24 06:27:58.497487: step: 2120/530, loss: 0.002114777220413089 ================================================== Loss: 0.009 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.371044481981982, 'r': 0.31260673624288426, 'f1': 0.33932801235839344}, 'combined': 0.2500311670009215, 'stategy': 1, 'epoch': 7} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3773299117490305, 'r': 0.3898150926524911, 'f1': 0.38347090488780317}, 'combined': 0.29723582101351254, 'stategy': 1, 'epoch': 7} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3910125811688312, 'r': 0.3264621171049065, 'f1': 0.3558335795538485}, 'combined': 0.2621931638817831, 'stategy': 1, 'epoch': 7} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37070452515606517, 'r': 0.3659344301632481, 'f1': 0.3683040333187918}, 'combined': 0.28547968132844154, 'stategy': 1, 'epoch': 7} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38898325469855033, 'r': 0.33141078056859413, 'f1': 0.3578964781960023}, 'combined': 0.2637131944602122, 'stategy': 1, 'epoch': 7} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36526204478413765, 'r': 0.36391916961949006, 'f1': 0.3645893706685131}, 'combined': 0.2826003734368379, 'stategy': 1, 'epoch': 7} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4, 'r': 0.2857142857142857, 'f1': 0.3333333333333333}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 7} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5, 'r': 0.41304347826086957, 'f1': 0.45238095238095233}, 'combined': 0.22619047619047616, 'stategy': 1, 'epoch': 7} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 7} New best russian model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37704166666666666, 'r': 0.32195208728652747, 'f1': 0.3473259979529171}, 'combined': 0.25592441954425466, 'stategy': 1, 'epoch': 6} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37621134584593835, 'r': 0.3907342102995499, 'f1': 0.3833352757492428}, 'combined': 0.29713069220754706, 'stategy': 1, 'epoch': 6} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 6} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38898325469855033, 'r': 0.33141078056859413, 'f1': 0.3578964781960023}, 'combined': 0.2637131944602122, 'stategy': 1, 'epoch': 7} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36526204478413765, 'r': 0.36391916961949006, 'f1': 0.3645893706685131}, 'combined': 0.2826003734368379, 'stategy': 1, 'epoch': 7} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 7} ****************************** Epoch: 8 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 06:30:25.535909: step: 4/530, loss: 0.006443020887672901 2023-01-24 06:30:26.573609: step: 8/530, loss: 0.00317304371856153 2023-01-24 06:30:27.619588: step: 12/530, loss: 0.008027322590351105 2023-01-24 06:30:28.669429: step: 16/530, loss: 0.01722724735736847 2023-01-24 06:30:29.707467: step: 20/530, loss: 0.01067101676017046 2023-01-24 06:30:30.744898: step: 24/530, loss: 0.018055465072393417 2023-01-24 06:30:31.782418: step: 28/530, loss: 0.010839723981916904 2023-01-24 06:30:32.829021: step: 32/530, loss: 0.04166977480053902 2023-01-24 06:30:33.893895: step: 36/530, loss: 0.004870374221354723 2023-01-24 06:30:34.951548: step: 40/530, loss: 0.004758880473673344 2023-01-24 06:30:36.013879: step: 44/530, loss: 0.0035378627944737673 2023-01-24 06:30:37.066540: step: 48/530, loss: 0.023192228749394417 2023-01-24 06:30:38.135398: step: 52/530, loss: 0.0012242362136021256 2023-01-24 06:30:39.185937: step: 56/530, loss: 0.011190163902938366 2023-01-24 06:30:40.230111: step: 60/530, loss: 0.011091810651123524 2023-01-24 06:30:41.271353: step: 64/530, loss: 0.006872337311506271 2023-01-24 06:30:42.304318: step: 68/530, loss: 0.0040228236466646194 2023-01-24 06:30:43.365558: step: 72/530, loss: 0.014228034764528275 2023-01-24 06:30:44.396424: step: 76/530, loss: 0.0019172192551195621 2023-01-24 06:30:45.432317: step: 80/530, loss: 0.005322155077010393 2023-01-24 06:30:46.483812: step: 84/530, loss: 0.0030950221698731184 2023-01-24 06:30:47.521623: step: 88/530, loss: 0.010197141207754612 2023-01-24 06:30:48.553437: step: 92/530, loss: 0.0058609540574252605 2023-01-24 06:30:49.585192: step: 96/530, loss: 0.0037929746322333813 2023-01-24 06:30:50.627077: step: 100/530, loss: 0.005724242422729731 2023-01-24 06:30:51.661519: step: 104/530, loss: 0.0029091271571815014 2023-01-24 06:30:52.709566: step: 108/530, loss: 0.005397266708314419 2023-01-24 06:30:53.742747: step: 112/530, loss: 0.012336493469774723 2023-01-24 06:30:54.772737: step: 116/530, loss: 0.0025623124092817307 2023-01-24 06:30:55.815473: step: 120/530, loss: 0.0015331917675212026 2023-01-24 06:30:56.864474: step: 124/530, loss: 0.007481038570404053 2023-01-24 06:30:57.918295: step: 128/530, loss: 0.005113583989441395 2023-01-24 06:30:58.954215: step: 132/530, loss: 0.00024479778949171305 2023-01-24 06:30:59.992367: step: 136/530, loss: 0.0010996824130415916 2023-01-24 06:31:01.035320: step: 140/530, loss: 0.0004907758557237685 2023-01-24 06:31:02.082648: step: 144/530, loss: 0.023959992453455925 2023-01-24 06:31:03.154511: step: 148/530, loss: 0.004271361045539379 2023-01-24 06:31:04.197621: step: 152/530, loss: 0.0033653138671070337 2023-01-24 06:31:05.236728: step: 156/530, loss: 0.009489140473306179 2023-01-24 06:31:06.294582: step: 160/530, loss: 0.0012906421907246113 2023-01-24 06:31:07.338886: step: 164/530, loss: 0.007899273186922073 2023-01-24 06:31:08.372728: step: 168/530, loss: 0.007317421957850456 2023-01-24 06:31:09.430121: step: 172/530, loss: 0.003954316955059767 2023-01-24 06:31:10.479788: step: 176/530, loss: 0.0013688422041013837 2023-01-24 06:31:11.519219: step: 180/530, loss: 0.017612328752875328 2023-01-24 06:31:12.585320: step: 184/530, loss: 0.0013631233014166355 2023-01-24 06:31:13.627640: step: 188/530, loss: 0.015199512243270874 2023-01-24 06:31:14.701014: step: 192/530, loss: 0.0046225921250879765 2023-01-24 06:31:15.759454: step: 196/530, loss: 0.0032397285103797913 2023-01-24 06:31:16.822170: step: 200/530, loss: 0.009918945841491222 2023-01-24 06:31:17.869264: step: 204/530, loss: 0.0008518360555171967 2023-01-24 06:31:18.918547: step: 208/530, loss: 0.0040648216381669044 2023-01-24 06:31:19.962491: step: 212/530, loss: 0.003091565566137433 2023-01-24 06:31:21.004286: step: 216/530, loss: 0.000684376631397754 2023-01-24 06:31:22.045751: step: 220/530, loss: 0.0028783048037439585 2023-01-24 06:31:23.089860: step: 224/530, loss: 3.2991629268508404e-05 2023-01-24 06:31:24.150806: step: 228/530, loss: 0.0013385203201323748 2023-01-24 06:31:25.211195: step: 232/530, loss: 0.014296078123152256 2023-01-24 06:31:26.256814: step: 236/530, loss: 0.01647352986037731 2023-01-24 06:31:27.305089: step: 240/530, loss: 0.005481907166540623 2023-01-24 06:31:28.349391: step: 244/530, loss: 0.015058851800858974 2023-01-24 06:31:29.399614: step: 248/530, loss: 0.0016618070658296347 2023-01-24 06:31:30.459161: step: 252/530, loss: 0.002154336078092456 2023-01-24 06:31:31.494879: step: 256/530, loss: 0.010336115956306458 2023-01-24 06:31:32.543828: step: 260/530, loss: 0.003075753804296255 2023-01-24 06:31:33.585341: step: 264/530, loss: 0.003258376382291317 2023-01-24 06:31:34.626605: step: 268/530, loss: 0.0054964106529951096 2023-01-24 06:31:35.670601: step: 272/530, loss: 0.012814630754292011 2023-01-24 06:31:36.717733: step: 276/530, loss: 0.007176750805228949 2023-01-24 06:31:37.764138: step: 280/530, loss: 0.0068128290586173534 2023-01-24 06:31:38.814316: step: 284/530, loss: 0.005921709351241589 2023-01-24 06:31:39.857668: step: 288/530, loss: 0.0019552442245185375 2023-01-24 06:31:40.915773: step: 292/530, loss: 0.013440625742077827 2023-01-24 06:31:41.956111: step: 296/530, loss: 0.004721327684819698 2023-01-24 06:31:43.015703: step: 300/530, loss: 0.014077827334403992 2023-01-24 06:31:44.081506: step: 304/530, loss: 0.01970062404870987 2023-01-24 06:31:45.131866: step: 308/530, loss: 0.008239652030169964 2023-01-24 06:31:46.171718: step: 312/530, loss: 0.008537107147276402 2023-01-24 06:31:47.220408: step: 316/530, loss: 0.024481305852532387 2023-01-24 06:31:48.259827: step: 320/530, loss: 0.0008368688868358731 2023-01-24 06:31:49.308104: step: 324/530, loss: 0.010338678024709225 2023-01-24 06:31:50.350970: step: 328/530, loss: 0.016843730583786964 2023-01-24 06:31:51.395966: step: 332/530, loss: 0.007332807872444391 2023-01-24 06:31:52.466884: step: 336/530, loss: 0.015916921198368073 2023-01-24 06:31:53.520651: step: 340/530, loss: 0.027416598051786423 2023-01-24 06:31:54.567962: step: 344/530, loss: 0.015442077070474625 2023-01-24 06:31:55.607616: step: 348/530, loss: 0.003721862332895398 2023-01-24 06:31:56.639923: step: 352/530, loss: 0.017598453909158707 2023-01-24 06:31:57.692432: step: 356/530, loss: 0.0043983543291687965 2023-01-24 06:31:58.743181: step: 360/530, loss: 0.004982681013643742 2023-01-24 06:31:59.775200: step: 364/530, loss: 0.007238171994686127 2023-01-24 06:32:00.829774: step: 368/530, loss: 0.004519812762737274 2023-01-24 06:32:01.891387: step: 372/530, loss: 0.00703876418992877 2023-01-24 06:32:02.945140: step: 376/530, loss: 0.001871192711405456 2023-01-24 06:32:03.976979: step: 380/530, loss: 0.000646625820081681 2023-01-24 06:32:05.012670: step: 384/530, loss: 0.006171062588691711 2023-01-24 06:32:06.075149: step: 388/530, loss: 0.01040917169302702 2023-01-24 06:32:07.123191: step: 392/530, loss: 0.008386931382119656 2023-01-24 06:32:08.183655: step: 396/530, loss: 0.004858999978750944 2023-01-24 06:32:09.248386: step: 400/530, loss: 0.0013101871591061354 2023-01-24 06:32:10.303041: step: 404/530, loss: 0.0023410820867866278 2023-01-24 06:32:11.351420: step: 408/530, loss: 0.008878541179001331 2023-01-24 06:32:12.392186: step: 412/530, loss: 0.006445564795285463 2023-01-24 06:32:13.436574: step: 416/530, loss: 0.003902277210727334 2023-01-24 06:32:14.498515: step: 420/530, loss: 0.002342721913009882 2023-01-24 06:32:15.547430: step: 424/530, loss: 0.005214674398303032 2023-01-24 06:32:16.605442: step: 428/530, loss: 0.007068710867315531 2023-01-24 06:32:17.651367: step: 432/530, loss: 0.006550357211381197 2023-01-24 06:32:18.714422: step: 436/530, loss: 0.005082268733531237 2023-01-24 06:32:19.756246: step: 440/530, loss: 0.008528613485395908 2023-01-24 06:32:20.797021: step: 444/530, loss: 0.009027947671711445 2023-01-24 06:32:21.839462: step: 448/530, loss: 0.00039609186933375895 2023-01-24 06:32:22.884492: step: 452/530, loss: 0.018422113731503487 2023-01-24 06:32:23.924003: step: 456/530, loss: 0.0049692667089402676 2023-01-24 06:32:24.976203: step: 460/530, loss: 0.012376712635159492 2023-01-24 06:32:26.025667: step: 464/530, loss: 0.002245863899588585 2023-01-24 06:32:27.064620: step: 468/530, loss: 0.008253208361566067 2023-01-24 06:32:28.111751: step: 472/530, loss: 0.01068258285522461 2023-01-24 06:32:29.153442: step: 476/530, loss: 0.015965888276696205 2023-01-24 06:32:30.180070: step: 480/530, loss: 0.0020470772869884968 2023-01-24 06:32:31.210420: step: 484/530, loss: 0.006847771350294352 2023-01-24 06:32:32.253359: step: 488/530, loss: 0.0016153039177879691 2023-01-24 06:32:33.325348: step: 492/530, loss: 0.021052658557891846 2023-01-24 06:32:34.374923: step: 496/530, loss: 0.0015370118198916316 2023-01-24 06:32:35.419976: step: 500/530, loss: 0.003250798210501671 2023-01-24 06:32:36.457708: step: 504/530, loss: 1.4903104101904319e-06 2023-01-24 06:32:37.505539: step: 508/530, loss: 0.003133803838863969 2023-01-24 06:32:38.542347: step: 512/530, loss: 0.015905944630503654 2023-01-24 06:32:39.593688: step: 516/530, loss: 0.00484615471214056 2023-01-24 06:32:40.640799: step: 520/530, loss: 0.004640527069568634 2023-01-24 06:32:41.672030: step: 524/530, loss: 0.004660589620471001 2023-01-24 06:32:42.738695: step: 528/530, loss: 0.007647755090147257 2023-01-24 06:32:43.777980: step: 532/530, loss: 0.0005355802131816745 2023-01-24 06:32:44.811751: step: 536/530, loss: 0.0021537370048463345 2023-01-24 06:32:45.857317: step: 540/530, loss: 0.00440042233094573 2023-01-24 06:32:46.893694: step: 544/530, loss: 0.0011832388117909431 2023-01-24 06:32:47.966770: step: 548/530, loss: 0.008624980226159096 2023-01-24 06:32:49.021697: step: 552/530, loss: 0.003169151721522212 2023-01-24 06:32:50.078541: step: 556/530, loss: 0.00429248483851552 2023-01-24 06:32:51.143602: step: 560/530, loss: 0.0509367473423481 2023-01-24 06:32:52.216247: step: 564/530, loss: 0.01222795620560646 2023-01-24 06:32:53.265813: step: 568/530, loss: 0.01895686239004135 2023-01-24 06:32:54.321893: step: 572/530, loss: 0.004771255422383547 2023-01-24 06:32:55.359406: step: 576/530, loss: 0.0001255811075679958 2023-01-24 06:32:56.416297: step: 580/530, loss: 0.0038223492447286844 2023-01-24 06:32:57.468627: step: 584/530, loss: 0.002349498216062784 2023-01-24 06:32:58.501185: step: 588/530, loss: 0.0036266311071813107 2023-01-24 06:32:59.532646: step: 592/530, loss: 0.00019072755821980536 2023-01-24 06:33:00.578414: step: 596/530, loss: 0.005181869957596064 2023-01-24 06:33:01.637037: step: 600/530, loss: 0.007897347211837769 2023-01-24 06:33:02.688012: step: 604/530, loss: 0.006267680786550045 2023-01-24 06:33:03.736484: step: 608/530, loss: 0.006488562095910311 2023-01-24 06:33:04.783295: step: 612/530, loss: 0.034043002873659134 2023-01-24 06:33:05.819426: step: 616/530, loss: 0.009407413192093372 2023-01-24 06:33:06.868000: step: 620/530, loss: 0.0329255610704422 2023-01-24 06:33:07.915626: step: 624/530, loss: 0.016118628904223442 2023-01-24 06:33:08.969093: step: 628/530, loss: 0.009390652179718018 2023-01-24 06:33:09.998714: step: 632/530, loss: 0.006520468275994062 2023-01-24 06:33:11.030134: step: 636/530, loss: 0.0053998189978301525 2023-01-24 06:33:12.082467: step: 640/530, loss: 0.0018274616450071335 2023-01-24 06:33:13.121145: step: 644/530, loss: 0.010771005414426327 2023-01-24 06:33:14.168075: step: 648/530, loss: 0.007071325089782476 2023-01-24 06:33:15.220121: step: 652/530, loss: 0.007078418042510748 2023-01-24 06:33:16.260928: step: 656/530, loss: 0.005073783919215202 2023-01-24 06:33:17.308687: step: 660/530, loss: 0.006542540155351162 2023-01-24 06:33:18.354939: step: 664/530, loss: 0.007633148226886988 2023-01-24 06:33:19.406905: step: 668/530, loss: 0.019827213138341904 2023-01-24 06:33:20.442944: step: 672/530, loss: 0.002795290434733033 2023-01-24 06:33:21.480625: step: 676/530, loss: 0.0062452093698084354 2023-01-24 06:33:22.524740: step: 680/530, loss: 0.006274326704442501 2023-01-24 06:33:23.566816: step: 684/530, loss: 0.0023696166463196278 2023-01-24 06:33:24.610728: step: 688/530, loss: 0.009987825527787209 2023-01-24 06:33:25.656564: step: 692/530, loss: 0.0011304875370115042 2023-01-24 06:33:26.709776: step: 696/530, loss: 0.0034530742559581995 2023-01-24 06:33:27.747121: step: 700/530, loss: 0.004940489307045937 2023-01-24 06:33:28.798952: step: 704/530, loss: 0.003079000161960721 2023-01-24 06:33:29.825085: step: 708/530, loss: 0.0002853375917766243 2023-01-24 06:33:30.897772: step: 712/530, loss: 0.008336411789059639 2023-01-24 06:33:31.953292: step: 716/530, loss: 0.00026188010815531015 2023-01-24 06:33:32.989073: step: 720/530, loss: 0.00022757177066523582 2023-01-24 06:33:34.033854: step: 724/530, loss: 0.0132845314219594 2023-01-24 06:33:35.069875: step: 728/530, loss: 0.006128624081611633 2023-01-24 06:33:36.112472: step: 732/530, loss: 0.006772862281650305 2023-01-24 06:33:37.155024: step: 736/530, loss: 0.01080066803842783 2023-01-24 06:33:38.203697: step: 740/530, loss: 0.0018177388701587915 2023-01-24 06:33:39.227122: step: 744/530, loss: 0.004945053718984127 2023-01-24 06:33:40.278636: step: 748/530, loss: 0.006223143078386784 2023-01-24 06:33:41.327815: step: 752/530, loss: 0.001619755057618022 2023-01-24 06:33:42.370929: step: 756/530, loss: 0.0038573327474296093 2023-01-24 06:33:43.427092: step: 760/530, loss: 0.0326252356171608 2023-01-24 06:33:44.467132: step: 764/530, loss: 0.02476155012845993 2023-01-24 06:33:45.509121: step: 768/530, loss: 0.0029471255838871002 2023-01-24 06:33:46.555563: step: 772/530, loss: 0.0028389617800712585 2023-01-24 06:33:47.605395: step: 776/530, loss: 0.004500068258494139 2023-01-24 06:33:48.659975: step: 780/530, loss: 0.03257456421852112 2023-01-24 06:33:49.726781: step: 784/530, loss: 0.004930510651320219 2023-01-24 06:33:50.785669: step: 788/530, loss: 0.004476903006434441 2023-01-24 06:33:51.831113: step: 792/530, loss: 0.0011893552727997303 2023-01-24 06:33:52.877086: step: 796/530, loss: 0.012703250162303448 2023-01-24 06:33:53.958575: step: 800/530, loss: 0.004259241744875908 2023-01-24 06:33:55.000670: step: 804/530, loss: 0.009800449945032597 2023-01-24 06:33:56.041577: step: 808/530, loss: 0.005722482688724995 2023-01-24 06:33:57.075670: step: 812/530, loss: 0.006868877448141575 2023-01-24 06:33:58.130126: step: 816/530, loss: 8.425168925896287e-05 2023-01-24 06:33:59.185509: step: 820/530, loss: 0.00022072407591622323 2023-01-24 06:34:00.251849: step: 824/530, loss: 0.007139390800148249 2023-01-24 06:34:01.298064: step: 828/530, loss: 0.0016285597812384367 2023-01-24 06:34:02.343172: step: 832/530, loss: 0.0010771198431029916 2023-01-24 06:34:03.398564: step: 836/530, loss: 0.01445038802921772 2023-01-24 06:34:04.460896: step: 840/530, loss: 0.004866424482315779 2023-01-24 06:34:05.520367: step: 844/530, loss: 0.0052887857891619205 2023-01-24 06:34:06.563164: step: 848/530, loss: 0.0034097700845450163 2023-01-24 06:34:07.610565: step: 852/530, loss: 0.005129923112690449 2023-01-24 06:34:08.652563: step: 856/530, loss: 0.02154039591550827 2023-01-24 06:34:09.711945: step: 860/530, loss: 0.005358666181564331 2023-01-24 06:34:10.768886: step: 864/530, loss: 0.0014924720162525773 2023-01-24 06:34:11.805049: step: 868/530, loss: 0.005080854054540396 2023-01-24 06:34:12.858309: step: 872/530, loss: 0.019516028463840485 2023-01-24 06:34:13.886544: step: 876/530, loss: 0.0014875243650749326 2023-01-24 06:34:14.918981: step: 880/530, loss: 0.013087298721075058 2023-01-24 06:34:15.975095: step: 884/530, loss: 0.010942541062831879 2023-01-24 06:34:17.005753: step: 888/530, loss: 0.007191112730652094 2023-01-24 06:34:18.050536: step: 892/530, loss: 0.003926681354641914 2023-01-24 06:34:19.088006: step: 896/530, loss: 0.0004315909754950553 2023-01-24 06:34:20.123989: step: 900/530, loss: 0.004317270591855049 2023-01-24 06:34:21.157983: step: 904/530, loss: 0.0015492003876715899 2023-01-24 06:34:22.202874: step: 908/530, loss: 0.0026503349654376507 2023-01-24 06:34:23.260107: step: 912/530, loss: 0.004143655765801668 2023-01-24 06:34:24.300055: step: 916/530, loss: 0.006869420874863863 2023-01-24 06:34:25.331338: step: 920/530, loss: 0.0018275945913046598 2023-01-24 06:34:26.372434: step: 924/530, loss: 0.011466322466731071 2023-01-24 06:34:27.441347: step: 928/530, loss: 0.02957484871149063 2023-01-24 06:34:28.475299: step: 932/530, loss: 0.0016847008373588324 2023-01-24 06:34:29.506026: step: 936/530, loss: 0.002385699423030019 2023-01-24 06:34:30.549539: step: 940/530, loss: 0.007095735985785723 2023-01-24 06:34:31.593255: step: 944/530, loss: 0.0009214837336912751 2023-01-24 06:34:32.641979: step: 948/530, loss: 0.007418160326778889 2023-01-24 06:34:33.678114: step: 952/530, loss: 0.006413837429136038 2023-01-24 06:34:34.737742: step: 956/530, loss: 0.0035916813649237156 2023-01-24 06:34:35.770209: step: 960/530, loss: 0.005150137469172478 2023-01-24 06:34:36.822223: step: 964/530, loss: 0.02176482044160366 2023-01-24 06:34:37.869697: step: 968/530, loss: 0.02143683284521103 2023-01-24 06:34:38.910185: step: 972/530, loss: 0.0117194764316082 2023-01-24 06:34:39.960465: step: 976/530, loss: 0.004103964660316706 2023-01-24 06:34:41.000137: step: 980/530, loss: 0.01312597468495369 2023-01-24 06:34:42.020318: step: 984/530, loss: 0.007851426489651203 2023-01-24 06:34:43.057691: step: 988/530, loss: 0.0032611184287816286 2023-01-24 06:34:44.096258: step: 992/530, loss: 0.044866736978292465 2023-01-24 06:34:45.122249: step: 996/530, loss: 0.0005240231403149664 2023-01-24 06:34:46.164485: step: 1000/530, loss: 0.009989464655518532 2023-01-24 06:34:47.203975: step: 1004/530, loss: 0.003820350393652916 2023-01-24 06:34:48.250881: step: 1008/530, loss: 0.009437700733542442 2023-01-24 06:34:49.297026: step: 1012/530, loss: 0.0017604655586183071 2023-01-24 06:34:50.325894: step: 1016/530, loss: 0.0025235763750970364 2023-01-24 06:34:51.362508: step: 1020/530, loss: 0.0037349306512624025 2023-01-24 06:34:52.395031: step: 1024/530, loss: 0.0013715805253013968 2023-01-24 06:34:53.454839: step: 1028/530, loss: 0.011247486807405949 2023-01-24 06:34:54.504183: step: 1032/530, loss: 0.003384503535926342 2023-01-24 06:34:55.549885: step: 1036/530, loss: 0.009993638843297958 2023-01-24 06:34:56.578278: step: 1040/530, loss: 0.0016267661703750491 2023-01-24 06:34:57.613133: step: 1044/530, loss: 0.006866056472063065 2023-01-24 06:34:58.648530: step: 1048/530, loss: 0.016553768888115883 2023-01-24 06:34:59.685080: step: 1052/530, loss: 0.008998163044452667 2023-01-24 06:35:00.745971: step: 1056/530, loss: 0.03297252953052521 2023-01-24 06:35:01.782215: step: 1060/530, loss: 0.021336859092116356 2023-01-24 06:35:02.831923: step: 1064/530, loss: 0.0045573231764137745 2023-01-24 06:35:03.871204: step: 1068/530, loss: 0.0048517524264752865 2023-01-24 06:35:04.923121: step: 1072/530, loss: 5.3648618631996214e-05 2023-01-24 06:35:05.962652: step: 1076/530, loss: 0.0048005483113229275 2023-01-24 06:35:07.006625: step: 1080/530, loss: 0.017492195591330528 2023-01-24 06:35:08.068689: step: 1084/530, loss: 0.002924201311543584 2023-01-24 06:35:09.121724: step: 1088/530, loss: 0.0017691574757918715 2023-01-24 06:35:10.162306: step: 1092/530, loss: 0.006907281931489706 2023-01-24 06:35:11.217405: step: 1096/530, loss: 0.003989166114479303 2023-01-24 06:35:12.249854: step: 1100/530, loss: 0.0014421823434531689 2023-01-24 06:35:13.292092: step: 1104/530, loss: 0.0005379109643399715 2023-01-24 06:35:14.334778: step: 1108/530, loss: 0.029883868992328644 2023-01-24 06:35:15.378698: step: 1112/530, loss: 0.006449008826166391 2023-01-24 06:35:16.411850: step: 1116/530, loss: 0.0029880276415497065 2023-01-24 06:35:17.449094: step: 1120/530, loss: 0.010432815179228783 2023-01-24 06:35:18.509841: step: 1124/530, loss: 0.008568570017814636 2023-01-24 06:35:19.564992: step: 1128/530, loss: 0.0017055398784577847 2023-01-24 06:35:20.604763: step: 1132/530, loss: 0.000813948514405638 2023-01-24 06:35:21.666065: step: 1136/530, loss: 0.004094402771443129 2023-01-24 06:35:22.721426: step: 1140/530, loss: 0.001564537757076323 2023-01-24 06:35:23.785069: step: 1144/530, loss: 0.00947826448827982 2023-01-24 06:35:24.815638: step: 1148/530, loss: 0.0015115514397621155 2023-01-24 06:35:25.871686: step: 1152/530, loss: 0.004356694407761097 2023-01-24 06:35:26.915642: step: 1156/530, loss: 0.008171956986188889 2023-01-24 06:35:27.946570: step: 1160/530, loss: 0.014146357774734497 2023-01-24 06:35:28.986119: step: 1164/530, loss: 0.00569186033681035 2023-01-24 06:35:30.035748: step: 1168/530, loss: 0.02225622348487377 2023-01-24 06:35:31.079438: step: 1172/530, loss: 0.05347214266657829 2023-01-24 06:35:32.110336: step: 1176/530, loss: 0.0071417526341974735 2023-01-24 06:35:33.167685: step: 1180/530, loss: 0.003233895869925618 2023-01-24 06:35:34.201367: step: 1184/530, loss: 0.007582392077893019 2023-01-24 06:35:35.259543: step: 1188/530, loss: 0.03176518902182579 2023-01-24 06:35:36.283335: step: 1192/530, loss: 0.02226613275706768 2023-01-24 06:35:37.341965: step: 1196/530, loss: 0.008522610180079937 2023-01-24 06:35:38.387082: step: 1200/530, loss: 0.004799327347427607 2023-01-24 06:35:39.417303: step: 1204/530, loss: 0.016248898580670357 2023-01-24 06:35:40.458721: step: 1208/530, loss: 0.004367674235254526 2023-01-24 06:35:41.510297: step: 1212/530, loss: 0.005273491144180298 2023-01-24 06:35:42.558623: step: 1216/530, loss: 0.0064430818893015385 2023-01-24 06:35:43.582797: step: 1220/530, loss: 0.006095066666603088 2023-01-24 06:35:44.622519: step: 1224/530, loss: 0.0018999907188117504 2023-01-24 06:35:45.653027: step: 1228/530, loss: 0.001671053934842348 2023-01-24 06:35:46.708866: step: 1232/530, loss: 0.002718855394050479 2023-01-24 06:35:47.734336: step: 1236/530, loss: 0.00263481424190104 2023-01-24 06:35:48.771596: step: 1240/530, loss: 0.0017753038555383682 2023-01-24 06:35:49.826833: step: 1244/530, loss: 0.005754063371568918 2023-01-24 06:35:50.870568: step: 1248/530, loss: 0.0019165900303050876 2023-01-24 06:35:51.903623: step: 1252/530, loss: 0.00745938066393137 2023-01-24 06:35:52.938369: step: 1256/530, loss: 0.0020056532230228186 2023-01-24 06:35:53.989086: step: 1260/530, loss: 0.0032334693241864443 2023-01-24 06:35:55.046351: step: 1264/530, loss: 0.0031998935155570507 2023-01-24 06:35:56.096460: step: 1268/530, loss: 0.007909215055406094 2023-01-24 06:35:57.124111: step: 1272/530, loss: 0.012260696850717068 2023-01-24 06:35:58.152847: step: 1276/530, loss: 0.003334488021209836 2023-01-24 06:35:59.205559: step: 1280/530, loss: 0.009210821241140366 2023-01-24 06:36:00.259289: step: 1284/530, loss: 0.012615853920578957 2023-01-24 06:36:01.306216: step: 1288/530, loss: 0.01089463196694851 2023-01-24 06:36:02.340634: step: 1292/530, loss: 0.0032961037941277027 2023-01-24 06:36:03.392315: step: 1296/530, loss: 0.005276534240692854 2023-01-24 06:36:04.433154: step: 1300/530, loss: 0.001777772675268352 2023-01-24 06:36:05.479461: step: 1304/530, loss: 0.0032450249418616295 2023-01-24 06:36:06.512150: step: 1308/530, loss: 0.008616378530859947 2023-01-24 06:36:07.548614: step: 1312/530, loss: 0.0014581545256078243 2023-01-24 06:36:08.586578: step: 1316/530, loss: 0.00254250830039382 2023-01-24 06:36:09.629432: step: 1320/530, loss: 0.014334144070744514 2023-01-24 06:36:10.691937: step: 1324/530, loss: 0.05240749567747116 2023-01-24 06:36:11.724352: step: 1328/530, loss: 0.0019484309013932943 2023-01-24 06:36:12.779182: step: 1332/530, loss: 0.0003880032163579017 2023-01-24 06:36:13.846609: step: 1336/530, loss: 0.0029791533015668392 2023-01-24 06:36:14.887596: step: 1340/530, loss: 0.0009021844016388059 2023-01-24 06:36:15.933642: step: 1344/530, loss: 0.01908363774418831 2023-01-24 06:36:16.989234: step: 1348/530, loss: 0.008514597080647945 2023-01-24 06:36:18.024567: step: 1352/530, loss: 0.018725385889410973 2023-01-24 06:36:19.061379: step: 1356/530, loss: 9.112127372645773e-06 2023-01-24 06:36:20.102306: step: 1360/530, loss: 0.007284039631485939 2023-01-24 06:36:21.140448: step: 1364/530, loss: 0.0056719123385846615 2023-01-24 06:36:22.176711: step: 1368/530, loss: 0.0002533484366722405 2023-01-24 06:36:23.227015: step: 1372/530, loss: 0.0037012940738350153 2023-01-24 06:36:24.323681: step: 1376/530, loss: 0.006074863485991955 2023-01-24 06:36:25.359244: step: 1380/530, loss: 0.008641631342470646 2023-01-24 06:36:26.407014: step: 1384/530, loss: 0.0013487815158441663 2023-01-24 06:36:27.435378: step: 1388/530, loss: 0.0063590798527002335 2023-01-24 06:36:28.475065: step: 1392/530, loss: 0.01117555983364582 2023-01-24 06:36:29.508611: step: 1396/530, loss: 0.0009980843169614673 2023-01-24 06:36:30.551355: step: 1400/530, loss: 0.01162731647491455 2023-01-24 06:36:31.587485: step: 1404/530, loss: 0.005328621249645948 2023-01-24 06:36:32.623415: step: 1408/530, loss: 0.003818571101874113 2023-01-24 06:36:33.663415: step: 1412/530, loss: 0.004043970722705126 2023-01-24 06:36:34.701236: step: 1416/530, loss: 0.004837583750486374 2023-01-24 06:36:35.753022: step: 1420/530, loss: 0.0059318398125469685 2023-01-24 06:36:36.808609: step: 1424/530, loss: 0.0014331568963825703 2023-01-24 06:36:37.875013: step: 1428/530, loss: 0.007052761502563953 2023-01-24 06:36:38.922070: step: 1432/530, loss: 0.0038785580545663834 2023-01-24 06:36:39.972291: step: 1436/530, loss: 0.0014316333690658212 2023-01-24 06:36:41.019175: step: 1440/530, loss: 0.01590970903635025 2023-01-24 06:36:42.062328: step: 1444/530, loss: 0.0 2023-01-24 06:36:43.109359: step: 1448/530, loss: 0.0015100068412721157 2023-01-24 06:36:44.134055: step: 1452/530, loss: 0.02849707566201687 2023-01-24 06:36:45.178259: step: 1456/530, loss: 0.004898302257061005 2023-01-24 06:36:46.219700: step: 1460/530, loss: 0.010679779574275017 2023-01-24 06:36:47.254394: step: 1464/530, loss: 0.007697803433984518 2023-01-24 06:36:48.294685: step: 1468/530, loss: 0.0028260282706469297 2023-01-24 06:36:49.330837: step: 1472/530, loss: 0.006924837362021208 2023-01-24 06:36:50.372866: step: 1476/530, loss: 0.015142632648348808 2023-01-24 06:36:51.418898: step: 1480/530, loss: 0.0008756800089031458 2023-01-24 06:36:52.466283: step: 1484/530, loss: 0.013374381698668003 2023-01-24 06:36:53.509647: step: 1488/530, loss: 0.005547772627323866 2023-01-24 06:36:54.545934: step: 1492/530, loss: 0.00014117249520495534 2023-01-24 06:36:55.598653: step: 1496/530, loss: 0.09097698330879211 2023-01-24 06:36:56.648575: step: 1500/530, loss: 0.004561661276966333 2023-01-24 06:36:57.690910: step: 1504/530, loss: 0.005302931182086468 2023-01-24 06:36:58.724012: step: 1508/530, loss: 0.00365307554602623 2023-01-24 06:36:59.774650: step: 1512/530, loss: 0.004533231258392334 2023-01-24 06:37:00.794961: step: 1516/530, loss: 0.0005154838436283171 2023-01-24 06:37:01.866056: step: 1520/530, loss: 0.0012163642095401883 2023-01-24 06:37:02.928904: step: 1524/530, loss: 0.010871480219066143 2023-01-24 06:37:03.954212: step: 1528/530, loss: 0.004683495499193668 2023-01-24 06:37:04.992521: step: 1532/530, loss: 0.006208150181919336 2023-01-24 06:37:06.039753: step: 1536/530, loss: 0.026776233687996864 2023-01-24 06:37:07.071485: step: 1540/530, loss: 0.008641284890472889 2023-01-24 06:37:08.122989: step: 1544/530, loss: 0.0034048634115606546 2023-01-24 06:37:09.161946: step: 1548/530, loss: 0.0019314669771119952 2023-01-24 06:37:10.200539: step: 1552/530, loss: 0.01194714568555355 2023-01-24 06:37:11.242002: step: 1556/530, loss: 0.004168049432337284 2023-01-24 06:37:12.282198: step: 1560/530, loss: 0.010259849950671196 2023-01-24 06:37:13.340731: step: 1564/530, loss: 0.002234025625512004 2023-01-24 06:37:14.387217: step: 1568/530, loss: 0.004801113158464432 2023-01-24 06:37:15.428684: step: 1572/530, loss: 0.009865065105259418 2023-01-24 06:37:16.468270: step: 1576/530, loss: 0.02490215189754963 2023-01-24 06:37:17.517224: step: 1580/530, loss: 0.004020696971565485 2023-01-24 06:37:18.569739: step: 1584/530, loss: 0.004061207640916109 2023-01-24 06:37:19.625715: step: 1588/530, loss: 0.007300190627574921 2023-01-24 06:37:20.685026: step: 1592/530, loss: 0.007340441923588514 2023-01-24 06:37:21.741405: step: 1596/530, loss: 0.019605109468102455 2023-01-24 06:37:22.792287: step: 1600/530, loss: 0.007271318696439266 2023-01-24 06:37:23.844102: step: 1604/530, loss: 0.0002542764414101839 2023-01-24 06:37:24.873689: step: 1608/530, loss: 8.247878577094525e-05 2023-01-24 06:37:25.915054: step: 1612/530, loss: 0.002961857244372368 2023-01-24 06:37:26.964252: step: 1616/530, loss: 0.002005236456170678 2023-01-24 06:37:28.008979: step: 1620/530, loss: 0.03412347286939621 2023-01-24 06:37:29.046075: step: 1624/530, loss: 0.005694087594747543 2023-01-24 06:37:30.071578: step: 1628/530, loss: 0.002938526216894388 2023-01-24 06:37:31.121857: step: 1632/530, loss: 0.0035656930413097143 2023-01-24 06:37:32.167823: step: 1636/530, loss: 0.007496458012610674 2023-01-24 06:37:33.226706: step: 1640/530, loss: 0.015275801531970501 2023-01-24 06:37:34.263450: step: 1644/530, loss: 0.00030952124507166445 2023-01-24 06:37:35.320111: step: 1648/530, loss: 0.0016049513360485435 2023-01-24 06:37:36.399239: step: 1652/530, loss: 0.06627373397350311 2023-01-24 06:37:37.458935: step: 1656/530, loss: 0.004653996787965298 2023-01-24 06:37:38.519230: step: 1660/530, loss: 0.01616736687719822 2023-01-24 06:37:39.582223: step: 1664/530, loss: 0.004366998095065355 2023-01-24 06:37:40.631543: step: 1668/530, loss: 0.020630398765206337 2023-01-24 06:37:41.678809: step: 1672/530, loss: 0.008225682191550732 2023-01-24 06:37:42.728489: step: 1676/530, loss: 0.005981991998851299 2023-01-24 06:37:43.771501: step: 1680/530, loss: 0.019214877858757973 2023-01-24 06:37:44.813445: step: 1684/530, loss: 0.004969678353518248 2023-01-24 06:37:45.858756: step: 1688/530, loss: 0.01868354342877865 2023-01-24 06:37:46.906528: step: 1692/530, loss: 0.002672115806490183 2023-01-24 06:37:47.963883: step: 1696/530, loss: 0.03800823539495468 2023-01-24 06:37:49.001060: step: 1700/530, loss: 0.010799265466630459 2023-01-24 06:37:50.052717: step: 1704/530, loss: 0.02098977006971836 2023-01-24 06:37:51.102424: step: 1708/530, loss: 0.004991845693439245 2023-01-24 06:37:52.147474: step: 1712/530, loss: 0.0561748743057251 2023-01-24 06:37:53.190859: step: 1716/530, loss: 0.0015178319299593568 2023-01-24 06:37:54.230561: step: 1720/530, loss: 0.002624554792419076 2023-01-24 06:37:55.296147: step: 1724/530, loss: 0.0014093922218307853 2023-01-24 06:37:56.341394: step: 1728/530, loss: 0.004691623616963625 2023-01-24 06:37:57.389022: step: 1732/530, loss: 0.0004925410030409694 2023-01-24 06:37:58.430228: step: 1736/530, loss: 0.05746084824204445 2023-01-24 06:37:59.469977: step: 1740/530, loss: 0.0037279885727912188 2023-01-24 06:38:00.511852: step: 1744/530, loss: 0.003784911008551717 2023-01-24 06:38:01.563653: step: 1748/530, loss: 0.0002881013788282871 2023-01-24 06:38:02.602542: step: 1752/530, loss: 0.012532379478216171 2023-01-24 06:38:03.643845: step: 1756/530, loss: 0.0021440708078444004 2023-01-24 06:38:04.679062: step: 1760/530, loss: 0.0002058007230516523 2023-01-24 06:38:05.715926: step: 1764/530, loss: 0.0006012417725287378 2023-01-24 06:38:06.756102: step: 1768/530, loss: 0.0016347682103514671 2023-01-24 06:38:07.799387: step: 1772/530, loss: 0.003658115165308118 2023-01-24 06:38:08.833880: step: 1776/530, loss: 0.004269181285053492 2023-01-24 06:38:09.890372: step: 1780/530, loss: 0.00791000947356224 2023-01-24 06:38:10.950212: step: 1784/530, loss: 0.026806047186255455 2023-01-24 06:38:11.976447: step: 1788/530, loss: 0.00948000606149435 2023-01-24 06:38:13.028273: step: 1792/530, loss: 0.011920362710952759 2023-01-24 06:38:14.065569: step: 1796/530, loss: 0.03282766789197922 2023-01-24 06:38:15.118168: step: 1800/530, loss: 0.000908299523871392 2023-01-24 06:38:16.176741: step: 1804/530, loss: 0.0018953416729345918 2023-01-24 06:38:17.214202: step: 1808/530, loss: 0.005275444593280554 2023-01-24 06:38:18.257710: step: 1812/530, loss: 0.008262324146926403 2023-01-24 06:38:19.311126: step: 1816/530, loss: 0.0015323427505791187 2023-01-24 06:38:20.383265: step: 1820/530, loss: 0.004005383234471083 2023-01-24 06:38:21.425887: step: 1824/530, loss: 0.0029299065936356783 2023-01-24 06:38:22.464912: step: 1828/530, loss: 0.0006123905768617988 2023-01-24 06:38:23.509386: step: 1832/530, loss: 0.006294749211519957 2023-01-24 06:38:24.553243: step: 1836/530, loss: 0.006262174341827631 2023-01-24 06:38:25.608524: step: 1840/530, loss: 0.005474178120493889 2023-01-24 06:38:26.648634: step: 1844/530, loss: 0.007734323851764202 2023-01-24 06:38:27.690819: step: 1848/530, loss: 0.017927972599864006 2023-01-24 06:38:28.731157: step: 1852/530, loss: 0.01759951189160347 2023-01-24 06:38:29.799971: step: 1856/530, loss: 0.0019120501819998026 2023-01-24 06:38:30.836958: step: 1860/530, loss: 0.01430408377200365 2023-01-24 06:38:31.864907: step: 1864/530, loss: 0.008443888276815414 2023-01-24 06:38:32.936498: step: 1868/530, loss: 0.029394129291176796 2023-01-24 06:38:33.963791: step: 1872/530, loss: 0.005415191873908043 2023-01-24 06:38:34.991527: step: 1876/530, loss: 0.002877107122913003 2023-01-24 06:38:36.027537: step: 1880/530, loss: 0.01959078013896942 2023-01-24 06:38:37.071034: step: 1884/530, loss: 0.0007007047533988953 2023-01-24 06:38:38.104346: step: 1888/530, loss: 0.024128485471010208 2023-01-24 06:38:39.142108: step: 1892/530, loss: 0.006385908927768469 2023-01-24 06:38:40.188937: step: 1896/530, loss: 0.0003817017131950706 2023-01-24 06:38:41.249647: step: 1900/530, loss: 0.045657165348529816 2023-01-24 06:38:42.291294: step: 1904/530, loss: 0.004568448755890131 2023-01-24 06:38:43.317546: step: 1908/530, loss: 0.00264281895942986 2023-01-24 06:38:44.366616: step: 1912/530, loss: 0.0071998341009020805 2023-01-24 06:38:45.411154: step: 1916/530, loss: 0.001907242345623672 2023-01-24 06:38:46.453591: step: 1920/530, loss: 0.01005789265036583 2023-01-24 06:38:47.492068: step: 1924/530, loss: 0.011069388128817081 2023-01-24 06:38:48.532449: step: 1928/530, loss: 0.00021996225405018777 2023-01-24 06:38:49.570526: step: 1932/530, loss: 0.0023647595662623644 2023-01-24 06:38:50.610497: step: 1936/530, loss: 0.034565169364213943 2023-01-24 06:38:51.645490: step: 1940/530, loss: 0.00128383026458323 2023-01-24 06:38:52.690574: step: 1944/530, loss: 0.003384356154128909 2023-01-24 06:38:53.744072: step: 1948/530, loss: 0.0057662129402160645 2023-01-24 06:38:54.796471: step: 1952/530, loss: 0.004734586924314499 2023-01-24 06:38:55.835534: step: 1956/530, loss: 0.0028805905021727085 2023-01-24 06:38:56.885318: step: 1960/530, loss: 0.005686209537088871 2023-01-24 06:38:57.913994: step: 1964/530, loss: 0.07512509077787399 2023-01-24 06:38:58.963904: step: 1968/530, loss: 0.007569109555333853 2023-01-24 06:39:00.000579: step: 1972/530, loss: 0.011002618819475174 2023-01-24 06:39:01.045436: step: 1976/530, loss: 0.0035132223274558783 2023-01-24 06:39:02.073730: step: 1980/530, loss: 0.005859080236405134 2023-01-24 06:39:03.131239: step: 1984/530, loss: 0.013466530479490757 2023-01-24 06:39:04.173263: step: 1988/530, loss: 0.015540882013738155 2023-01-24 06:39:05.233655: step: 1992/530, loss: 0.015781747177243233 2023-01-24 06:39:06.281587: step: 1996/530, loss: 0.014215042814612389 2023-01-24 06:39:07.331609: step: 2000/530, loss: 0.018209019675850868 2023-01-24 06:39:08.374367: step: 2004/530, loss: 0.004298359155654907 2023-01-24 06:39:09.414225: step: 2008/530, loss: 0.003188485512509942 2023-01-24 06:39:10.456770: step: 2012/530, loss: 0.0033658568281680346 2023-01-24 06:39:11.497017: step: 2016/530, loss: 0.005697112064808607 2023-01-24 06:39:12.529654: step: 2020/530, loss: 0.0010083907982334495 2023-01-24 06:39:13.572253: step: 2024/530, loss: 0.0069275605492293835 2023-01-24 06:39:14.613978: step: 2028/530, loss: 0.009948932565748692 2023-01-24 06:39:15.649088: step: 2032/530, loss: 0.007743677590042353 2023-01-24 06:39:16.697866: step: 2036/530, loss: 0.0029076864011585712 2023-01-24 06:39:17.755217: step: 2040/530, loss: 0.0050680204294621944 2023-01-24 06:39:18.793303: step: 2044/530, loss: 0.002660448430106044 2023-01-24 06:39:19.846645: step: 2048/530, loss: 0.019445575773715973 2023-01-24 06:39:20.887815: step: 2052/530, loss: 0.0033525116741657257 2023-01-24 06:39:21.930652: step: 2056/530, loss: 0.009775001555681229 2023-01-24 06:39:22.963511: step: 2060/530, loss: 0.00822951178997755 2023-01-24 06:39:23.995972: step: 2064/530, loss: 0.03787067160010338 2023-01-24 06:39:25.031400: step: 2068/530, loss: 0.008486567065119743 2023-01-24 06:39:26.085540: step: 2072/530, loss: 0.02640714682638645 2023-01-24 06:39:27.125855: step: 2076/530, loss: 0.003663779702037573 2023-01-24 06:39:28.184467: step: 2080/530, loss: 0.023887792602181435 2023-01-24 06:39:29.254264: step: 2084/530, loss: 0.004308950621634722 2023-01-24 06:39:30.291762: step: 2088/530, loss: 0.005090512800961733 2023-01-24 06:39:31.341504: step: 2092/530, loss: 0.004757900722324848 2023-01-24 06:39:32.396223: step: 2096/530, loss: 0.017214633524417877 2023-01-24 06:39:33.435802: step: 2100/530, loss: 0.0040232776664197445 2023-01-24 06:39:34.477643: step: 2104/530, loss: 0.018518147990107536 2023-01-24 06:39:35.530328: step: 2108/530, loss: 0.0037364864256232977 2023-01-24 06:39:36.593923: step: 2112/530, loss: 0.016615334898233414 2023-01-24 06:39:37.647795: step: 2116/530, loss: 0.04572223871946335 2023-01-24 06:39:38.675766: step: 2120/530, loss: 0.0041249594651162624 ================================================== Loss: 0.009 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37509743875278395, 'r': 0.3195801707779886, 'f1': 0.3451203893442623}, 'combined': 0.25429923425366696, 'stategy': 1, 'epoch': 8} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37477309194500474, 'r': 0.38889597500543227, 'f1': 0.38170394299134897}, 'combined': 0.295866214184682, 'stategy': 1, 'epoch': 8} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3953728281853282, 'r': 0.33310348332881545, 'f1': 0.3615767985876122}, 'combined': 0.266425009485609, 'stategy': 1, 'epoch': 8} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37187421934722487, 'r': 0.36777266545736575, 'f1': 0.3698120702565748}, 'combined': 0.28664859034241685, 'stategy': 1, 'epoch': 8} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38720415311180817, 'r': 0.33283393047371745, 'f1': 0.35796628848907985}, 'combined': 0.26376463362353253, 'stategy': 1, 'epoch': 8} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36421427197230394, 'r': 0.3625404931489018, 'f1': 0.3633754551322019}, 'combined': 0.28165944369098905, 'stategy': 1, 'epoch': 8} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 8} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5, 'r': 0.41304347826086957, 'f1': 0.45238095238095233}, 'combined': 0.22619047619047616, 'stategy': 1, 'epoch': 8} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 8} New best russian model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37704166666666666, 'r': 0.32195208728652747, 'f1': 0.3473259979529171}, 'combined': 0.25592441954425466, 'stategy': 1, 'epoch': 6} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37621134584593835, 'r': 0.3907342102995499, 'f1': 0.3833352757492428}, 'combined': 0.29713069220754706, 'stategy': 1, 'epoch': 6} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 6} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38720415311180817, 'r': 0.33283393047371745, 'f1': 0.35796628848907985}, 'combined': 0.26376463362353253, 'stategy': 1, 'epoch': 8} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36421427197230394, 'r': 0.3625404931489018, 'f1': 0.3633754551322019}, 'combined': 0.28165944369098905, 'stategy': 1, 'epoch': 8} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 8} ****************************** Epoch: 9 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 06:42:12.856131: step: 4/530, loss: 0.0006209381972439587 2023-01-24 06:42:13.901490: step: 8/530, loss: 0.005409138277173042 2023-01-24 06:42:14.925685: step: 12/530, loss: 0.0015448397025465965 2023-01-24 06:42:15.965709: step: 16/530, loss: 0.010289283469319344 2023-01-24 06:42:17.004582: step: 20/530, loss: 0.0035234715323895216 2023-01-24 06:42:18.044061: step: 24/530, loss: 0.0014163681771606207 2023-01-24 06:42:19.072933: step: 28/530, loss: 0.0028939873445779085 2023-01-24 06:42:20.116645: step: 32/530, loss: 0.00071155303157866 2023-01-24 06:42:21.172994: step: 36/530, loss: 0.0013890970731154084 2023-01-24 06:42:22.214678: step: 40/530, loss: 0.01129063218832016 2023-01-24 06:42:23.249450: step: 44/530, loss: 0.008677608333528042 2023-01-24 06:42:24.283560: step: 48/530, loss: 0.003512483322992921 2023-01-24 06:42:25.337155: step: 52/530, loss: 0.007468697149306536 2023-01-24 06:42:26.372635: step: 56/530, loss: 0.0032410991843789816 2023-01-24 06:42:27.409836: step: 60/530, loss: 0.005233378149569035 2023-01-24 06:42:28.433706: step: 64/530, loss: 0.0013106934493407607 2023-01-24 06:42:29.465642: step: 68/530, loss: 0.002669335575774312 2023-01-24 06:42:30.501470: step: 72/530, loss: 0.009931476786732674 2023-01-24 06:42:31.545805: step: 76/530, loss: 0.008454172872006893 2023-01-24 06:42:32.589175: step: 80/530, loss: 0.0012372930068522692 2023-01-24 06:42:33.644455: step: 84/530, loss: 0.006941849831491709 2023-01-24 06:42:34.671533: step: 88/530, loss: 0.003480770858004689 2023-01-24 06:42:35.719976: step: 92/530, loss: 0.003321863943710923 2023-01-24 06:42:36.773809: step: 96/530, loss: 0.006346917245537043 2023-01-24 06:42:37.821967: step: 100/530, loss: 0.004151160828769207 2023-01-24 06:42:38.861160: step: 104/530, loss: 0.010191456414759159 2023-01-24 06:42:39.904012: step: 108/530, loss: 0.00170665024779737 2023-01-24 06:42:40.939685: step: 112/530, loss: 0.010996382683515549 2023-01-24 06:42:41.981473: step: 116/530, loss: 0.005379866808652878 2023-01-24 06:42:43.023358: step: 120/530, loss: 0.013132884167134762 2023-01-24 06:42:44.064621: step: 124/530, loss: 0.002991231856867671 2023-01-24 06:42:45.099978: step: 128/530, loss: 0.005615054629743099 2023-01-24 06:42:46.144019: step: 132/530, loss: 0.0002714320144150406 2023-01-24 06:42:47.189131: step: 136/530, loss: 0.0022933476138859987 2023-01-24 06:42:48.246728: step: 140/530, loss: 0.010669552721083164 2023-01-24 06:42:49.296176: step: 144/530, loss: 0.0037675295025110245 2023-01-24 06:42:50.343799: step: 148/530, loss: 0.009470069780945778 2023-01-24 06:42:51.369510: step: 152/530, loss: 0.0024332383181899786 2023-01-24 06:42:52.408882: step: 156/530, loss: 0.0005654859123751521 2023-01-24 06:42:53.455109: step: 160/530, loss: 0.005316976923495531 2023-01-24 06:42:54.505217: step: 164/530, loss: 0.0028190724551677704 2023-01-24 06:42:55.547298: step: 168/530, loss: 0.018861649557948112 2023-01-24 06:42:56.584956: step: 172/530, loss: 0.004665170796215534 2023-01-24 06:42:57.626143: step: 176/530, loss: 0.006975051015615463 2023-01-24 06:42:58.681580: step: 180/530, loss: 0.005266045220196247 2023-01-24 06:42:59.716469: step: 184/530, loss: 0.0073999869637191296 2023-01-24 06:43:00.760431: step: 188/530, loss: 0.005271570757031441 2023-01-24 06:43:01.794169: step: 192/530, loss: 0.0040196911431849 2023-01-24 06:43:02.848749: step: 196/530, loss: 0.0050012799911201 2023-01-24 06:43:03.897963: step: 200/530, loss: 0.009146283380687237 2023-01-24 06:43:04.961905: step: 204/530, loss: 0.0016826997743919492 2023-01-24 06:43:06.013760: step: 208/530, loss: 0.0018508293433114886 2023-01-24 06:43:07.065012: step: 212/530, loss: 0.002263486385345459 2023-01-24 06:43:08.119203: step: 216/530, loss: 0.003722940571606159 2023-01-24 06:43:09.153902: step: 220/530, loss: 0.004396012052893639 2023-01-24 06:43:10.194811: step: 224/530, loss: 0.0007305858307518065 2023-01-24 06:43:11.233958: step: 228/530, loss: 0.0157123152166605 2023-01-24 06:43:12.268256: step: 232/530, loss: 0.002254583640024066 2023-01-24 06:43:13.327462: step: 236/530, loss: 0.02397082932293415 2023-01-24 06:43:14.372120: step: 240/530, loss: 0.0029040116351097822 2023-01-24 06:43:15.421883: step: 244/530, loss: 0.002293383004143834 2023-01-24 06:43:16.461904: step: 248/530, loss: 0.0024760798551142216 2023-01-24 06:43:17.503263: step: 252/530, loss: 0.0003948241355828941 2023-01-24 06:43:18.537155: step: 256/530, loss: 0.005318681709468365 2023-01-24 06:43:19.571821: step: 260/530, loss: 0.003933188039809465 2023-01-24 06:43:20.612495: step: 264/530, loss: 0.0022918349131941795 2023-01-24 06:43:21.667061: step: 268/530, loss: 0.001917347894050181 2023-01-24 06:43:22.729691: step: 272/530, loss: 0.008362486027181149 2023-01-24 06:43:23.779039: step: 276/530, loss: 0.003461591899394989 2023-01-24 06:43:24.841900: step: 280/530, loss: 0.014286975376307964 2023-01-24 06:43:25.890742: step: 284/530, loss: 0.005234415177255869 2023-01-24 06:43:26.927107: step: 288/530, loss: 0.006149015389382839 2023-01-24 06:43:27.970423: step: 292/530, loss: 0.008718025870621204 2023-01-24 06:43:29.029354: step: 296/530, loss: 0.003898176597431302 2023-01-24 06:43:30.062653: step: 300/530, loss: 0.004752518143504858 2023-01-24 06:43:31.104181: step: 304/530, loss: 0.00403517996892333 2023-01-24 06:43:32.152374: step: 308/530, loss: 0.002216941677033901 2023-01-24 06:43:33.230363: step: 312/530, loss: 0.01114710420370102 2023-01-24 06:43:34.289286: step: 316/530, loss: 0.0022061492782086134 2023-01-24 06:43:35.344458: step: 320/530, loss: 0.0073404936119914055 2023-01-24 06:43:36.384610: step: 324/530, loss: 0.0035091866739094257 2023-01-24 06:43:37.434755: step: 328/530, loss: 0.007213753182440996 2023-01-24 06:43:38.487481: step: 332/530, loss: 0.0007382984622381628 2023-01-24 06:43:39.529512: step: 336/530, loss: 0.002657539676874876 2023-01-24 06:43:40.596916: step: 340/530, loss: 0.015084072947502136 2023-01-24 06:43:41.646979: step: 344/530, loss: 0.002511706668883562 2023-01-24 06:43:42.682510: step: 348/530, loss: 0.008695260621607304 2023-01-24 06:43:43.745078: step: 352/530, loss: 0.0001467554538976401 2023-01-24 06:43:44.785148: step: 356/530, loss: 0.002057208912447095 2023-01-24 06:43:45.820179: step: 360/530, loss: 0.00023294858692679554 2023-01-24 06:43:46.859167: step: 364/530, loss: 0.003144181100651622 2023-01-24 06:43:47.917846: step: 368/530, loss: 0.001276860828511417 2023-01-24 06:43:48.970584: step: 372/530, loss: 0.0028216044884175062 2023-01-24 06:43:50.015734: step: 376/530, loss: 0.010744867846369743 2023-01-24 06:43:51.060801: step: 380/530, loss: 0.012082196772098541 2023-01-24 06:43:52.123821: step: 384/530, loss: 0.01160083245486021 2023-01-24 06:43:53.186000: step: 388/530, loss: 0.004039873369038105 2023-01-24 06:43:54.235446: step: 392/530, loss: 0.002372811082750559 2023-01-24 06:43:55.258463: step: 396/530, loss: 0.0052165803499519825 2023-01-24 06:43:56.311913: step: 400/530, loss: 0.010901889763772488 2023-01-24 06:43:57.373181: step: 404/530, loss: 7.632553024450317e-05 2023-01-24 06:43:58.425385: step: 408/530, loss: 0.007905535399913788 2023-01-24 06:43:59.459510: step: 412/530, loss: 0.023107746616005898 2023-01-24 06:44:00.518297: step: 416/530, loss: 0.004115113522857428 2023-01-24 06:44:01.557892: step: 420/530, loss: 0.005026670638471842 2023-01-24 06:44:02.597888: step: 424/530, loss: 0.0001979036896955222 2023-01-24 06:44:03.642209: step: 428/530, loss: 2.4248825866379775e-05 2023-01-24 06:44:04.686698: step: 432/530, loss: 0.003198995254933834 2023-01-24 06:44:05.733558: step: 436/530, loss: 0.006178115028887987 2023-01-24 06:44:06.788649: step: 440/530, loss: 0.013625619001686573 2023-01-24 06:44:07.829314: step: 444/530, loss: 0.012171263806521893 2023-01-24 06:44:08.860249: step: 448/530, loss: 0.0010392614640295506 2023-01-24 06:44:09.890635: step: 452/530, loss: 0.00856825988739729 2023-01-24 06:44:10.932208: step: 456/530, loss: 0.0022253484930843115 2023-01-24 06:44:11.983987: step: 460/530, loss: 5.9952533774776384e-05 2023-01-24 06:44:13.039273: step: 464/530, loss: 0.00378594477660954 2023-01-24 06:44:14.079512: step: 468/530, loss: 0.002749522915109992 2023-01-24 06:44:15.122974: step: 472/530, loss: 4.452800203580409e-05 2023-01-24 06:44:16.175921: step: 476/530, loss: 0.039248015731573105 2023-01-24 06:44:17.224169: step: 480/530, loss: 0.0035848915576934814 2023-01-24 06:44:18.272616: step: 484/530, loss: 0.010259442962706089 2023-01-24 06:44:19.313014: step: 488/530, loss: 0.0048105353489518166 2023-01-24 06:44:20.360848: step: 492/530, loss: 0.00436235498636961 2023-01-24 06:44:21.397534: step: 496/530, loss: 0.006622565444558859 2023-01-24 06:44:22.453108: step: 500/530, loss: 0.007045813370496035 2023-01-24 06:44:23.508925: step: 504/530, loss: 0.013757947832345963 2023-01-24 06:44:24.563582: step: 508/530, loss: 0.0018067141063511372 2023-01-24 06:44:25.595406: step: 512/530, loss: 0.0005818530917167664 2023-01-24 06:44:26.635006: step: 516/530, loss: 4.2711140849860385e-05 2023-01-24 06:44:27.677984: step: 520/530, loss: 0.0030087523628026247 2023-01-24 06:44:28.726009: step: 524/530, loss: 0.011717578396201134 2023-01-24 06:44:29.775463: step: 528/530, loss: 0.004926319234073162 2023-01-24 06:44:30.811090: step: 532/530, loss: 0.005543484352529049 2023-01-24 06:44:31.850723: step: 536/530, loss: 0.0037364745512604713 2023-01-24 06:44:32.892170: step: 540/530, loss: 0.012873668223619461 2023-01-24 06:44:33.947886: step: 544/530, loss: 0.0017886903369799256 2023-01-24 06:44:34.997220: step: 548/530, loss: 0.0009586654487065971 2023-01-24 06:44:36.044993: step: 552/530, loss: 0.00022563175298273563 2023-01-24 06:44:37.078783: step: 556/530, loss: 0.001532841706648469 2023-01-24 06:44:38.124965: step: 560/530, loss: 0.002271534875035286 2023-01-24 06:44:39.175611: step: 564/530, loss: 0.0018010871717706323 2023-01-24 06:44:40.226684: step: 568/530, loss: 0.0018214972224086523 2023-01-24 06:44:41.278426: step: 572/530, loss: 0.010475671850144863 2023-01-24 06:44:42.322766: step: 576/530, loss: 0.0017840828513726592 2023-01-24 06:44:43.363371: step: 580/530, loss: 0.0007851749542169273 2023-01-24 06:44:44.399966: step: 584/530, loss: 0.010895797982811928 2023-01-24 06:44:45.471321: step: 588/530, loss: 0.0010575465857982635 2023-01-24 06:44:46.511204: step: 592/530, loss: 0.0058981976471841335 2023-01-24 06:44:47.555674: step: 596/530, loss: 0.009622196666896343 2023-01-24 06:44:48.584060: step: 600/530, loss: 0.005134582985192537 2023-01-24 06:44:49.645416: step: 604/530, loss: 0.01785311847925186 2023-01-24 06:44:50.680027: step: 608/530, loss: 0.004243937321007252 2023-01-24 06:44:51.723413: step: 612/530, loss: 0.0037687995936721563 2023-01-24 06:44:52.781256: step: 616/530, loss: 0.008864447474479675 2023-01-24 06:44:53.828794: step: 620/530, loss: 0.002821667119860649 2023-01-24 06:44:54.875800: step: 624/530, loss: 0.009178198873996735 2023-01-24 06:44:55.919705: step: 628/530, loss: 0.0051460848189890385 2023-01-24 06:44:56.970972: step: 632/530, loss: 0.002938908291980624 2023-01-24 06:44:58.011614: step: 636/530, loss: 0.0010824577184394002 2023-01-24 06:44:59.065574: step: 640/530, loss: 0.0030520702712237835 2023-01-24 06:45:00.126139: step: 644/530, loss: 0.005224923603236675 2023-01-24 06:45:01.175902: step: 648/530, loss: 0.0032114519271999598 2023-01-24 06:45:02.228097: step: 652/530, loss: 0.0025177313946187496 2023-01-24 06:45:03.267212: step: 656/530, loss: 0.003136696759611368 2023-01-24 06:45:04.294081: step: 660/530, loss: 0.010835128836333752 2023-01-24 06:45:05.324005: step: 664/530, loss: 0.000787380849942565 2023-01-24 06:45:06.358722: step: 668/530, loss: 0.0014537522802129388 2023-01-24 06:45:07.395585: step: 672/530, loss: 1.820558827603236e-05 2023-01-24 06:45:08.448251: step: 676/530, loss: 0.026104798540472984 2023-01-24 06:45:09.476696: step: 680/530, loss: 0.0033932935912162066 2023-01-24 06:45:10.523760: step: 684/530, loss: 0.0176799725741148 2023-01-24 06:45:11.572007: step: 688/530, loss: 0.0019636424258351326 2023-01-24 06:45:12.638294: step: 692/530, loss: 0.0056401388719677925 2023-01-24 06:45:13.691434: step: 696/530, loss: 0.0040038335137069225 2023-01-24 06:45:14.734699: step: 700/530, loss: 0.00013681819837074727 2023-01-24 06:45:15.789543: step: 704/530, loss: 0.005105760879814625 2023-01-24 06:45:16.835530: step: 708/530, loss: 0.0054229130037128925 2023-01-24 06:45:17.875096: step: 712/530, loss: 0.010855082422494888 2023-01-24 06:45:18.915142: step: 716/530, loss: 0.0009179575135931373 2023-01-24 06:45:19.958441: step: 720/530, loss: 0.003498739330098033 2023-01-24 06:45:21.010691: step: 724/530, loss: 0.03850526362657547 2023-01-24 06:45:22.051213: step: 728/530, loss: 0.0026494988705962896 2023-01-24 06:45:23.100851: step: 732/530, loss: 0.004396180156618357 2023-01-24 06:45:24.158761: step: 736/530, loss: 0.004936248064041138 2023-01-24 06:45:25.207601: step: 740/530, loss: 0.041989538818597794 2023-01-24 06:45:26.245120: step: 744/530, loss: 0.00226575112901628 2023-01-24 06:45:27.289354: step: 748/530, loss: 0.003907649777829647 2023-01-24 06:45:28.371145: step: 752/530, loss: 0.006387569475919008 2023-01-24 06:45:29.431310: step: 756/530, loss: 0.001551038702018559 2023-01-24 06:45:30.483940: step: 760/530, loss: 0.0010991533054038882 2023-01-24 06:45:31.517793: step: 764/530, loss: 0.0021354707423597574 2023-01-24 06:45:32.560237: step: 768/530, loss: 0.0043305279687047005 2023-01-24 06:45:33.617893: step: 772/530, loss: 0.0020844945684075356 2023-01-24 06:45:34.681573: step: 776/530, loss: 0.00469202222302556 2023-01-24 06:45:35.731074: step: 780/530, loss: 0.0034021888859570026 2023-01-24 06:45:36.759293: step: 784/530, loss: 0.0017556928796693683 2023-01-24 06:45:37.808190: step: 788/530, loss: 0.0032824957743287086 2023-01-24 06:45:38.865104: step: 792/530, loss: 0.010158962570130825 2023-01-24 06:45:39.906127: step: 796/530, loss: 0.007878285832703114 2023-01-24 06:45:40.958300: step: 800/530, loss: 0.004742312710732222 2023-01-24 06:45:42.005690: step: 804/530, loss: 0.009991863742470741 2023-01-24 06:45:43.041302: step: 808/530, loss: 0.0013612674083560705 2023-01-24 06:45:44.087974: step: 812/530, loss: 0.0015850623603910208 2023-01-24 06:45:45.143636: step: 816/530, loss: 0.002510854508727789 2023-01-24 06:45:46.178148: step: 820/530, loss: 2.8556860343087465e-05 2023-01-24 06:45:47.218011: step: 824/530, loss: 0.015842730179429054 2023-01-24 06:45:48.264981: step: 828/530, loss: 0.00478518707677722 2023-01-24 06:45:49.297355: step: 832/530, loss: 0.0014124192530289292 2023-01-24 06:45:50.373225: step: 836/530, loss: 0.0008071013726294041 2023-01-24 06:45:51.423835: step: 840/530, loss: 0.0035026699770241976 2023-01-24 06:45:52.477665: step: 844/530, loss: 0.006822494324296713 2023-01-24 06:45:53.527377: step: 848/530, loss: 0.002910975832492113 2023-01-24 06:45:54.567317: step: 852/530, loss: 0.007475380785763264 2023-01-24 06:45:55.609295: step: 856/530, loss: 0.009072045795619488 2023-01-24 06:45:56.654378: step: 860/530, loss: 0.002773278160020709 2023-01-24 06:45:57.697216: step: 864/530, loss: 0.01841503381729126 2023-01-24 06:45:58.729430: step: 868/530, loss: 0.0025660002138465643 2023-01-24 06:45:59.770686: step: 872/530, loss: 0.0016632447950541973 2023-01-24 06:46:00.812979: step: 876/530, loss: 0.008733168244361877 2023-01-24 06:46:01.841195: step: 880/530, loss: 0.0022561594378203154 2023-01-24 06:46:02.868170: step: 884/530, loss: 0.007295619696378708 2023-01-24 06:46:03.926556: step: 888/530, loss: 0.0019046009983867407 2023-01-24 06:46:04.981572: step: 892/530, loss: 0.021429788321256638 2023-01-24 06:46:06.009449: step: 896/530, loss: 0.004059345927089453 2023-01-24 06:46:07.052678: step: 900/530, loss: 0.023798787966370583 2023-01-24 06:46:08.098217: step: 904/530, loss: 0.00261833518743515 2023-01-24 06:46:09.127548: step: 908/530, loss: 0.005177017766982317 2023-01-24 06:46:10.163656: step: 912/530, loss: 0.0010973135940730572 2023-01-24 06:46:11.216977: step: 916/530, loss: 0.003613788168877363 2023-01-24 06:46:12.272148: step: 920/530, loss: 0.003889397718012333 2023-01-24 06:46:13.319081: step: 924/530, loss: 0.010057389736175537 2023-01-24 06:46:14.369704: step: 928/530, loss: 0.0015708347782492638 2023-01-24 06:46:15.419326: step: 932/530, loss: 0.007073408458381891 2023-01-24 06:46:16.468439: step: 936/530, loss: 0.0020177685655653477 2023-01-24 06:46:17.508435: step: 940/530, loss: 0.05060373619198799 2023-01-24 06:46:18.556659: step: 944/530, loss: 0.002321278676390648 2023-01-24 06:46:19.594220: step: 948/530, loss: 0.001859754789620638 2023-01-24 06:46:20.625854: step: 952/530, loss: 0.0010469758417457342 2023-01-24 06:46:21.654692: step: 956/530, loss: 0.00036462058778852224 2023-01-24 06:46:22.717665: step: 960/530, loss: 0.004063926171511412 2023-01-24 06:46:23.750135: step: 964/530, loss: 0.0006449102656915784 2023-01-24 06:46:24.802808: step: 968/530, loss: 0.04210960492491722 2023-01-24 06:46:25.855995: step: 972/530, loss: 0.011882578022778034 2023-01-24 06:46:26.907261: step: 976/530, loss: 0.004899441264569759 2023-01-24 06:46:27.960250: step: 980/530, loss: 0.00011892046313732862 2023-01-24 06:46:29.012069: step: 984/530, loss: 0.0013491458958014846 2023-01-24 06:46:30.071805: step: 988/530, loss: 0.00580895971506834 2023-01-24 06:46:31.110711: step: 992/530, loss: 0.0039952704682946205 2023-01-24 06:46:32.177680: step: 996/530, loss: 0.006136264652013779 2023-01-24 06:46:33.201082: step: 1000/530, loss: 0.0034204628318548203 2023-01-24 06:46:34.240140: step: 1004/530, loss: 0.008623231202363968 2023-01-24 06:46:35.280485: step: 1008/530, loss: 0.0007546083070337772 2023-01-24 06:46:36.323711: step: 1012/530, loss: 0.009424910880625248 2023-01-24 06:46:37.364428: step: 1016/530, loss: 0.006336224731057882 2023-01-24 06:46:38.442140: step: 1020/530, loss: 0.01862392947077751 2023-01-24 06:46:39.488413: step: 1024/530, loss: 0.003281189827248454 2023-01-24 06:46:40.515253: step: 1028/530, loss: 0.002109914319589734 2023-01-24 06:46:41.554683: step: 1032/530, loss: 0.0030730459839105606 2023-01-24 06:46:42.618242: step: 1036/530, loss: 0.005453116726130247 2023-01-24 06:46:43.661310: step: 1040/530, loss: 0.0020153226796537638 2023-01-24 06:46:44.682352: step: 1044/530, loss: 0.0016653892816975713 2023-01-24 06:46:45.743712: step: 1048/530, loss: 0.00027228944236412644 2023-01-24 06:46:46.793633: step: 1052/530, loss: 0.0072599113918840885 2023-01-24 06:46:47.837051: step: 1056/530, loss: 0.0001541073725093156 2023-01-24 06:46:48.883019: step: 1060/530, loss: 0.001273548579774797 2023-01-24 06:46:49.930316: step: 1064/530, loss: 0.0017354830633848906 2023-01-24 06:46:50.972776: step: 1068/530, loss: 0.007379298098385334 2023-01-24 06:46:52.025287: step: 1072/530, loss: 0.007031646091490984 2023-01-24 06:46:53.087134: step: 1076/530, loss: 0.006455523893237114 2023-01-24 06:46:54.128618: step: 1080/530, loss: 0.01946997083723545 2023-01-24 06:46:55.209568: step: 1084/530, loss: 0.006793544627726078 2023-01-24 06:46:56.246517: step: 1088/530, loss: 0.0008276875596493483 2023-01-24 06:46:57.287914: step: 1092/530, loss: 0.0005426559946499765 2023-01-24 06:46:58.319796: step: 1096/530, loss: 0.010740218684077263 2023-01-24 06:46:59.369639: step: 1100/530, loss: 0.03218856453895569 2023-01-24 06:47:00.420278: step: 1104/530, loss: 0.006087642628699541 2023-01-24 06:47:01.466734: step: 1108/530, loss: 0.003980571404099464 2023-01-24 06:47:02.507194: step: 1112/530, loss: 0.00027696104370988905 2023-01-24 06:47:03.551917: step: 1116/530, loss: 0.0037075176369398832 2023-01-24 06:47:04.596171: step: 1120/530, loss: 0.012608006596565247 2023-01-24 06:47:05.656451: step: 1124/530, loss: 0.003824002342298627 2023-01-24 06:47:06.705081: step: 1128/530, loss: 0.001979410881176591 2023-01-24 06:47:07.756249: step: 1132/530, loss: 0.008721797727048397 2023-01-24 06:47:08.795711: step: 1136/530, loss: 0.004777163732796907 2023-01-24 06:47:09.841715: step: 1140/530, loss: 0.001700170454569161 2023-01-24 06:47:10.913487: step: 1144/530, loss: 0.0046541024930775166 2023-01-24 06:47:11.964828: step: 1148/530, loss: 0.10870716720819473 2023-01-24 06:47:12.997521: step: 1152/530, loss: 0.00021920898871030658 2023-01-24 06:47:14.033890: step: 1156/530, loss: 0.011056621558964252 2023-01-24 06:47:15.095010: step: 1160/530, loss: 0.011159135028719902 2023-01-24 06:47:16.120287: step: 1164/530, loss: 0.0024081047158688307 2023-01-24 06:47:17.156401: step: 1168/530, loss: 0.0057925088331103325 2023-01-24 06:47:18.214248: step: 1172/530, loss: 0.007608622312545776 2023-01-24 06:47:19.257014: step: 1176/530, loss: 1.2015492529826588e-06 2023-01-24 06:47:20.298030: step: 1180/530, loss: 0.020681289955973625 2023-01-24 06:47:21.358929: step: 1184/530, loss: 0.006975239608436823 2023-01-24 06:47:22.404374: step: 1188/530, loss: 0.0026035597547888756 2023-01-24 06:47:23.455237: step: 1192/530, loss: 0.007371784653514624 2023-01-24 06:47:24.499760: step: 1196/530, loss: 0.03399481251835823 2023-01-24 06:47:25.539956: step: 1200/530, loss: 0.011416000314056873 2023-01-24 06:47:26.579735: step: 1204/530, loss: 0.010691234841942787 2023-01-24 06:47:27.629821: step: 1208/530, loss: 0.0019936019089072943 2023-01-24 06:47:28.679204: step: 1212/530, loss: 0.001048463280312717 2023-01-24 06:47:29.739887: step: 1216/530, loss: 0.007577843498438597 2023-01-24 06:47:30.780322: step: 1220/530, loss: 0.004762694239616394 2023-01-24 06:47:31.825864: step: 1224/530, loss: 0.0044346340000629425 2023-01-24 06:47:32.861690: step: 1228/530, loss: 0.00024039229901973158 2023-01-24 06:47:33.923864: step: 1232/530, loss: 0.005222438368946314 2023-01-24 06:47:34.971020: step: 1236/530, loss: 0.0035616266541182995 2023-01-24 06:47:36.015644: step: 1240/530, loss: 0.004955634009093046 2023-01-24 06:47:37.056676: step: 1244/530, loss: 0.010248035192489624 2023-01-24 06:47:38.105118: step: 1248/530, loss: 0.00953050795942545 2023-01-24 06:47:39.162660: step: 1252/530, loss: 0.010992596857249737 2023-01-24 06:47:40.197505: step: 1256/530, loss: 0.005536581855267286 2023-01-24 06:47:41.256893: step: 1260/530, loss: 0.0011358698830008507 2023-01-24 06:47:42.299193: step: 1264/530, loss: 0.002192847430706024 2023-01-24 06:47:43.347655: step: 1268/530, loss: 0.006236623506993055 2023-01-24 06:47:44.398439: step: 1272/530, loss: 0.002121654571965337 2023-01-24 06:47:45.442179: step: 1276/530, loss: 0.00792581308633089 2023-01-24 06:47:46.491144: step: 1280/530, loss: 0.0014265021309256554 2023-01-24 06:47:47.532465: step: 1284/530, loss: 0.007405952550470829 2023-01-24 06:47:48.607159: step: 1288/530, loss: 0.0682988241314888 2023-01-24 06:47:49.656372: step: 1292/530, loss: 6.156717427074909e-05 2023-01-24 06:47:50.696781: step: 1296/530, loss: 0.002823916729539633 2023-01-24 06:47:51.749338: step: 1300/530, loss: 0.017848273739218712 2023-01-24 06:47:52.806339: step: 1304/530, loss: 0.0051645454950630665 2023-01-24 06:47:53.832901: step: 1308/530, loss: 0.0030845499131828547 2023-01-24 06:47:54.874201: step: 1312/530, loss: 0.004272168967872858 2023-01-24 06:47:55.938952: step: 1316/530, loss: 0.006515360437333584 2023-01-24 06:47:57.001481: step: 1320/530, loss: 0.007780950050801039 2023-01-24 06:47:58.061448: step: 1324/530, loss: 0.02745509147644043 2023-01-24 06:47:59.097365: step: 1328/530, loss: 0.009014702402055264 2023-01-24 06:48:00.143545: step: 1332/530, loss: 0.0016517748590558767 2023-01-24 06:48:01.192238: step: 1336/530, loss: 0.004722333047538996 2023-01-24 06:48:02.251895: step: 1340/530, loss: 0.011146903038024902 2023-01-24 06:48:03.299326: step: 1344/530, loss: 0.007080514915287495 2023-01-24 06:48:04.365123: step: 1348/530, loss: 0.004426012746989727 2023-01-24 06:48:05.425171: step: 1352/530, loss: 0.011999353766441345 2023-01-24 06:48:06.486352: step: 1356/530, loss: 0.006804373115301132 2023-01-24 06:48:07.533641: step: 1360/530, loss: 0.006184310186654329 2023-01-24 06:48:08.599560: step: 1364/530, loss: 0.00030462408903986216 2023-01-24 06:48:09.641175: step: 1368/530, loss: 0.004529778379946947 2023-01-24 06:48:10.702080: step: 1372/530, loss: 0.002193887485191226 2023-01-24 06:48:11.734022: step: 1376/530, loss: 0.004749293439090252 2023-01-24 06:48:12.776678: step: 1380/530, loss: 0.011622396297752857 2023-01-24 06:48:13.814503: step: 1384/530, loss: 0.00034916159347631037 2023-01-24 06:48:14.856363: step: 1388/530, loss: 0.006426604930311441 2023-01-24 06:48:15.902688: step: 1392/530, loss: 0.0006140635814517736 2023-01-24 06:48:16.959946: step: 1396/530, loss: 0.006234284956008196 2023-01-24 06:48:18.003056: step: 1400/530, loss: 0.0029865936376154423 2023-01-24 06:48:19.054748: step: 1404/530, loss: 0.01206700224429369 2023-01-24 06:48:20.091338: step: 1408/530, loss: 0.004013594705611467 2023-01-24 06:48:21.122602: step: 1412/530, loss: 0.0014471722533926368 2023-01-24 06:48:22.167330: step: 1416/530, loss: 0.005429612472653389 2023-01-24 06:48:23.209955: step: 1420/530, loss: 0.007490025833249092 2023-01-24 06:48:24.261320: step: 1424/530, loss: 0.012800934724509716 2023-01-24 06:48:25.300210: step: 1428/530, loss: 0.0016171160386875272 2023-01-24 06:48:26.391491: step: 1432/530, loss: 0.0018943685572594404 2023-01-24 06:48:27.443938: step: 1436/530, loss: 0.008185381069779396 2023-01-24 06:48:28.492989: step: 1440/530, loss: 0.001986532937735319 2023-01-24 06:48:29.543430: step: 1444/530, loss: 0.001074748346582055 2023-01-24 06:48:30.604122: step: 1448/530, loss: 0.011742767877876759 2023-01-24 06:48:31.666936: step: 1452/530, loss: 0.0008364357054233551 2023-01-24 06:48:32.706588: step: 1456/530, loss: 0.015845948830246925 2023-01-24 06:48:33.748621: step: 1460/530, loss: 0.0010480317287147045 2023-01-24 06:48:34.795329: step: 1464/530, loss: 0.043194811791181564 2023-01-24 06:48:35.829082: step: 1468/530, loss: 0.0013388304505497217 2023-01-24 06:48:36.887498: step: 1472/530, loss: 0.0005215198616497219 2023-01-24 06:48:37.935747: step: 1476/530, loss: 0.0014749027322977781 2023-01-24 06:48:38.985876: step: 1480/530, loss: 0.006819496396929026 2023-01-24 06:48:40.042153: step: 1484/530, loss: 0.003423040732741356 2023-01-24 06:48:41.095763: step: 1488/530, loss: 0.016143960878252983 2023-01-24 06:48:42.148174: step: 1492/530, loss: 0.008534249849617481 2023-01-24 06:48:43.220802: step: 1496/530, loss: 0.004776821006089449 2023-01-24 06:48:44.279093: step: 1500/530, loss: 0.009061519987881184 2023-01-24 06:48:45.313477: step: 1504/530, loss: 0.0018091071397066116 2023-01-24 06:48:46.358617: step: 1508/530, loss: 0.005445644725114107 2023-01-24 06:48:47.426115: step: 1512/530, loss: 0.001814851420931518 2023-01-24 06:48:48.477214: step: 1516/530, loss: 0.0014321933267638087 2023-01-24 06:48:49.528010: step: 1520/530, loss: 0.00572019862011075 2023-01-24 06:48:50.572683: step: 1524/530, loss: 0.012708782218396664 2023-01-24 06:48:51.621097: step: 1528/530, loss: 0.02738189697265625 2023-01-24 06:48:52.674531: step: 1532/530, loss: 0.003529068548232317 2023-01-24 06:48:53.723658: step: 1536/530, loss: 0.005960469599813223 2023-01-24 06:48:54.771547: step: 1540/530, loss: 0.046080682426691055 2023-01-24 06:48:55.828570: step: 1544/530, loss: 0.0028783243615180254 2023-01-24 06:48:56.878295: step: 1548/530, loss: 0.0029748750384896994 2023-01-24 06:48:57.932831: step: 1552/530, loss: 0.027270717546343803 2023-01-24 06:48:58.988798: step: 1556/530, loss: 0.01137593761086464 2023-01-24 06:49:00.043241: step: 1560/530, loss: 0.006451827008277178 2023-01-24 06:49:01.082396: step: 1564/530, loss: 0.0033235889859497547 2023-01-24 06:49:02.135572: step: 1568/530, loss: 0.008284997195005417 2023-01-24 06:49:03.167408: step: 1572/530, loss: 0.011531743220984936 2023-01-24 06:49:04.214946: step: 1576/530, loss: 0.021130923181772232 2023-01-24 06:49:05.252042: step: 1580/530, loss: 0.010799339041113853 2023-01-24 06:49:06.327148: step: 1584/530, loss: 0.003518350888043642 2023-01-24 06:49:07.386576: step: 1588/530, loss: 0.0009050051448866725 2023-01-24 06:49:08.418220: step: 1592/530, loss: 0.0030564155895262957 2023-01-24 06:49:09.447858: step: 1596/530, loss: 0.0033086545299738646 2023-01-24 06:49:10.497005: step: 1600/530, loss: 0.006984124891459942 2023-01-24 06:49:11.544908: step: 1604/530, loss: 0.005573161877691746 2023-01-24 06:49:12.578374: step: 1608/530, loss: 0.0024158877786248922 2023-01-24 06:49:13.624935: step: 1612/530, loss: 0.0025379215367138386 2023-01-24 06:49:14.670942: step: 1616/530, loss: 0.00045806291745975614 2023-01-24 06:49:15.717303: step: 1620/530, loss: 0.0020665458869189024 2023-01-24 06:49:16.756416: step: 1624/530, loss: 0.00010721674334490672 2023-01-24 06:49:17.810080: step: 1628/530, loss: 0.0020372758153826 2023-01-24 06:49:18.855589: step: 1632/530, loss: 0.0029343198984861374 2023-01-24 06:49:19.922806: step: 1636/530, loss: 0.02106183022260666 2023-01-24 06:49:20.985860: step: 1640/530, loss: 0.011678473092615604 2023-01-24 06:49:22.028881: step: 1644/530, loss: 4.8800025979289785e-05 2023-01-24 06:49:23.093924: step: 1648/530, loss: 0.0067364429123699665 2023-01-24 06:49:24.134056: step: 1652/530, loss: 0.02513057179749012 2023-01-24 06:49:25.167074: step: 1656/530, loss: 0.0007702919538132846 2023-01-24 06:49:26.207774: step: 1660/530, loss: 0.011085661128163338 2023-01-24 06:49:27.246019: step: 1664/530, loss: 0.018413681536912918 2023-01-24 06:49:28.288019: step: 1668/530, loss: 0.011836964637041092 2023-01-24 06:49:29.326338: step: 1672/530, loss: 0.02277711220085621 2023-01-24 06:49:30.376448: step: 1676/530, loss: 0.005979735404253006 2023-01-24 06:49:31.431911: step: 1680/530, loss: 0.007160399109125137 2023-01-24 06:49:32.497019: step: 1684/530, loss: 0.016264263540506363 2023-01-24 06:49:33.554973: step: 1688/530, loss: 0.03354169800877571 2023-01-24 06:49:34.602306: step: 1692/530, loss: 0.000819491920992732 2023-01-24 06:49:35.677688: step: 1696/530, loss: 0.0013716618996113539 2023-01-24 06:49:36.717594: step: 1700/530, loss: 0.0042462474666535854 2023-01-24 06:49:37.752293: step: 1704/530, loss: 0.0013388522202149034 2023-01-24 06:49:38.797878: step: 1708/530, loss: 0.01728525198996067 2023-01-24 06:49:39.854904: step: 1712/530, loss: 0.004231453873217106 2023-01-24 06:49:40.890379: step: 1716/530, loss: 0.007353954017162323 2023-01-24 06:49:41.949922: step: 1720/530, loss: 0.000880862062331289 2023-01-24 06:49:43.005325: step: 1724/530, loss: 0.004798652604222298 2023-01-24 06:49:44.047214: step: 1728/530, loss: 0.004262755159288645 2023-01-24 06:49:45.077015: step: 1732/530, loss: 0.004507008474320173 2023-01-24 06:49:46.123252: step: 1736/530, loss: 0.0017209872603416443 2023-01-24 06:49:47.161259: step: 1740/530, loss: 0.0009803662542253733 2023-01-24 06:49:48.196722: step: 1744/530, loss: 0.0034610687289386988 2023-01-24 06:49:49.235445: step: 1748/530, loss: 0.002741872565820813 2023-01-24 06:49:50.271096: step: 1752/530, loss: 0.00200418708845973 2023-01-24 06:49:51.309649: step: 1756/530, loss: 0.0001717911654850468 2023-01-24 06:49:52.344671: step: 1760/530, loss: 0.006707558874040842 2023-01-24 06:49:53.380871: step: 1764/530, loss: 0.009112262167036533 2023-01-24 06:49:54.420902: step: 1768/530, loss: 0.0028560529462993145 2023-01-24 06:49:55.466762: step: 1772/530, loss: 0.000468336307676509 2023-01-24 06:49:56.517109: step: 1776/530, loss: 0.003938440699130297 2023-01-24 06:49:57.543578: step: 1780/530, loss: 0.022959338501095772 2023-01-24 06:49:58.574044: step: 1784/530, loss: 0.003944477066397667 2023-01-24 06:49:59.614725: step: 1788/530, loss: 0.00030886937747709453 2023-01-24 06:50:00.656843: step: 1792/530, loss: 0.004274178296327591 2023-01-24 06:50:01.695048: step: 1796/530, loss: 0.006106200162321329 2023-01-24 06:50:02.729990: step: 1800/530, loss: 0.0010420207399874926 2023-01-24 06:50:03.795603: step: 1804/530, loss: 0.001296434667892754 2023-01-24 06:50:04.831674: step: 1808/530, loss: 0.0028293104842305183 2023-01-24 06:50:05.896097: step: 1812/530, loss: 0.0039056281093508005 2023-01-24 06:50:06.923841: step: 1816/530, loss: 0.007308308966457844 2023-01-24 06:50:07.968035: step: 1820/530, loss: 0.0011681515024974942 2023-01-24 06:50:09.003337: step: 1824/530, loss: 0.016207758337259293 2023-01-24 06:50:10.051006: step: 1828/530, loss: 0.009423826821148396 2023-01-24 06:50:11.100460: step: 1832/530, loss: 0.006282747723162174 2023-01-24 06:50:12.154243: step: 1836/530, loss: 0.012160269543528557 2023-01-24 06:50:13.210286: step: 1840/530, loss: 0.008822774514555931 2023-01-24 06:50:14.260630: step: 1844/530, loss: 0.02734699286520481 2023-01-24 06:50:15.291940: step: 1848/530, loss: 0.0004367501533124596 2023-01-24 06:50:16.358804: step: 1852/530, loss: 0.04016534239053726 2023-01-24 06:50:17.399194: step: 1856/530, loss: 0.01248511765152216 2023-01-24 06:50:18.440667: step: 1860/530, loss: 8.790144784143195e-05 2023-01-24 06:50:19.485049: step: 1864/530, loss: 0.007806339301168919 2023-01-24 06:50:20.528455: step: 1868/530, loss: 0.0162203311920166 2023-01-24 06:50:21.576701: step: 1872/530, loss: 0.004363378044217825 2023-01-24 06:50:22.632334: step: 1876/530, loss: 0.007265110034495592 2023-01-24 06:50:23.677147: step: 1880/530, loss: 0.00010416420991532505 2023-01-24 06:50:24.723037: step: 1884/530, loss: 0.02013254165649414 2023-01-24 06:50:25.776205: step: 1888/530, loss: 0.006840502377599478 2023-01-24 06:50:26.824856: step: 1892/530, loss: 0.008903981186449528 2023-01-24 06:50:27.866140: step: 1896/530, loss: 0.0036086742766201496 2023-01-24 06:50:28.920896: step: 1900/530, loss: 0.0035077142529189587 2023-01-24 06:50:29.970645: step: 1904/530, loss: 0.02203163132071495 2023-01-24 06:50:31.019085: step: 1908/530, loss: 0.0036880257539451122 2023-01-24 06:50:32.062151: step: 1912/530, loss: 0.0011350263375788927 2023-01-24 06:50:33.134162: step: 1916/530, loss: 0.042768143117427826 2023-01-24 06:50:34.185172: step: 1920/530, loss: 0.007512848824262619 2023-01-24 06:50:35.217165: step: 1924/530, loss: 0.0049897609278559685 2023-01-24 06:50:36.251580: step: 1928/530, loss: 0.006997285410761833 2023-01-24 06:50:37.292140: step: 1932/530, loss: 0.004432953894138336 2023-01-24 06:50:38.353050: step: 1936/530, loss: 0.002418037038296461 2023-01-24 06:50:39.393641: step: 1940/530, loss: 0.009223580360412598 2023-01-24 06:50:40.441840: step: 1944/530, loss: 0.000389400142012164 2023-01-24 06:50:41.479390: step: 1948/530, loss: 0.0002923975698649883 2023-01-24 06:50:42.534339: step: 1952/530, loss: 0.0007302080048248172 2023-01-24 06:50:43.564809: step: 1956/530, loss: 0.0123849306255579 2023-01-24 06:50:44.600662: step: 1960/530, loss: 0.00035092595499008894 2023-01-24 06:50:45.646662: step: 1964/530, loss: 0.01818850077688694 2023-01-24 06:50:46.706661: step: 1968/530, loss: 9.57259635470109e-06 2023-01-24 06:50:47.734238: step: 1972/530, loss: 0.029654745012521744 2023-01-24 06:50:48.766556: step: 1976/530, loss: 0.011064673773944378 2023-01-24 06:50:49.820939: step: 1980/530, loss: 0.0064434814266860485 2023-01-24 06:50:50.884848: step: 1984/530, loss: 0.00473420275375247 2023-01-24 06:50:51.930251: step: 1988/530, loss: 0.031124234199523926 2023-01-24 06:50:52.988995: step: 1992/530, loss: 0.00546392984688282 2023-01-24 06:50:54.036161: step: 1996/530, loss: 0.00029834589804522693 2023-01-24 06:50:55.063112: step: 2000/530, loss: 0.0008198019349947572 2023-01-24 06:50:56.112033: step: 2004/530, loss: 0.0074112857691943645 2023-01-24 06:50:57.155980: step: 2008/530, loss: 0.03172183036804199 2023-01-24 06:50:58.217693: step: 2012/530, loss: 0.00966847687959671 2023-01-24 06:50:59.262304: step: 2016/530, loss: 0.005522883962839842 2023-01-24 06:51:00.308396: step: 2020/530, loss: 0.010048533789813519 2023-01-24 06:51:01.353925: step: 2024/530, loss: 0.01874934323132038 2023-01-24 06:51:02.411676: step: 2028/530, loss: 0.021582117304205894 2023-01-24 06:51:03.469446: step: 2032/530, loss: 0.00030745184631086886 2023-01-24 06:51:04.517119: step: 2036/530, loss: 0.005826187320053577 2023-01-24 06:51:05.565706: step: 2040/530, loss: 0.00044487352715805173 2023-01-24 06:51:06.607441: step: 2044/530, loss: 0.004671136848628521 2023-01-24 06:51:07.674324: step: 2048/530, loss: 0.022065000608563423 2023-01-24 06:51:08.708209: step: 2052/530, loss: 0.0071199387311935425 2023-01-24 06:51:09.740664: step: 2056/530, loss: 0.005276544950902462 2023-01-24 06:51:10.773459: step: 2060/530, loss: 0.006164137274026871 2023-01-24 06:51:11.832502: step: 2064/530, loss: 0.0046063382178545 2023-01-24 06:51:12.870470: step: 2068/530, loss: 0.004582513589411974 2023-01-24 06:51:13.901656: step: 2072/530, loss: 5.838310607941821e-05 2023-01-24 06:51:14.953878: step: 2076/530, loss: 0.013666230253875256 2023-01-24 06:51:15.998752: step: 2080/530, loss: 0.004349856171756983 2023-01-24 06:51:17.051351: step: 2084/530, loss: 0.002444185083732009 2023-01-24 06:51:18.077902: step: 2088/530, loss: 0.00016139236686285585 2023-01-24 06:51:19.129088: step: 2092/530, loss: 0.0032693196553736925 2023-01-24 06:51:20.183108: step: 2096/530, loss: 0.0036651529371738434 2023-01-24 06:51:21.228113: step: 2100/530, loss: 0.013309440575540066 2023-01-24 06:51:22.272607: step: 2104/530, loss: 0.026972614228725433 2023-01-24 06:51:23.326642: step: 2108/530, loss: 0.0032702982425689697 2023-01-24 06:51:24.377115: step: 2112/530, loss: 0.010360381565988064 2023-01-24 06:51:25.422395: step: 2116/530, loss: 0.00747764203697443 2023-01-24 06:51:26.461535: step: 2120/530, loss: 0.003745673457160592 ================================================== Loss: 0.007 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.373875, 'r': 0.3192481024667932, 'f1': 0.34440890481064484}, 'combined': 0.2537749824920541, 'stategy': 1, 'epoch': 9} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37466326926317167, 'r': 0.3898150926524911, 'f1': 0.38208902775307235}, 'combined': 0.2961647009377882, 'stategy': 1, 'epoch': 9} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3820300126702566, 'r': 0.3269365004066143, 'f1': 0.3523426088226702}, 'combined': 0.2596208696588096, 'stategy': 1, 'epoch': 9} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37245743734225994, 'r': 0.3686917831044246, 'f1': 0.3705650438961792}, 'combined': 0.28723223498172745, 'stategy': 1, 'epoch': 9} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3813119159992372, 'r': 0.33283393047371745, 'f1': 0.3554275204856111}, 'combined': 0.26189396246308183, 'stategy': 1, 'epoch': 9} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.35810637630247955, 'r': 0.35909380197243124, 'f1': 0.3585994094043186}, 'combined': 0.2779574369545436, 'stategy': 1, 'epoch': 9} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 9} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.475, 'r': 0.41304347826086957, 'f1': 0.44186046511627913}, 'combined': 0.22093023255813957, 'stategy': 1, 'epoch': 9} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 9} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37704166666666666, 'r': 0.32195208728652747, 'f1': 0.3473259979529171}, 'combined': 0.25592441954425466, 'stategy': 1, 'epoch': 6} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37621134584593835, 'r': 0.3907342102995499, 'f1': 0.3833352757492428}, 'combined': 0.29713069220754706, 'stategy': 1, 'epoch': 6} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 6} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38720415311180817, 'r': 0.33283393047371745, 'f1': 0.35796628848907985}, 'combined': 0.26376463362353253, 'stategy': 1, 'epoch': 8} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36421427197230394, 'r': 0.3625404931489018, 'f1': 0.3633754551322019}, 'combined': 0.28165944369098905, 'stategy': 1, 'epoch': 8} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 8} ****************************** Epoch: 10 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 06:53:51.466425: step: 4/530, loss: 0.0007372562540695071 2023-01-24 06:53:52.508380: step: 8/530, loss: 0.0023943197447806597 2023-01-24 06:53:53.543949: step: 12/530, loss: 0.00902405846863985 2023-01-24 06:53:54.579323: step: 16/530, loss: 0.0017045838758349419 2023-01-24 06:53:55.613239: step: 20/530, loss: 0.001977020176127553 2023-01-24 06:53:56.668415: step: 24/530, loss: 0.008408475667238235 2023-01-24 06:53:57.716426: step: 28/530, loss: 0.0114920474588871 2023-01-24 06:53:58.758488: step: 32/530, loss: 0.011747323907911777 2023-01-24 06:53:59.797777: step: 36/530, loss: 0.004281261470168829 2023-01-24 06:54:00.849521: step: 40/530, loss: 0.0032921512611210346 2023-01-24 06:54:01.897531: step: 44/530, loss: 0.008866902440786362 2023-01-24 06:54:02.944777: step: 48/530, loss: 0.018904125317931175 2023-01-24 06:54:03.979671: step: 52/530, loss: 0.0033392130862921476 2023-01-24 06:54:05.030987: step: 56/530, loss: 0.005421266425400972 2023-01-24 06:54:06.072724: step: 60/530, loss: 0.009067226201295853 2023-01-24 06:54:07.121499: step: 64/530, loss: 0.0065969983115792274 2023-01-24 06:54:08.169642: step: 68/530, loss: 0.008009317331016064 2023-01-24 06:54:09.228699: step: 72/530, loss: 0.013463177718222141 2023-01-24 06:54:10.266878: step: 76/530, loss: 0.0029160326812416315 2023-01-24 06:54:11.293100: step: 80/530, loss: 0.004672999959439039 2023-01-24 06:54:12.357757: step: 84/530, loss: 0.01176483929157257 2023-01-24 06:54:13.391762: step: 88/530, loss: 0.007886665873229504 2023-01-24 06:54:14.446996: step: 92/530, loss: 0.00021173500863369554 2023-01-24 06:54:15.486127: step: 96/530, loss: 0.019204547628760338 2023-01-24 06:54:16.524388: step: 100/530, loss: 0.003048920538276434 2023-01-24 06:54:17.574176: step: 104/530, loss: 0.0022282360587269068 2023-01-24 06:54:18.626538: step: 108/530, loss: 0.004905399866402149 2023-01-24 06:54:19.665248: step: 112/530, loss: 0.005961662624031305 2023-01-24 06:54:20.720768: step: 116/530, loss: 0.007057271432131529 2023-01-24 06:54:21.763875: step: 120/530, loss: 0.002001353772357106 2023-01-24 06:54:22.819061: step: 124/530, loss: 0.0018433105433359742 2023-01-24 06:54:23.845141: step: 128/530, loss: 0.011630582623183727 2023-01-24 06:54:24.875108: step: 132/530, loss: 0.0029869202990084887 2023-01-24 06:54:25.914500: step: 136/530, loss: 0.0011986852623522282 2023-01-24 06:54:26.953127: step: 140/530, loss: 0.002449146704748273 2023-01-24 06:54:27.988607: step: 144/530, loss: 0.020743252709507942 2023-01-24 06:54:29.018485: step: 148/530, loss: 0.0008950207848101854 2023-01-24 06:54:30.096351: step: 152/530, loss: 0.0034274004865437746 2023-01-24 06:54:31.125043: step: 156/530, loss: 0.0014131536008790135 2023-01-24 06:54:32.165090: step: 160/530, loss: 0.0008916228543967009 2023-01-24 06:54:33.215783: step: 164/530, loss: 2.6459583750693128e-05 2023-01-24 06:54:34.263043: step: 168/530, loss: 0.00015481121954508126 2023-01-24 06:54:35.313884: step: 172/530, loss: 0.004595068283379078 2023-01-24 06:54:36.363104: step: 176/530, loss: 0.00030887030879966915 2023-01-24 06:54:37.399367: step: 180/530, loss: 0.008959001861512661 2023-01-24 06:54:38.449896: step: 184/530, loss: 0.002212352119386196 2023-01-24 06:54:39.483957: step: 188/530, loss: 0.010870103724300861 2023-01-24 06:54:40.526303: step: 192/530, loss: 0.0008116374956443906 2023-01-24 06:54:41.573536: step: 196/530, loss: 0.004199315793812275 2023-01-24 06:54:42.624600: step: 200/530, loss: 0.0035693382378667593 2023-01-24 06:54:43.680332: step: 204/530, loss: 0.004782579839229584 2023-01-24 06:54:44.730423: step: 208/530, loss: 0.00366653292439878 2023-01-24 06:54:45.779624: step: 212/530, loss: 0.00039043338620103896 2023-01-24 06:54:46.828116: step: 216/530, loss: 0.00421998230740428 2023-01-24 06:54:47.873313: step: 220/530, loss: 0.0039749848656356335 2023-01-24 06:54:48.949143: step: 224/530, loss: 0.0033849908504635096 2023-01-24 06:54:50.003953: step: 228/530, loss: 0.0027289630379527807 2023-01-24 06:54:51.057161: step: 232/530, loss: 0.00621890788897872 2023-01-24 06:54:52.095872: step: 236/530, loss: 0.010404416359961033 2023-01-24 06:54:53.134058: step: 240/530, loss: 0.003086398122832179 2023-01-24 06:54:54.185988: step: 244/530, loss: 0.007119441404938698 2023-01-24 06:54:55.223356: step: 248/530, loss: 0.0016671937191858888 2023-01-24 06:54:56.267812: step: 252/530, loss: 0.00987583864480257 2023-01-24 06:54:57.310630: step: 256/530, loss: 4.836375592276454e-05 2023-01-24 06:54:58.352386: step: 260/530, loss: 0.0005254087154753506 2023-01-24 06:54:59.406369: step: 264/530, loss: 0.01092437468469143 2023-01-24 06:55:00.450782: step: 268/530, loss: 0.0032315377611666918 2023-01-24 06:55:01.507716: step: 272/530, loss: 0.016228090971708298 2023-01-24 06:55:02.530264: step: 276/530, loss: 0.0008727370295673609 2023-01-24 06:55:03.580454: step: 280/530, loss: 0.005138714332133532 2023-01-24 06:55:04.613067: step: 284/530, loss: 0.006291618105024099 2023-01-24 06:55:05.674963: step: 288/530, loss: 0.0036444435827434063 2023-01-24 06:55:06.733392: step: 292/530, loss: 0.0034987344406545162 2023-01-24 06:55:07.800746: step: 296/530, loss: 0.001284444355405867 2023-01-24 06:55:08.858120: step: 300/530, loss: 0.0034343083389103413 2023-01-24 06:55:09.913649: step: 304/530, loss: 0.0031063039787113667 2023-01-24 06:55:10.963979: step: 308/530, loss: 0.0008699197787791491 2023-01-24 06:55:12.014036: step: 312/530, loss: 0.0006428711931221187 2023-01-24 06:55:13.064857: step: 316/530, loss: 0.008117156103253365 2023-01-24 06:55:14.105931: step: 320/530, loss: 0.005441263318061829 2023-01-24 06:55:15.176991: step: 324/530, loss: 0.005114181432873011 2023-01-24 06:55:16.262584: step: 328/530, loss: 0.003404296236112714 2023-01-24 06:55:17.314383: step: 332/530, loss: 0.005627663806080818 2023-01-24 06:55:18.374240: step: 336/530, loss: 0.011175437830388546 2023-01-24 06:55:19.446497: step: 340/530, loss: 0.0010454534785822034 2023-01-24 06:55:20.502244: step: 344/530, loss: 0.004417550750076771 2023-01-24 06:55:21.544599: step: 348/530, loss: 5.890388274565339e-05 2023-01-24 06:55:22.586297: step: 352/530, loss: 0.009437691420316696 2023-01-24 06:55:23.624920: step: 356/530, loss: 0.0017233914695680141 2023-01-24 06:55:24.672925: step: 360/530, loss: 0.0013881383929401636 2023-01-24 06:55:25.706726: step: 364/530, loss: 0.0013716183602809906 2023-01-24 06:55:26.751228: step: 368/530, loss: 0.004239580128341913 2023-01-24 06:55:27.812764: step: 372/530, loss: 0.0029596728272736073 2023-01-24 06:55:28.892743: step: 376/530, loss: 0.002328514354303479 2023-01-24 06:55:29.941889: step: 380/530, loss: 0.005114738829433918 2023-01-24 06:55:30.991316: step: 384/530, loss: 0.016595415771007538 2023-01-24 06:55:32.044529: step: 388/530, loss: 0.006054204888641834 2023-01-24 06:55:33.093082: step: 392/530, loss: 0.00011971151980105788 2023-01-24 06:55:34.132221: step: 396/530, loss: 0.003062792122364044 2023-01-24 06:55:35.193463: step: 400/530, loss: 0.004000066313892603 2023-01-24 06:55:36.246452: step: 404/530, loss: 0.0009041042649187148 2023-01-24 06:55:37.302177: step: 408/530, loss: 0.004386028740555048 2023-01-24 06:55:38.346617: step: 412/530, loss: 0.004916968289762735 2023-01-24 06:55:39.400992: step: 416/530, loss: 0.011079824529588223 2023-01-24 06:55:40.462535: step: 420/530, loss: 0.004672501236200333 2023-01-24 06:55:41.519250: step: 424/530, loss: 0.0028045445214957 2023-01-24 06:55:42.565772: step: 428/530, loss: 0.0009784386493265629 2023-01-24 06:55:43.614403: step: 432/530, loss: 0.0013245128793641925 2023-01-24 06:55:44.644843: step: 436/530, loss: 0.0038161959964782 2023-01-24 06:55:45.699064: step: 440/530, loss: 0.00876330491155386 2023-01-24 06:55:46.743221: step: 444/530, loss: 0.0029141767881810665 2023-01-24 06:55:47.794821: step: 448/530, loss: 0.00021813716739416122 2023-01-24 06:55:48.852339: step: 452/530, loss: 0.0003300993994344026 2023-01-24 06:55:49.908275: step: 456/530, loss: 0.0012417059624567628 2023-01-24 06:55:50.958678: step: 460/530, loss: 0.00444937776774168 2023-01-24 06:55:51.997640: step: 464/530, loss: 0.001703589572571218 2023-01-24 06:55:53.052646: step: 468/530, loss: 0.02460644207894802 2023-01-24 06:55:54.093081: step: 472/530, loss: 0.005276022478938103 2023-01-24 06:55:55.136072: step: 476/530, loss: 0.00010200202814303339 2023-01-24 06:55:56.194559: step: 480/530, loss: 0.0036124333273619413 2023-01-24 06:55:57.240029: step: 484/530, loss: 0.003638251917436719 2023-01-24 06:55:58.292795: step: 488/530, loss: 0.003780804108828306 2023-01-24 06:55:59.333369: step: 492/530, loss: 0.0005541572463698685 2023-01-24 06:56:00.378231: step: 496/530, loss: 0.0037358610425144434 2023-01-24 06:56:01.426089: step: 500/530, loss: 0.0033541028387844563 2023-01-24 06:56:02.472112: step: 504/530, loss: 9.332134504802525e-05 2023-01-24 06:56:03.518704: step: 508/530, loss: 0.0 2023-01-24 06:56:04.560044: step: 512/530, loss: 0.0035010657738894224 2023-01-24 06:56:05.622779: step: 516/530, loss: 0.0036441602278500795 2023-01-24 06:56:06.682298: step: 520/530, loss: 0.002572100842371583 2023-01-24 06:56:07.755469: step: 524/530, loss: 0.00015868218906689435 2023-01-24 06:56:08.830431: step: 528/530, loss: 0.00010934688179986551 2023-01-24 06:56:09.873534: step: 532/530, loss: 0.008732899092137814 2023-01-24 06:56:10.927951: step: 536/530, loss: 0.005267515778541565 2023-01-24 06:56:11.986867: step: 540/530, loss: 0.0009832335636019707 2023-01-24 06:56:13.038457: step: 544/530, loss: 0.005033475812524557 2023-01-24 06:56:14.074953: step: 548/530, loss: 0.0020362003706395626 2023-01-24 06:56:15.137489: step: 552/530, loss: 0.002050328068435192 2023-01-24 06:56:16.192643: step: 556/530, loss: 0.008932351134717464 2023-01-24 06:56:17.242210: step: 560/530, loss: 0.00048724692896939814 2023-01-24 06:56:18.280978: step: 564/530, loss: 0.00021071318769827485 2023-01-24 06:56:19.326535: step: 568/530, loss: 0.0001415097212884575 2023-01-24 06:56:20.371859: step: 572/530, loss: 0.009318580850958824 2023-01-24 06:56:21.422860: step: 576/530, loss: 0.004937023855745792 2023-01-24 06:56:22.470169: step: 580/530, loss: 0.036102116107940674 2023-01-24 06:56:23.526000: step: 584/530, loss: 0.0007588112493976951 2023-01-24 06:56:24.560621: step: 588/530, loss: 0.009392837062478065 2023-01-24 06:56:25.611986: step: 592/530, loss: 0.02177371084690094 2023-01-24 06:56:26.658313: step: 596/530, loss: 0.006736889481544495 2023-01-24 06:56:27.704276: step: 600/530, loss: 0.004126775544136763 2023-01-24 06:56:28.767533: step: 604/530, loss: 0.006093895528465509 2023-01-24 06:56:29.817925: step: 608/530, loss: 0.01033114455640316 2023-01-24 06:56:30.855231: step: 612/530, loss: 0.0054052588529884815 2023-01-24 06:56:31.896328: step: 616/530, loss: 0.018098486587405205 2023-01-24 06:56:32.950758: step: 620/530, loss: 0.01095607690513134 2023-01-24 06:56:34.006512: step: 624/530, loss: 0.004884735681116581 2023-01-24 06:56:35.050210: step: 628/530, loss: 0.003965138923376799 2023-01-24 06:56:36.101502: step: 632/530, loss: 0.002264399314299226 2023-01-24 06:56:37.147052: step: 636/530, loss: 0.00013817149738315493 2023-01-24 06:56:38.197430: step: 640/530, loss: 0.00026588892797008157 2023-01-24 06:56:39.243271: step: 644/530, loss: 0.001550157438032329 2023-01-24 06:56:40.310381: step: 648/530, loss: 0.008443762548267841 2023-01-24 06:56:41.363515: step: 652/530, loss: 0.005830992478877306 2023-01-24 06:56:42.399456: step: 656/530, loss: 0.0004329170915298164 2023-01-24 06:56:43.444953: step: 660/530, loss: 0.02213708870112896 2023-01-24 06:56:44.536312: step: 664/530, loss: 0.005303644575178623 2023-01-24 06:56:45.592855: step: 668/530, loss: 0.0039398204535245895 2023-01-24 06:56:46.633145: step: 672/530, loss: 0.005339667666703463 2023-01-24 06:56:47.709375: step: 676/530, loss: 0.005549273919314146 2023-01-24 06:56:48.754850: step: 680/530, loss: 0.014439555816352367 2023-01-24 06:56:49.788079: step: 684/530, loss: 0.0005124564049765468 2023-01-24 06:56:50.844211: step: 688/530, loss: 0.0043865228071808815 2023-01-24 06:56:51.894147: step: 692/530, loss: 0.0019238080130890012 2023-01-24 06:56:52.954930: step: 696/530, loss: 5.780091214546701e-06 2023-01-24 06:56:53.985561: step: 700/530, loss: 0.004060221835970879 2023-01-24 06:56:55.023659: step: 704/530, loss: 0.0030003520660102367 2023-01-24 06:56:56.061757: step: 708/530, loss: 0.004450484178960323 2023-01-24 06:56:57.106432: step: 712/530, loss: 0.002015204168856144 2023-01-24 06:56:58.181893: step: 716/530, loss: 0.007801043801009655 2023-01-24 06:56:59.222457: step: 720/530, loss: 0.002182956086471677 2023-01-24 06:57:00.261481: step: 724/530, loss: 1.6539946955163032e-05 2023-01-24 06:57:01.304321: step: 728/530, loss: 0.002252360340207815 2023-01-24 06:57:02.355948: step: 732/530, loss: 0.0020012168679386377 2023-01-24 06:57:03.408919: step: 736/530, loss: 0.00020705978386104107 2023-01-24 06:57:04.463897: step: 740/530, loss: 0.0033514276146888733 2023-01-24 06:57:05.513776: step: 744/530, loss: 0.006716678384691477 2023-01-24 06:57:06.555786: step: 748/530, loss: 0.00016646439325995743 2023-01-24 06:57:07.611854: step: 752/530, loss: 0.042862117290496826 2023-01-24 06:57:08.653944: step: 756/530, loss: 0.005601138342171907 2023-01-24 06:57:09.693965: step: 760/530, loss: 0.005318896844983101 2023-01-24 06:57:10.730170: step: 764/530, loss: 0.0002570927026681602 2023-01-24 06:57:11.797668: step: 768/530, loss: 0.00429547531530261 2023-01-24 06:57:12.836982: step: 772/530, loss: 0.01953442580997944 2023-01-24 06:57:13.880378: step: 776/530, loss: 0.005533652845770121 2023-01-24 06:57:14.911844: step: 780/530, loss: 0.003615013090893626 2023-01-24 06:57:15.974643: step: 784/530, loss: 0.0027866351883858442 2023-01-24 06:57:17.023465: step: 788/530, loss: 0.003989127930253744 2023-01-24 06:57:18.069109: step: 792/530, loss: 0.009449250064790249 2023-01-24 06:57:19.124435: step: 796/530, loss: 0.007280644029378891 2023-01-24 06:57:20.182275: step: 800/530, loss: 0.010848934762179852 2023-01-24 06:57:21.230251: step: 804/530, loss: 0.005052474793046713 2023-01-24 06:57:22.272746: step: 808/530, loss: 0.0037409246433526278 2023-01-24 06:57:23.324214: step: 812/530, loss: 0.005573755595833063 2023-01-24 06:57:24.372013: step: 816/530, loss: 0.0037045818753540516 2023-01-24 06:57:25.400305: step: 820/530, loss: 0.000529707467649132 2023-01-24 06:57:26.442660: step: 824/530, loss: 0.01829605922102928 2023-01-24 06:57:27.490538: step: 828/530, loss: 0.0022317995317280293 2023-01-24 06:57:28.521400: step: 832/530, loss: 0.00036393056507222354 2023-01-24 06:57:29.552884: step: 836/530, loss: 0.0003764189314097166 2023-01-24 06:57:30.583460: step: 840/530, loss: 0.004179711919277906 2023-01-24 06:57:31.644729: step: 844/530, loss: 0.0017930822214111686 2023-01-24 06:57:32.691900: step: 848/530, loss: 0.0009661811636760831 2023-01-24 06:57:33.764806: step: 852/530, loss: 0.019975047558546066 2023-01-24 06:57:34.803353: step: 856/530, loss: 0.0006106731598265469 2023-01-24 06:57:35.850244: step: 860/530, loss: 0.01782960072159767 2023-01-24 06:57:36.896447: step: 864/530, loss: 0.0004105751577299088 2023-01-24 06:57:37.934478: step: 868/530, loss: 0.005054058041423559 2023-01-24 06:57:38.978566: step: 872/530, loss: 0.007396685890853405 2023-01-24 06:57:40.029602: step: 876/530, loss: 0.001772705465555191 2023-01-24 06:57:41.060668: step: 880/530, loss: 0.000585298053920269 2023-01-24 06:57:42.095827: step: 884/530, loss: 0.0138911884278059 2023-01-24 06:57:43.166699: step: 888/530, loss: 0.014687693677842617 2023-01-24 06:57:44.206643: step: 892/530, loss: 0.01384313777089119 2023-01-24 06:57:45.245597: step: 896/530, loss: 0.001359553774818778 2023-01-24 06:57:46.289887: step: 900/530, loss: 0.005595955066382885 2023-01-24 06:57:47.332033: step: 904/530, loss: 0.012071708217263222 2023-01-24 06:57:48.392915: step: 908/530, loss: 0.004334148485213518 2023-01-24 06:57:49.451334: step: 912/530, loss: 0.001883754157461226 2023-01-24 06:57:50.498297: step: 916/530, loss: 0.008667264133691788 2023-01-24 06:57:51.551580: step: 920/530, loss: 0.03686615452170372 2023-01-24 06:57:52.605054: step: 924/530, loss: 0.0029824068769812584 2023-01-24 06:57:53.646636: step: 928/530, loss: 0.003981342539191246 2023-01-24 06:57:54.715963: step: 932/530, loss: 0.027510561048984528 2023-01-24 06:57:55.783676: step: 936/530, loss: 0.022754797711968422 2023-01-24 06:57:56.844643: step: 940/530, loss: 0.003511945018544793 2023-01-24 06:57:57.906268: step: 944/530, loss: 0.0035397843457758427 2023-01-24 06:57:58.937603: step: 948/530, loss: 0.004075996577739716 2023-01-24 06:57:59.984167: step: 952/530, loss: 0.0020581826101988554 2023-01-24 06:58:01.046877: step: 956/530, loss: 0.00868846196681261 2023-01-24 06:58:02.092611: step: 960/530, loss: 0.003406491596251726 2023-01-24 06:58:03.159387: step: 964/530, loss: 0.005959927104413509 2023-01-24 06:58:04.208940: step: 968/530, loss: 0.006768408697098494 2023-01-24 06:58:05.255916: step: 972/530, loss: 0.00593695929273963 2023-01-24 06:58:06.312300: step: 976/530, loss: 0.010021916590631008 2023-01-24 06:58:07.346509: step: 980/530, loss: 0.00379653531126678 2023-01-24 06:58:08.390006: step: 984/530, loss: 0.0011425334960222244 2023-01-24 06:58:09.433234: step: 988/530, loss: 0.046871911734342575 2023-01-24 06:58:10.483543: step: 992/530, loss: 0.02045295387506485 2023-01-24 06:58:11.529500: step: 996/530, loss: 0.0010991408489644527 2023-01-24 06:58:12.574216: step: 1000/530, loss: 0.008956157602369785 2023-01-24 06:58:13.615478: step: 1004/530, loss: 0.0007103080279193819 2023-01-24 06:58:14.645062: step: 1008/530, loss: 0.003950471989810467 2023-01-24 06:58:15.688676: step: 1012/530, loss: 0.005394541192799807 2023-01-24 06:58:16.719110: step: 1016/530, loss: 0.006424236577004194 2023-01-24 06:58:17.763526: step: 1020/530, loss: 0.005007125437259674 2023-01-24 06:58:18.822084: step: 1024/530, loss: 0.009094523265957832 2023-01-24 06:58:19.866767: step: 1028/530, loss: 0.014116130769252777 2023-01-24 06:58:20.905648: step: 1032/530, loss: 9.635881724534556e-06 2023-01-24 06:58:21.950104: step: 1036/530, loss: 0.0007864705985412002 2023-01-24 06:58:23.007171: step: 1040/530, loss: 0.0021402963902801275 2023-01-24 06:58:24.057453: step: 1044/530, loss: 0.009299227967858315 2023-01-24 06:58:25.088191: step: 1048/530, loss: 0.00010648762690834701 2023-01-24 06:58:26.138335: step: 1052/530, loss: 0.0003820595738943666 2023-01-24 06:58:27.177753: step: 1056/530, loss: 0.013246774673461914 2023-01-24 06:58:28.216115: step: 1060/530, loss: 0.009429216384887695 2023-01-24 06:58:29.254587: step: 1064/530, loss: 1.1052250101784011e-06 2023-01-24 06:58:30.311367: step: 1068/530, loss: 0.010297033004462719 2023-01-24 06:58:31.354603: step: 1072/530, loss: 0.0019000115571543574 2023-01-24 06:58:32.404720: step: 1076/530, loss: 0.008428475819528103 2023-01-24 06:58:33.474928: step: 1080/530, loss: 0.002425176789984107 2023-01-24 06:58:34.520490: step: 1084/530, loss: 0.00487297959625721 2023-01-24 06:58:35.546430: step: 1088/530, loss: 0.00514750462025404 2023-01-24 06:58:36.582384: step: 1092/530, loss: 0.012974259443581104 2023-01-24 06:58:37.624332: step: 1096/530, loss: 0.0005095039959996939 2023-01-24 06:58:38.682459: step: 1100/530, loss: 0.011658834293484688 2023-01-24 06:58:39.728580: step: 1104/530, loss: 0.002302357694134116 2023-01-24 06:58:40.786521: step: 1108/530, loss: 0.0030269830022007227 2023-01-24 06:58:41.838932: step: 1112/530, loss: 0.01093481294810772 2023-01-24 06:58:42.883257: step: 1116/530, loss: 0.0019961956422775984 2023-01-24 06:58:43.939496: step: 1120/530, loss: 0.019439103081822395 2023-01-24 06:58:44.988043: step: 1124/530, loss: 0.01040840707719326 2023-01-24 06:58:46.049636: step: 1128/530, loss: 0.008950133807957172 2023-01-24 06:58:47.082768: step: 1132/530, loss: 0.002671079942956567 2023-01-24 06:58:48.136906: step: 1136/530, loss: 0.01244097575545311 2023-01-24 06:58:49.175781: step: 1140/530, loss: 0.0014234735863283277 2023-01-24 06:58:50.225216: step: 1144/530, loss: 0.001032823696732521 2023-01-24 06:58:51.273190: step: 1148/530, loss: 0.0031111338175833225 2023-01-24 06:58:52.310699: step: 1152/530, loss: 0.00020250941452104598 2023-01-24 06:58:53.364578: step: 1156/530, loss: 0.005391637794673443 2023-01-24 06:58:54.408901: step: 1160/530, loss: 0.005741727538406849 2023-01-24 06:58:55.460685: step: 1164/530, loss: 0.0009992264676839113 2023-01-24 06:58:56.495156: step: 1168/530, loss: 0.00014529972395393997 2023-01-24 06:58:57.535923: step: 1172/530, loss: 0.002177294110879302 2023-01-24 06:58:58.581539: step: 1176/530, loss: 0.00029257911955937743 2023-01-24 06:58:59.617649: step: 1180/530, loss: 0.0 2023-01-24 06:59:00.666492: step: 1184/530, loss: 0.0031331698410212994 2023-01-24 06:59:01.710736: step: 1188/530, loss: 0.008023147471249104 2023-01-24 06:59:02.753374: step: 1192/530, loss: 0.00203211628831923 2023-01-24 06:59:03.821473: step: 1196/530, loss: 0.000991905340924859 2023-01-24 06:59:04.860393: step: 1200/530, loss: 0.005070593673735857 2023-01-24 06:59:05.902760: step: 1204/530, loss: 0.004027171526104212 2023-01-24 06:59:06.958185: step: 1208/530, loss: 0.004472642205655575 2023-01-24 06:59:08.027904: step: 1212/530, loss: 0.01647268608212471 2023-01-24 06:59:09.059675: step: 1216/530, loss: 0.0056014154106378555 2023-01-24 06:59:10.108608: step: 1220/530, loss: 0.00035225055762566626 2023-01-24 06:59:11.162369: step: 1224/530, loss: 0.0021586057264357805 2023-01-24 06:59:12.212685: step: 1228/530, loss: 0.0012377829989418387 2023-01-24 06:59:13.266344: step: 1232/530, loss: 0.0023653607349842787 2023-01-24 06:59:14.319136: step: 1236/530, loss: 0.0005897342343814671 2023-01-24 06:59:15.365912: step: 1240/530, loss: 0.005260581616312265 2023-01-24 06:59:16.421785: step: 1244/530, loss: 0.002286014147102833 2023-01-24 06:59:17.479262: step: 1248/530, loss: 0.0027143657207489014 2023-01-24 06:59:18.514352: step: 1252/530, loss: 0.003995587583631277 2023-01-24 06:59:19.544519: step: 1256/530, loss: 0.004028848838061094 2023-01-24 06:59:20.585972: step: 1260/530, loss: 0.00884984340518713 2023-01-24 06:59:21.637642: step: 1264/530, loss: 7.619905227329582e-05 2023-01-24 06:59:22.689198: step: 1268/530, loss: 0.003528781235218048 2023-01-24 06:59:23.723559: step: 1272/530, loss: 0.002885366789996624 2023-01-24 06:59:24.760341: step: 1276/530, loss: 0.0005106826429255307 2023-01-24 06:59:25.805826: step: 1280/530, loss: 0.031529735773801804 2023-01-24 06:59:26.843150: step: 1284/530, loss: 0.009394584223628044 2023-01-24 06:59:27.875450: step: 1288/530, loss: 0.0074567291885614395 2023-01-24 06:59:28.923037: step: 1292/530, loss: 0.010632209479808807 2023-01-24 06:59:29.959200: step: 1296/530, loss: 0.0037001834716647863 2023-01-24 06:59:30.995895: step: 1300/530, loss: 0.0012172827264294028 2023-01-24 06:59:32.022843: step: 1304/530, loss: 0.006315297447144985 2023-01-24 06:59:33.064325: step: 1308/530, loss: 0.001121440902352333 2023-01-24 06:59:34.121743: step: 1312/530, loss: 0.0015420080162584782 2023-01-24 06:59:35.183722: step: 1316/530, loss: 0.01011837087571621 2023-01-24 06:59:36.244558: step: 1320/530, loss: 0.0065863714553415775 2023-01-24 06:59:37.285240: step: 1324/530, loss: 0.006901334505528212 2023-01-24 06:59:38.330607: step: 1328/530, loss: 0.0003939066082239151 2023-01-24 06:59:39.365672: step: 1332/530, loss: 0.001131982309743762 2023-01-24 06:59:40.422848: step: 1336/530, loss: 0.0014619502471759915 2023-01-24 06:59:41.470520: step: 1340/530, loss: 0.008542369119822979 2023-01-24 06:59:42.512626: step: 1344/530, loss: 0.003910900093615055 2023-01-24 06:59:43.547764: step: 1348/530, loss: 0.004884009715169668 2023-01-24 06:59:44.585002: step: 1352/530, loss: 0.0007372616673819721 2023-01-24 06:59:45.613904: step: 1356/530, loss: 0.0012824038276448846 2023-01-24 06:59:46.662915: step: 1360/530, loss: 0.0023664666805416346 2023-01-24 06:59:47.694303: step: 1364/530, loss: 0.003511996241286397 2023-01-24 06:59:48.735990: step: 1368/530, loss: 0.0006677159108221531 2023-01-24 06:59:49.784031: step: 1372/530, loss: 0.01030261442065239 2023-01-24 06:59:50.830351: step: 1376/530, loss: 0.021198581904172897 2023-01-24 06:59:51.875141: step: 1380/530, loss: 0.003374363761395216 2023-01-24 06:59:52.911827: step: 1384/530, loss: 0.002790069906041026 2023-01-24 06:59:53.951251: step: 1388/530, loss: 0.010399678722023964 2023-01-24 06:59:54.984921: step: 1392/530, loss: 7.802563777659088e-05 2023-01-24 06:59:56.022318: step: 1396/530, loss: 0.0025065478403121233 2023-01-24 06:59:57.057475: step: 1400/530, loss: 0.002675700467079878 2023-01-24 06:59:58.092917: step: 1404/530, loss: 0.001919111586175859 2023-01-24 06:59:59.131739: step: 1408/530, loss: 0.003553468734025955 2023-01-24 07:00:00.171386: step: 1412/530, loss: 0.007829018868505955 2023-01-24 07:00:01.231890: step: 1416/530, loss: 0.0024773040786385536 2023-01-24 07:00:02.271584: step: 1420/530, loss: 0.006798421498388052 2023-01-24 07:00:03.294318: step: 1424/530, loss: 0.0011663369368761778 2023-01-24 07:00:04.329561: step: 1428/530, loss: 0.0018892490770667791 2023-01-24 07:00:05.376834: step: 1432/530, loss: 0.0055986130610108376 2023-01-24 07:00:06.424411: step: 1436/530, loss: 0.004060044884681702 2023-01-24 07:00:07.444044: step: 1440/530, loss: 0.0001568841253174469 2023-01-24 07:00:08.494372: step: 1444/530, loss: 0.010481741279363632 2023-01-24 07:00:09.538357: step: 1448/530, loss: 0.008694391697645187 2023-01-24 07:00:10.570268: step: 1452/530, loss: 0.008683069609105587 2023-01-24 07:00:11.603573: step: 1456/530, loss: 0.01155092753469944 2023-01-24 07:00:12.663395: step: 1460/530, loss: 0.008806398138403893 2023-01-24 07:00:13.696267: step: 1464/530, loss: 0.0004797578149009496 2023-01-24 07:00:14.737141: step: 1468/530, loss: 0.0009437146945856512 2023-01-24 07:00:15.776562: step: 1472/530, loss: 0.007920672185719013 2023-01-24 07:00:16.824052: step: 1476/530, loss: 0.00047152131446637213 2023-01-24 07:00:17.870618: step: 1480/530, loss: 0.004473808221518993 2023-01-24 07:00:18.913771: step: 1484/530, loss: 5.9020785556640476e-05 2023-01-24 07:00:19.948070: step: 1488/530, loss: 0.017084959894418716 2023-01-24 07:00:20.993623: step: 1492/530, loss: 0.010353378020226955 2023-01-24 07:00:22.041522: step: 1496/530, loss: 0.005473766475915909 2023-01-24 07:00:23.088683: step: 1500/530, loss: 0.010242610238492489 2023-01-24 07:00:24.116154: step: 1504/530, loss: 0.01161864772439003 2023-01-24 07:00:25.139952: step: 1508/530, loss: 0.01610509864985943 2023-01-24 07:00:26.172728: step: 1512/530, loss: 0.006201563868671656 2023-01-24 07:00:27.203556: step: 1516/530, loss: 0.003785045351833105 2023-01-24 07:00:28.246323: step: 1520/530, loss: 0.013776431791484356 2023-01-24 07:00:29.306510: step: 1524/530, loss: 0.002174972789362073 2023-01-24 07:00:30.336781: step: 1528/530, loss: 0.012499798089265823 2023-01-24 07:00:31.380384: step: 1532/530, loss: 0.007475248537957668 2023-01-24 07:00:32.417919: step: 1536/530, loss: 0.004212602507323027 2023-01-24 07:00:33.466811: step: 1540/530, loss: 0.0007367205107584596 2023-01-24 07:00:34.505002: step: 1544/530, loss: 0.005895259790122509 2023-01-24 07:00:35.536511: step: 1548/530, loss: 0.0001304114266531542 2023-01-24 07:00:36.594056: step: 1552/530, loss: 0.00027391480398364365 2023-01-24 07:00:37.646831: step: 1556/530, loss: 0.011168625205755234 2023-01-24 07:00:38.687804: step: 1560/530, loss: 2.434478301438503e-05 2023-01-24 07:00:39.758705: step: 1564/530, loss: 0.0012131110997870564 2023-01-24 07:00:40.798008: step: 1568/530, loss: 0.008057406172156334 2023-01-24 07:00:41.853604: step: 1572/530, loss: 0.0012467375490814447 2023-01-24 07:00:42.893066: step: 1576/530, loss: 0.0026619932614266872 2023-01-24 07:00:43.922652: step: 1580/530, loss: 0.004614337347447872 2023-01-24 07:00:44.968047: step: 1584/530, loss: 0.011366119608283043 2023-01-24 07:00:46.010760: step: 1588/530, loss: 0.005403272807598114 2023-01-24 07:00:47.057934: step: 1592/530, loss: 0.002521159127354622 2023-01-24 07:00:48.095436: step: 1596/530, loss: 0.0016460123006254435 2023-01-24 07:00:49.130162: step: 1600/530, loss: 0.002360695041716099 2023-01-24 07:00:50.172285: step: 1604/530, loss: 0.01360092032700777 2023-01-24 07:00:51.195344: step: 1608/530, loss: 0.00018616866145748645 2023-01-24 07:00:52.234091: step: 1612/530, loss: 0.004114161245524883 2023-01-24 07:00:53.286088: step: 1616/530, loss: 0.0011856280034407973 2023-01-24 07:00:54.324473: step: 1620/530, loss: 0.004183993209153414 2023-01-24 07:00:55.383328: step: 1624/530, loss: 0.004463567398488522 2023-01-24 07:00:56.423633: step: 1628/530, loss: 0.0063022952526807785 2023-01-24 07:00:57.458911: step: 1632/530, loss: 0.003606413723900914 2023-01-24 07:00:58.512461: step: 1636/530, loss: 0.023998545482754707 2023-01-24 07:00:59.555628: step: 1640/530, loss: 0.007433038670569658 2023-01-24 07:01:00.593209: step: 1644/530, loss: 0.009414362721145153 2023-01-24 07:01:01.634506: step: 1648/530, loss: 0.006173159461468458 2023-01-24 07:01:02.697735: step: 1652/530, loss: 0.0019051269628107548 2023-01-24 07:01:03.757062: step: 1656/530, loss: 0.0010178512893617153 2023-01-24 07:01:04.806399: step: 1660/530, loss: 0.012921225279569626 2023-01-24 07:01:05.865865: step: 1664/530, loss: 0.0008176472620107234 2023-01-24 07:01:06.911416: step: 1668/530, loss: 0.00013474744628183544 2023-01-24 07:01:07.960470: step: 1672/530, loss: 0.018266238272190094 2023-01-24 07:01:09.004741: step: 1676/530, loss: 0.0055892253294587135 2023-01-24 07:01:10.034368: step: 1680/530, loss: 0.022537048906087875 2023-01-24 07:01:11.071193: step: 1684/530, loss: 0.006122391205281019 2023-01-24 07:01:12.103841: step: 1688/530, loss: 0.0018234685994684696 2023-01-24 07:01:13.147558: step: 1692/530, loss: 0.001576649839989841 2023-01-24 07:01:14.186318: step: 1696/530, loss: 0.006582121830433607 2023-01-24 07:01:15.244270: step: 1700/530, loss: 0.003203270025551319 2023-01-24 07:01:16.295390: step: 1704/530, loss: 0.010848253965377808 2023-01-24 07:01:17.326864: step: 1708/530, loss: 0.004285692237317562 2023-01-24 07:01:18.371632: step: 1712/530, loss: 0.002168471459299326 2023-01-24 07:01:19.432327: step: 1716/530, loss: 0.010917812585830688 2023-01-24 07:01:20.465369: step: 1720/530, loss: 0.006417870055884123 2023-01-24 07:01:21.515299: step: 1724/530, loss: 0.006473662331700325 2023-01-24 07:01:22.572960: step: 1728/530, loss: 0.005470762494951487 2023-01-24 07:01:23.603382: step: 1732/530, loss: 0.0010238197864964604 2023-01-24 07:01:24.646212: step: 1736/530, loss: 0.0012448985362425447 2023-01-24 07:01:25.684910: step: 1740/530, loss: 0.0032532766927033663 2023-01-24 07:01:26.718436: step: 1744/530, loss: 0.006570354104042053 2023-01-24 07:01:27.754756: step: 1748/530, loss: 0.005573190748691559 2023-01-24 07:01:28.811021: step: 1752/530, loss: 0.0013920385390520096 2023-01-24 07:01:29.842561: step: 1756/530, loss: 0.005858817137777805 2023-01-24 07:01:30.877092: step: 1760/530, loss: 0.009732052683830261 2023-01-24 07:01:31.926925: step: 1764/530, loss: 0.00013912632130086422 2023-01-24 07:01:32.989867: step: 1768/530, loss: 0.029803238809108734 2023-01-24 07:01:34.037077: step: 1772/530, loss: 0.0030895352829247713 2023-01-24 07:01:35.109265: step: 1776/530, loss: 0.0022360854782164097 2023-01-24 07:01:36.160200: step: 1780/530, loss: 0.0047850823029875755 2023-01-24 07:01:37.183601: step: 1784/530, loss: 0.0059539941139519215 2023-01-24 07:01:38.223376: step: 1788/530, loss: 0.003803499508649111 2023-01-24 07:01:39.257093: step: 1792/530, loss: 0.004736559931188822 2023-01-24 07:01:40.300908: step: 1796/530, loss: 0.007367157377302647 2023-01-24 07:01:41.356531: step: 1800/530, loss: 0.002435927977785468 2023-01-24 07:01:42.404855: step: 1804/530, loss: 0.013856090605258942 2023-01-24 07:01:43.431638: step: 1808/530, loss: 0.006727796047925949 2023-01-24 07:01:44.473576: step: 1812/530, loss: 0.0030597266741096973 2023-01-24 07:01:45.522667: step: 1816/530, loss: 0.013682817108929157 2023-01-24 07:01:46.597767: step: 1820/530, loss: 0.01180302631109953 2023-01-24 07:01:47.639280: step: 1824/530, loss: 0.009305909276008606 2023-01-24 07:01:48.683821: step: 1828/530, loss: 0.0026737151201814413 2023-01-24 07:01:49.751388: step: 1832/530, loss: 0.01087513379752636 2023-01-24 07:01:50.798944: step: 1836/530, loss: 0.0030264933593571186 2023-01-24 07:01:51.845544: step: 1840/530, loss: 0.00417698360979557 2023-01-24 07:01:52.906823: step: 1844/530, loss: 0.022523457184433937 2023-01-24 07:01:53.958787: step: 1848/530, loss: 0.011807015165686607 2023-01-24 07:01:54.997868: step: 1852/530, loss: 0.004986438434571028 2023-01-24 07:01:56.037119: step: 1856/530, loss: 0.003538735443726182 2023-01-24 07:01:57.093994: step: 1860/530, loss: 0.003975627478212118 2023-01-24 07:01:58.142623: step: 1864/530, loss: 0.000582256936468184 2023-01-24 07:01:59.186459: step: 1868/530, loss: 0.00802086666226387 2023-01-24 07:02:00.225642: step: 1872/530, loss: 0.003350243903696537 2023-01-24 07:02:01.278646: step: 1876/530, loss: 0.006374271586537361 2023-01-24 07:02:02.323410: step: 1880/530, loss: 0.01305426750332117 2023-01-24 07:02:03.382762: step: 1884/530, loss: 0.005892110522836447 2023-01-24 07:02:04.452581: step: 1888/530, loss: 0.007200535852462053 2023-01-24 07:02:05.500902: step: 1892/530, loss: 0.0033678426407277584 2023-01-24 07:02:06.536013: step: 1896/530, loss: 0.018373841419816017 2023-01-24 07:02:07.583655: step: 1900/530, loss: 0.012094561010599136 2023-01-24 07:02:08.619522: step: 1904/530, loss: 0.024464663118124008 2023-01-24 07:02:09.698143: step: 1908/530, loss: 0.008913002908229828 2023-01-24 07:02:10.745088: step: 1912/530, loss: 0.006913756486028433 2023-01-24 07:02:11.780044: step: 1916/530, loss: 0.011059180833399296 2023-01-24 07:02:12.833495: step: 1920/530, loss: 0.006965978071093559 2023-01-24 07:02:13.873274: step: 1924/530, loss: 0.013344147242605686 2023-01-24 07:02:14.919305: step: 1928/530, loss: 0.0020171429496258497 2023-01-24 07:02:15.969946: step: 1932/530, loss: 0.0006166796083562076 2023-01-24 07:02:17.018913: step: 1936/530, loss: 0.006823674309998751 2023-01-24 07:02:18.052308: step: 1940/530, loss: 0.04783971607685089 2023-01-24 07:02:19.103079: step: 1944/530, loss: 0.003408369841054082 2023-01-24 07:02:20.144887: step: 1948/530, loss: 0.0006025812472216785 2023-01-24 07:02:21.195163: step: 1952/530, loss: 0.0001309165236307308 2023-01-24 07:02:22.223603: step: 1956/530, loss: 0.005067429039627314 2023-01-24 07:02:23.268101: step: 1960/530, loss: 0.0029683129396289587 2023-01-24 07:02:24.308148: step: 1964/530, loss: 0.00875820778310299 2023-01-24 07:02:25.351950: step: 1968/530, loss: 0.013712255284190178 2023-01-24 07:02:26.420661: step: 1972/530, loss: 0.04200352355837822 2023-01-24 07:02:27.482791: step: 1976/530, loss: 0.009647498838603497 2023-01-24 07:02:28.565546: step: 1980/530, loss: 0.06462786346673965 2023-01-24 07:02:29.609540: step: 1984/530, loss: 0.0012632659636437893 2023-01-24 07:02:30.649887: step: 1988/530, loss: 0.0013457417953759432 2023-01-24 07:02:31.684779: step: 1992/530, loss: 0.0013004661304876208 2023-01-24 07:02:32.759833: step: 1996/530, loss: 0.0040257591754198074 2023-01-24 07:02:33.829181: step: 2000/530, loss: 0.006593342870473862 2023-01-24 07:02:34.863227: step: 2004/530, loss: 0.006676852703094482 2023-01-24 07:02:35.912960: step: 2008/530, loss: 0.0016754663083702326 2023-01-24 07:02:36.962310: step: 2012/530, loss: 0.03920523822307587 2023-01-24 07:02:38.018121: step: 2016/530, loss: 0.0031775333918631077 2023-01-24 07:02:39.051934: step: 2020/530, loss: 0.003625443670898676 2023-01-24 07:02:40.083572: step: 2024/530, loss: 0.00023560876434203237 2023-01-24 07:02:41.125740: step: 2028/530, loss: 0.008078127168118954 2023-01-24 07:02:42.185830: step: 2032/530, loss: 0.00219753198325634 2023-01-24 07:02:43.241282: step: 2036/530, loss: 0.003684427822008729 2023-01-24 07:02:44.286153: step: 2040/530, loss: 0.0031191271264106035 2023-01-24 07:02:45.332941: step: 2044/530, loss: 0.015231509692966938 2023-01-24 07:02:46.376492: step: 2048/530, loss: 9.349261381430551e-05 2023-01-24 07:02:47.436113: step: 2052/530, loss: 0.005056777037680149 2023-01-24 07:02:48.484303: step: 2056/530, loss: 0.0019268053583800793 2023-01-24 07:02:49.552451: step: 2060/530, loss: 0.005498030688613653 2023-01-24 07:02:50.615565: step: 2064/530, loss: 0.003108419943600893 2023-01-24 07:02:51.654855: step: 2068/530, loss: 0.0227563064545393 2023-01-24 07:02:52.698738: step: 2072/530, loss: 0.0005292192217893898 2023-01-24 07:02:53.731458: step: 2076/530, loss: 0.007405600976198912 2023-01-24 07:02:54.779125: step: 2080/530, loss: 0.015298421494662762 2023-01-24 07:02:55.812903: step: 2084/530, loss: 0.007334030698984861 2023-01-24 07:02:56.880633: step: 2088/530, loss: 0.005176838021725416 2023-01-24 07:02:57.924594: step: 2092/530, loss: 0.005447547882795334 2023-01-24 07:02:58.955288: step: 2096/530, loss: 0.005433876533061266 2023-01-24 07:03:00.004941: step: 2100/530, loss: 0.0005200489540584385 2023-01-24 07:03:01.049527: step: 2104/530, loss: 0.0005241096368990839 2023-01-24 07:03:02.105789: step: 2108/530, loss: 0.0036094901151955128 2023-01-24 07:03:03.153972: step: 2112/530, loss: 0.0028713929932564497 2023-01-24 07:03:04.218816: step: 2116/530, loss: 0.003516589989885688 2023-01-24 07:03:05.261745: step: 2120/530, loss: 0.002706417115405202 ================================================== Loss: 0.006 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37360033259423503, 'r': 0.319722485768501, 'f1': 0.34456799591002046}, 'combined': 0.25389220751264663, 'stategy': 1, 'epoch': 10} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3764300537154685, 'r': 0.3916533279466088, 'f1': 0.38389082955487414}, 'combined': 0.29756131286071585, 'stategy': 1, 'epoch': 10} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38841283157558326, 'r': 0.3294507319056655, 'f1': 0.35651034027574074}, 'combined': 0.2626918296768616, 'stategy': 1, 'epoch': 10} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3730395733001985, 'r': 0.3696109007514834, 'f1': 0.37131732226926495}, 'combined': 0.2878153407063202, 'stategy': 1, 'epoch': 10} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38179098765787556, 'r': 0.3310787122573987, 'f1': 0.3546310596740836}, 'combined': 0.26130709660195633, 'stategy': 1, 'epoch': 10} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.363814560648306, 'r': 0.3641489490312548, 'f1': 0.3639816780395087}, 'combined': 0.28212933895885367, 'stategy': 1, 'epoch': 10} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 10} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5, 'r': 0.41304347826086957, 'f1': 0.45238095238095233}, 'combined': 0.22619047619047616, 'stategy': 1, 'epoch': 10} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 10} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37704166666666666, 'r': 0.32195208728652747, 'f1': 0.3473259979529171}, 'combined': 0.25592441954425466, 'stategy': 1, 'epoch': 6} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37621134584593835, 'r': 0.3907342102995499, 'f1': 0.3833352757492428}, 'combined': 0.29713069220754706, 'stategy': 1, 'epoch': 6} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 6} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38720415311180817, 'r': 0.33283393047371745, 'f1': 0.35796628848907985}, 'combined': 0.26376463362353253, 'stategy': 1, 'epoch': 8} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36421427197230394, 'r': 0.3625404931489018, 'f1': 0.3633754551322019}, 'combined': 0.28165944369098905, 'stategy': 1, 'epoch': 8} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 8} ****************************** Epoch: 11 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 07:05:30.782203: step: 4/530, loss: 0.014732468873262405 2023-01-24 07:05:31.841481: step: 8/530, loss: 0.0028864946216344833 2023-01-24 07:05:32.874936: step: 12/530, loss: 0.0020161960273981094 2023-01-24 07:05:33.917452: step: 16/530, loss: 0.006533683743327856 2023-01-24 07:05:34.957166: step: 20/530, loss: 0.0011061799013987184 2023-01-24 07:05:35.990070: step: 24/530, loss: 0.0022972780279815197 2023-01-24 07:05:37.023834: step: 28/530, loss: 0.013753408566117287 2023-01-24 07:05:38.054794: step: 32/530, loss: 0.0010170890018343925 2023-01-24 07:05:39.087913: step: 36/530, loss: 0.0029799004551023245 2023-01-24 07:05:40.123036: step: 40/530, loss: 0.004848646931350231 2023-01-24 07:05:41.160656: step: 44/530, loss: 0.013234319165349007 2023-01-24 07:05:42.230211: step: 48/530, loss: 0.0018025626195594668 2023-01-24 07:05:43.272679: step: 52/530, loss: 0.0023839380592107773 2023-01-24 07:05:44.316139: step: 56/530, loss: 0.005948647856712341 2023-01-24 07:05:45.365321: step: 60/530, loss: 0.0006430851062759757 2023-01-24 07:05:46.381330: step: 64/530, loss: 0.017871620133519173 2023-01-24 07:05:47.418927: step: 68/530, loss: 0.0011540284613147378 2023-01-24 07:05:48.471347: step: 72/530, loss: 0.002732044318690896 2023-01-24 07:05:49.524277: step: 76/530, loss: 0.009911269880831242 2023-01-24 07:05:50.578824: step: 80/530, loss: 0.007694334723055363 2023-01-24 07:05:51.622540: step: 84/530, loss: 0.0046738870441913605 2023-01-24 07:05:52.681554: step: 88/530, loss: 0.002184328157454729 2023-01-24 07:05:53.717543: step: 92/530, loss: 0.001338479807600379 2023-01-24 07:05:54.766014: step: 96/530, loss: 0.00044118042569607496 2023-01-24 07:05:55.816192: step: 100/530, loss: 0.006144620478153229 2023-01-24 07:05:56.859208: step: 104/530, loss: 0.0008150660432875156 2023-01-24 07:05:57.905945: step: 108/530, loss: 0.0009665843099355698 2023-01-24 07:05:58.938202: step: 112/530, loss: 0.0027098958380520344 2023-01-24 07:05:59.971022: step: 116/530, loss: 0.003707784228026867 2023-01-24 07:06:01.028626: step: 120/530, loss: 0.005503206048160791 2023-01-24 07:06:02.060028: step: 124/530, loss: 6.726011633872986e-05 2023-01-24 07:06:03.096979: step: 128/530, loss: 0.006648343056440353 2023-01-24 07:06:04.147413: step: 132/530, loss: 0.005515591241419315 2023-01-24 07:06:05.183968: step: 136/530, loss: 0.003134507220238447 2023-01-24 07:06:06.233256: step: 140/530, loss: 0.0019207580480724573 2023-01-24 07:06:07.273796: step: 144/530, loss: 0.0049347528256475925 2023-01-24 07:06:08.311200: step: 148/530, loss: 0.0008868713048286736 2023-01-24 07:06:09.358244: step: 152/530, loss: 0.004488816950470209 2023-01-24 07:06:10.415996: step: 156/530, loss: 0.0003686470736283809 2023-01-24 07:06:11.478250: step: 160/530, loss: 0.00496239960193634 2023-01-24 07:06:12.532602: step: 164/530, loss: 0.007017552852630615 2023-01-24 07:06:13.582010: step: 168/530, loss: 0.006619418039917946 2023-01-24 07:06:14.619033: step: 172/530, loss: 0.00120442733168602 2023-01-24 07:06:15.667602: step: 176/530, loss: 0.003372407518327236 2023-01-24 07:06:16.706382: step: 180/530, loss: 0.0007262969156727195 2023-01-24 07:06:17.757219: step: 184/530, loss: 0.0002291992277605459 2023-01-24 07:06:18.804458: step: 188/530, loss: 0.006633590906858444 2023-01-24 07:06:19.871744: step: 192/530, loss: 0.013781595043838024 2023-01-24 07:06:20.910888: step: 196/530, loss: 0.00397269893437624 2023-01-24 07:06:21.971885: step: 200/530, loss: 0.003798141609877348 2023-01-24 07:06:23.023810: step: 204/530, loss: 7.607981387991458e-05 2023-01-24 07:06:24.067001: step: 208/530, loss: 0.006034656427800655 2023-01-24 07:06:25.133723: step: 212/530, loss: 0.006624757777899504 2023-01-24 07:06:26.193476: step: 216/530, loss: 0.004910145420581102 2023-01-24 07:06:27.255271: step: 220/530, loss: 0.007574915885925293 2023-01-24 07:06:28.288356: step: 224/530, loss: 0.0004487109836190939 2023-01-24 07:06:29.357465: step: 228/530, loss: 0.005052222870290279 2023-01-24 07:06:30.400951: step: 232/530, loss: 0.003695308230817318 2023-01-24 07:06:31.438330: step: 236/530, loss: 0.005169919226318598 2023-01-24 07:06:32.493497: step: 240/530, loss: 0.0016193906776607037 2023-01-24 07:06:33.537498: step: 244/530, loss: 0.010608610697090626 2023-01-24 07:06:34.575939: step: 248/530, loss: 0.0003077667788602412 2023-01-24 07:06:35.630751: step: 252/530, loss: 0.0021962961181998253 2023-01-24 07:06:36.685114: step: 256/530, loss: 0.0013021163176745176 2023-01-24 07:06:37.741737: step: 260/530, loss: 0.00019832153338938951 2023-01-24 07:06:38.782453: step: 264/530, loss: 0.0001702180306892842 2023-01-24 07:06:39.853504: step: 268/530, loss: 0.0016734946984797716 2023-01-24 07:06:40.923220: step: 272/530, loss: 0.004190403502434492 2023-01-24 07:06:41.972746: step: 276/530, loss: 0.0017102285055443645 2023-01-24 07:06:43.005058: step: 280/530, loss: 0.003818391589447856 2023-01-24 07:06:44.043207: step: 284/530, loss: 0.0009121823241002858 2023-01-24 07:06:45.094767: step: 288/530, loss: 0.004632391035556793 2023-01-24 07:06:46.153558: step: 292/530, loss: 0.0039497497491538525 2023-01-24 07:06:47.208165: step: 296/530, loss: 0.0010743652237579226 2023-01-24 07:06:48.250069: step: 300/530, loss: 0.005997119937092066 2023-01-24 07:06:49.303117: step: 304/530, loss: 0.0011809875722974539 2023-01-24 07:06:50.350468: step: 308/530, loss: 0.0005545815220102668 2023-01-24 07:06:51.387361: step: 312/530, loss: 0.003112263511866331 2023-01-24 07:06:52.436295: step: 316/530, loss: 0.0022529102861881256 2023-01-24 07:06:53.489895: step: 320/530, loss: 0.0014832214219495654 2023-01-24 07:06:54.524331: step: 324/530, loss: 0.00045701867202296853 2023-01-24 07:06:55.582065: step: 328/530, loss: 0.002436557086184621 2023-01-24 07:06:56.631275: step: 332/530, loss: 0.004066962283104658 2023-01-24 07:06:57.680851: step: 336/530, loss: 0.00031431170646101236 2023-01-24 07:06:58.716654: step: 340/530, loss: 0.005977662745863199 2023-01-24 07:06:59.772052: step: 344/530, loss: 0.018425919115543365 2023-01-24 07:07:00.822101: step: 348/530, loss: 0.009702183306217194 2023-01-24 07:07:01.869824: step: 352/530, loss: 0.007989713922142982 2023-01-24 07:07:02.932221: step: 356/530, loss: 0.006221592891961336 2023-01-24 07:07:03.979153: step: 360/530, loss: 0.0003509514208417386 2023-01-24 07:07:05.044070: step: 364/530, loss: 0.02458922192454338 2023-01-24 07:07:06.096432: step: 368/530, loss: 0.004374512936919928 2023-01-24 07:07:07.151304: step: 372/530, loss: 0.0014963810099288821 2023-01-24 07:07:08.207331: step: 376/530, loss: 0.006841498427093029 2023-01-24 07:07:09.249693: step: 380/530, loss: 0.001976480707526207 2023-01-24 07:07:10.291417: step: 384/530, loss: 0.006298382300883532 2023-01-24 07:07:11.327599: step: 388/530, loss: 0.0032454037573188543 2023-01-24 07:07:12.375805: step: 392/530, loss: 0.00010955317702610046 2023-01-24 07:07:13.427855: step: 396/530, loss: 0.008563480339944363 2023-01-24 07:07:14.450969: step: 400/530, loss: 2.296617367392173e-06 2023-01-24 07:07:15.482309: step: 404/530, loss: 0.0125796590000391 2023-01-24 07:07:16.552233: step: 408/530, loss: 0.006920378189533949 2023-01-24 07:07:17.579541: step: 412/530, loss: 2.2984605152487347e-07 2023-01-24 07:07:18.642234: step: 416/530, loss: 0.011919056065380573 2023-01-24 07:07:19.698254: step: 420/530, loss: 0.005392361897975206 2023-01-24 07:07:20.747762: step: 424/530, loss: 0.00046365190064534545 2023-01-24 07:07:21.800453: step: 428/530, loss: 4.5761949877487496e-05 2023-01-24 07:07:22.838834: step: 432/530, loss: 0.00209265248849988 2023-01-24 07:07:23.868673: step: 436/530, loss: 0.00043662512325681746 2023-01-24 07:07:24.933595: step: 440/530, loss: 0.0016920986818149686 2023-01-24 07:07:25.985635: step: 444/530, loss: 0.0062765441834926605 2023-01-24 07:07:27.027466: step: 448/530, loss: 0.004424261394888163 2023-01-24 07:07:28.089858: step: 452/530, loss: 3.123496935586445e-05 2023-01-24 07:07:29.136716: step: 456/530, loss: 0.009037133306264877 2023-01-24 07:07:30.174836: step: 460/530, loss: 0.005026660859584808 2023-01-24 07:07:31.210606: step: 464/530, loss: 0.019944775849580765 2023-01-24 07:07:32.259342: step: 468/530, loss: 0.00170858611818403 2023-01-24 07:07:33.308191: step: 472/530, loss: 0.002845579292625189 2023-01-24 07:07:34.363042: step: 476/530, loss: 7.603465746797156e-06 2023-01-24 07:07:35.398746: step: 480/530, loss: 0.002625692170113325 2023-01-24 07:07:36.453915: step: 484/530, loss: 0.010671021416783333 2023-01-24 07:07:37.509796: step: 488/530, loss: 0.0012438567355275154 2023-01-24 07:07:38.554900: step: 492/530, loss: 0.0005785999237559736 2023-01-24 07:07:39.608539: step: 496/530, loss: 0.00040261042886413634 2023-01-24 07:07:40.668160: step: 500/530, loss: 0.0013927269028499722 2023-01-24 07:07:41.719767: step: 504/530, loss: 0.013707629404962063 2023-01-24 07:07:42.767454: step: 508/530, loss: 0.033509571105241776 2023-01-24 07:07:43.841977: step: 512/530, loss: 0.0035408353433012962 2023-01-24 07:07:44.874698: step: 516/530, loss: 0.004781695548444986 2023-01-24 07:07:45.925537: step: 520/530, loss: 0.01198268961161375 2023-01-24 07:07:46.974655: step: 524/530, loss: 0.0027435270603746176 2023-01-24 07:07:48.033977: step: 528/530, loss: 0.005994144827127457 2023-01-24 07:07:49.078299: step: 532/530, loss: 0.0030710676219314337 2023-01-24 07:07:50.118910: step: 536/530, loss: 0.005427483003586531 2023-01-24 07:07:51.185575: step: 540/530, loss: 0.006961643695831299 2023-01-24 07:07:52.237596: step: 544/530, loss: 0.008791901171207428 2023-01-24 07:07:53.283177: step: 548/530, loss: 0.01079469732940197 2023-01-24 07:07:54.328031: step: 552/530, loss: 0.004237785469740629 2023-01-24 07:07:55.380499: step: 556/530, loss: 0.0012691307347267866 2023-01-24 07:07:56.446922: step: 560/530, loss: 0.0028314045630395412 2023-01-24 07:07:57.491666: step: 564/530, loss: 0.006784523371607065 2023-01-24 07:07:58.590685: step: 568/530, loss: 0.0025259586982429028 2023-01-24 07:07:59.619248: step: 572/530, loss: 0.00791935808956623 2023-01-24 07:08:00.676271: step: 576/530, loss: 0.011753004975616932 2023-01-24 07:08:01.729268: step: 580/530, loss: 0.0011276863515377045 2023-01-24 07:08:02.786303: step: 584/530, loss: 0.0020637616980820894 2023-01-24 07:08:03.851542: step: 588/530, loss: 0.0011130035854876041 2023-01-24 07:08:04.887185: step: 592/530, loss: 0.0008342540240846574 2023-01-24 07:08:05.940672: step: 596/530, loss: 0.0031309123151004314 2023-01-24 07:08:06.988300: step: 600/530, loss: 0.00013287067122291774 2023-01-24 07:08:08.058066: step: 604/530, loss: 0.0010609551100060344 2023-01-24 07:08:09.102748: step: 608/530, loss: 0.0010218010284006596 2023-01-24 07:08:10.147450: step: 612/530, loss: 0.0026290242094546556 2023-01-24 07:08:11.217524: step: 616/530, loss: 0.004376406781375408 2023-01-24 07:08:12.271125: step: 620/530, loss: 0.007087917998433113 2023-01-24 07:08:13.309722: step: 624/530, loss: 0.0009887524647638202 2023-01-24 07:08:14.351650: step: 628/530, loss: 0.001968992408365011 2023-01-24 07:08:15.407007: step: 632/530, loss: 0.005853585433214903 2023-01-24 07:08:16.448272: step: 636/530, loss: 0.0028284352738410234 2023-01-24 07:08:17.516054: step: 640/530, loss: 0.0052115130238235 2023-01-24 07:08:18.577027: step: 644/530, loss: 0.0021591002587229013 2023-01-24 07:08:19.622964: step: 648/530, loss: 0.0015258598141372204 2023-01-24 07:08:20.671936: step: 652/530, loss: 0.0013785124756395817 2023-01-24 07:08:21.728205: step: 656/530, loss: 0.0057843835093081 2023-01-24 07:08:22.771654: step: 660/530, loss: 0.0005512493080459535 2023-01-24 07:08:23.804701: step: 664/530, loss: 0.0026957234367728233 2023-01-24 07:08:24.864590: step: 668/530, loss: 0.0016912787687033415 2023-01-24 07:08:25.917843: step: 672/530, loss: 0.000615813594777137 2023-01-24 07:08:26.965646: step: 676/530, loss: 0.0016245465958490968 2023-01-24 07:08:28.017558: step: 680/530, loss: 0.00029056810308247805 2023-01-24 07:08:29.064850: step: 684/530, loss: 0.009288286790251732 2023-01-24 07:08:30.116692: step: 688/530, loss: 0.0038950475864112377 2023-01-24 07:08:31.174620: step: 692/530, loss: 0.014622300863265991 2023-01-24 07:08:32.238802: step: 696/530, loss: 0.000449638202553615 2023-01-24 07:08:33.276488: step: 700/530, loss: 0.0030872058123350143 2023-01-24 07:08:34.305125: step: 704/530, loss: 0.010924331843852997 2023-01-24 07:08:35.362636: step: 708/530, loss: 0.021274017170071602 2023-01-24 07:08:36.416452: step: 712/530, loss: 0.002134650945663452 2023-01-24 07:08:37.456664: step: 716/530, loss: 0.007354495581239462 2023-01-24 07:08:38.521165: step: 720/530, loss: 0.0027587036602199078 2023-01-24 07:08:39.564383: step: 724/530, loss: 0.0041638207621872425 2023-01-24 07:08:40.602192: step: 728/530, loss: 0.004001552704721689 2023-01-24 07:08:41.660810: step: 732/530, loss: 0.019353656098246574 2023-01-24 07:08:42.721538: step: 736/530, loss: 0.016189612448215485 2023-01-24 07:08:43.772964: step: 740/530, loss: 0.0039147185161709785 2023-01-24 07:08:44.826312: step: 744/530, loss: 0.002381126396358013 2023-01-24 07:08:45.868434: step: 748/530, loss: 0.007057988550513983 2023-01-24 07:08:46.929078: step: 752/530, loss: 0.0011352099245414138 2023-01-24 07:08:47.970624: step: 756/530, loss: 0.0017084140563383698 2023-01-24 07:08:49.029692: step: 760/530, loss: 0.00591560173779726 2023-01-24 07:08:50.085821: step: 764/530, loss: 0.0031700143590569496 2023-01-24 07:08:51.139505: step: 768/530, loss: 0.005508203990757465 2023-01-24 07:08:52.176293: step: 772/530, loss: 0.003756421385332942 2023-01-24 07:08:53.236239: step: 776/530, loss: 0.004410235211253166 2023-01-24 07:08:54.274255: step: 780/530, loss: 0.005047455430030823 2023-01-24 07:08:55.352427: step: 784/530, loss: 0.02436165325343609 2023-01-24 07:08:56.407093: step: 788/530, loss: 0.004335152916610241 2023-01-24 07:08:57.457202: step: 792/530, loss: 2.823642546445626e-07 2023-01-24 07:08:58.523686: step: 796/530, loss: 0.005086805205792189 2023-01-24 07:08:59.583798: step: 800/530, loss: 0.03161008283495903 2023-01-24 07:09:00.628088: step: 804/530, loss: 0.006230564787983894 2023-01-24 07:09:01.707200: step: 808/530, loss: 0.04716207832098007 2023-01-24 07:09:02.755201: step: 812/530, loss: 0.0014297384768724442 2023-01-24 07:09:03.800537: step: 816/530, loss: 0.005765952169895172 2023-01-24 07:09:04.843098: step: 820/530, loss: 0.013006582856178284 2023-01-24 07:09:05.893670: step: 824/530, loss: 0.005235032178461552 2023-01-24 07:09:06.941484: step: 828/530, loss: 0.0016357704298570752 2023-01-24 07:09:07.987824: step: 832/530, loss: 0.006815879140049219 2023-01-24 07:09:09.031925: step: 836/530, loss: 0.004032469354569912 2023-01-24 07:09:10.093536: step: 840/530, loss: 0.002506756689399481 2023-01-24 07:09:11.152258: step: 844/530, loss: 0.004679025150835514 2023-01-24 07:09:12.208599: step: 848/530, loss: 0.00025164702674373984 2023-01-24 07:09:13.249719: step: 852/530, loss: 0.002013260265812278 2023-01-24 07:09:14.291290: step: 856/530, loss: 0.0005976912216283381 2023-01-24 07:09:15.346371: step: 860/530, loss: 0.013096915557980537 2023-01-24 07:09:16.405448: step: 864/530, loss: 0.007861674763262272 2023-01-24 07:09:17.445437: step: 868/530, loss: 0.007597321644425392 2023-01-24 07:09:18.469370: step: 872/530, loss: 0.001777428900822997 2023-01-24 07:09:19.520366: step: 876/530, loss: 0.014843094162642956 2023-01-24 07:09:20.587837: step: 880/530, loss: 0.026443898677825928 2023-01-24 07:09:21.635738: step: 884/530, loss: 0.0011534770019352436 2023-01-24 07:09:22.693078: step: 888/530, loss: 0.00039898071554489434 2023-01-24 07:09:23.747833: step: 892/530, loss: 0.006618919316679239 2023-01-24 07:09:24.803299: step: 896/530, loss: 0.008538229390978813 2023-01-24 07:09:25.838584: step: 900/530, loss: 0.005873043555766344 2023-01-24 07:09:26.915569: step: 904/530, loss: 0.012603625655174255 2023-01-24 07:09:27.981661: step: 908/530, loss: 0.004822163376957178 2023-01-24 07:09:29.039772: step: 912/530, loss: 0.0022861638572067022 2023-01-24 07:09:30.089011: step: 916/530, loss: 0.009433708153665066 2023-01-24 07:09:31.143617: step: 920/530, loss: 0.0018214863957837224 2023-01-24 07:09:32.197792: step: 924/530, loss: 0.001309029757976532 2023-01-24 07:09:33.297556: step: 928/530, loss: 0.03557188808917999 2023-01-24 07:09:34.335602: step: 932/530, loss: 0.007164108566939831 2023-01-24 07:09:35.382745: step: 936/530, loss: 0.0006070815143175423 2023-01-24 07:09:36.422719: step: 940/530, loss: 0.005502901040017605 2023-01-24 07:09:37.455366: step: 944/530, loss: 0.0027077256236225367 2023-01-24 07:09:38.494222: step: 948/530, loss: 0.004954319912940264 2023-01-24 07:09:39.552456: step: 952/530, loss: 0.005388965364545584 2023-01-24 07:09:40.589463: step: 956/530, loss: 0.005542172584682703 2023-01-24 07:09:41.636822: step: 960/530, loss: 0.006731236819177866 2023-01-24 07:09:42.682307: step: 964/530, loss: 0.006250726990401745 2023-01-24 07:09:43.740769: step: 968/530, loss: 0.010224927216768265 2023-01-24 07:09:44.812138: step: 972/530, loss: 0.009152201004326344 2023-01-24 07:09:45.869411: step: 976/530, loss: 0.0055384766310453415 2023-01-24 07:09:46.916343: step: 980/530, loss: 1.5087374549693777e-07 2023-01-24 07:09:47.976599: step: 984/530, loss: 0.005073467269539833 2023-01-24 07:09:49.022068: step: 988/530, loss: 0.002183017088100314 2023-01-24 07:09:50.069469: step: 992/530, loss: 0.004343661945313215 2023-01-24 07:09:51.130419: step: 996/530, loss: 0.0021708407439291477 2023-01-24 07:09:52.188226: step: 1000/530, loss: 0.0024626783560961485 2023-01-24 07:09:53.234883: step: 1004/530, loss: 0.0016927821561694145 2023-01-24 07:09:54.288351: step: 1008/530, loss: 0.0043599558994174 2023-01-24 07:09:55.342277: step: 1012/530, loss: 0.0026770462282001972 2023-01-24 07:09:56.383244: step: 1016/530, loss: 0.002781082410365343 2023-01-24 07:09:57.429588: step: 1020/530, loss: 0.004273316357284784 2023-01-24 07:09:58.469524: step: 1024/530, loss: 0.00024193669378291816 2023-01-24 07:09:59.533535: step: 1028/530, loss: 0.00485656363889575 2023-01-24 07:10:00.586343: step: 1032/530, loss: 0.004452936816960573 2023-01-24 07:10:01.636635: step: 1036/530, loss: 0.0025070100091397762 2023-01-24 07:10:02.692947: step: 1040/530, loss: 0.001395134488120675 2023-01-24 07:10:03.741015: step: 1044/530, loss: 0.00028120604110881686 2023-01-24 07:10:04.788687: step: 1048/530, loss: 0.0003076897992286831 2023-01-24 07:10:05.838028: step: 1052/530, loss: 0.0025341338478028774 2023-01-24 07:10:06.883443: step: 1056/530, loss: 0.006551379803568125 2023-01-24 07:10:07.922967: step: 1060/530, loss: 0.005033473484218121 2023-01-24 07:10:08.962451: step: 1064/530, loss: 0.008835405111312866 2023-01-24 07:10:10.027942: step: 1068/530, loss: 0.0028214084450155497 2023-01-24 07:10:11.079844: step: 1072/530, loss: 0.008950789459049702 2023-01-24 07:10:12.117462: step: 1076/530, loss: 0.0014356850879266858 2023-01-24 07:10:13.150939: step: 1080/530, loss: 0.00247561139985919 2023-01-24 07:10:14.198306: step: 1084/530, loss: 0.01638169027864933 2023-01-24 07:10:15.248881: step: 1088/530, loss: 0.0026480292435735464 2023-01-24 07:10:16.332232: step: 1092/530, loss: 0.005513367708772421 2023-01-24 07:10:17.367418: step: 1096/530, loss: 0.0071080029010772705 2023-01-24 07:10:18.404337: step: 1100/530, loss: 0.008038556203246117 2023-01-24 07:10:19.441790: step: 1104/530, loss: 0.0076973047107458115 2023-01-24 07:10:20.478611: step: 1108/530, loss: 0.006864570081233978 2023-01-24 07:10:21.520574: step: 1112/530, loss: 0.006138910073786974 2023-01-24 07:10:22.557886: step: 1116/530, loss: 0.003295325906947255 2023-01-24 07:10:23.606455: step: 1120/530, loss: 0.0032680127769708633 2023-01-24 07:10:24.642402: step: 1124/530, loss: 0.0033776836935430765 2023-01-24 07:10:25.708791: step: 1128/530, loss: 7.359675691986922e-06 2023-01-24 07:10:26.748302: step: 1132/530, loss: 0.00015860758139751852 2023-01-24 07:10:27.778246: step: 1136/530, loss: 0.0003294216876383871 2023-01-24 07:10:28.828690: step: 1140/530, loss: 0.003498536068946123 2023-01-24 07:10:29.879798: step: 1144/530, loss: 0.0031569499988108873 2023-01-24 07:10:30.929349: step: 1148/530, loss: 0.0011496113147586584 2023-01-24 07:10:31.981776: step: 1152/530, loss: 0.001786165637895465 2023-01-24 07:10:33.018450: step: 1156/530, loss: 0.004533456638455391 2023-01-24 07:10:34.052417: step: 1160/530, loss: 0.013620489276945591 2023-01-24 07:10:35.093353: step: 1164/530, loss: 0.0005204153130762279 2023-01-24 07:10:36.128548: step: 1168/530, loss: 0.0036813293118029833 2023-01-24 07:10:37.176601: step: 1172/530, loss: 0.0005867261788807809 2023-01-24 07:10:38.235781: step: 1176/530, loss: 0.0030796497594565153 2023-01-24 07:10:39.274754: step: 1180/530, loss: 0.0002512074715923518 2023-01-24 07:10:40.326385: step: 1184/530, loss: 0.03189973533153534 2023-01-24 07:10:41.372773: step: 1188/530, loss: 0.0011992198415100574 2023-01-24 07:10:42.413045: step: 1192/530, loss: 0.010631580837070942 2023-01-24 07:10:43.448321: step: 1196/530, loss: 0.009094943292438984 2023-01-24 07:10:44.481447: step: 1200/530, loss: 0.0006700368248857558 2023-01-24 07:10:45.528741: step: 1204/530, loss: 0.003930522594600916 2023-01-24 07:10:46.573973: step: 1208/530, loss: 0.002903315704315901 2023-01-24 07:10:47.614402: step: 1212/530, loss: 0.004415900446474552 2023-01-24 07:10:48.651649: step: 1216/530, loss: 0.0010305369505658746 2023-01-24 07:10:49.703470: step: 1220/530, loss: 0.006731036584824324 2023-01-24 07:10:50.748131: step: 1224/530, loss: 0.00722704129293561 2023-01-24 07:10:51.787650: step: 1228/530, loss: 0.018307218328118324 2023-01-24 07:10:52.850109: step: 1232/530, loss: 0.05539613589644432 2023-01-24 07:10:53.890806: step: 1236/530, loss: 0.0029454559553414583 2023-01-24 07:10:54.944163: step: 1240/530, loss: 0.007397875189781189 2023-01-24 07:10:55.996064: step: 1244/530, loss: 0.0032214312814176083 2023-01-24 07:10:57.045495: step: 1248/530, loss: 0.003888509701937437 2023-01-24 07:10:58.084797: step: 1252/530, loss: 0.009760660119354725 2023-01-24 07:10:59.118646: step: 1256/530, loss: 0.007573803421109915 2023-01-24 07:11:00.171581: step: 1260/530, loss: 0.022202182561159134 2023-01-24 07:11:01.220677: step: 1264/530, loss: 0.005713118240237236 2023-01-24 07:11:02.264352: step: 1268/530, loss: 0.004170641303062439 2023-01-24 07:11:03.331907: step: 1272/530, loss: 0.004473092500120401 2023-01-24 07:11:04.371009: step: 1276/530, loss: 0.011876476928591728 2023-01-24 07:11:05.409446: step: 1280/530, loss: 0.005746433511376381 2023-01-24 07:11:06.454856: step: 1284/530, loss: 0.0008601548615843058 2023-01-24 07:11:07.499443: step: 1288/530, loss: 0.005444884765893221 2023-01-24 07:11:08.556983: step: 1292/530, loss: 0.024241046980023384 2023-01-24 07:11:09.610090: step: 1296/530, loss: 0.0017819450004026294 2023-01-24 07:11:10.647420: step: 1300/530, loss: 0.01759078912436962 2023-01-24 07:11:11.688215: step: 1304/530, loss: 0.0006419402780011296 2023-01-24 07:11:12.723222: step: 1308/530, loss: 0.009541204199194908 2023-01-24 07:11:13.774365: step: 1312/530, loss: 0.00030007094028405845 2023-01-24 07:11:14.829443: step: 1316/530, loss: 0.004012543708086014 2023-01-24 07:11:15.858713: step: 1320/530, loss: 0.003850433975458145 2023-01-24 07:11:16.898314: step: 1324/530, loss: 0.001178127247840166 2023-01-24 07:11:17.942709: step: 1328/530, loss: 0.007947556674480438 2023-01-24 07:11:18.999293: step: 1332/530, loss: 0.004746435675770044 2023-01-24 07:11:20.033705: step: 1336/530, loss: 0.003821619786322117 2023-01-24 07:11:21.069117: step: 1340/530, loss: 0.0006737510557286441 2023-01-24 07:11:22.108538: step: 1344/530, loss: 0.015957266092300415 2023-01-24 07:11:23.147117: step: 1348/530, loss: 0.005501211155205965 2023-01-24 07:11:24.192559: step: 1352/530, loss: 0.0033074773382395506 2023-01-24 07:11:25.229807: step: 1356/530, loss: 0.0009623094229027629 2023-01-24 07:11:26.261108: step: 1360/530, loss: 0.000806731462944299 2023-01-24 07:11:27.313835: step: 1364/530, loss: 0.0020697119180113077 2023-01-24 07:11:28.358846: step: 1368/530, loss: 0.0010327850468456745 2023-01-24 07:11:29.384713: step: 1372/530, loss: 0.0012403945438563824 2023-01-24 07:11:30.436892: step: 1376/530, loss: 0.001363015966489911 2023-01-24 07:11:31.482718: step: 1380/530, loss: 0.0006392548675648868 2023-01-24 07:11:32.525139: step: 1384/530, loss: 0.0020197764970362186 2023-01-24 07:11:33.573283: step: 1388/530, loss: 0.0009072396787814796 2023-01-24 07:11:34.625476: step: 1392/530, loss: 0.0030043385922908783 2023-01-24 07:11:35.675335: step: 1396/530, loss: 0.009019937366247177 2023-01-24 07:11:36.723899: step: 1400/530, loss: 0.004924031440168619 2023-01-24 07:11:37.775264: step: 1404/530, loss: 0.010605115443468094 2023-01-24 07:11:38.845924: step: 1408/530, loss: 0.0039377338252961636 2023-01-24 07:11:39.891644: step: 1412/530, loss: 0.005646178964525461 2023-01-24 07:11:40.940896: step: 1416/530, loss: 0.0025246378500014544 2023-01-24 07:11:41.984132: step: 1420/530, loss: 0.0012028859928250313 2023-01-24 07:11:43.023759: step: 1424/530, loss: 0.0008891834877431393 2023-01-24 07:11:44.076509: step: 1428/530, loss: 0.003501572646200657 2023-01-24 07:11:45.111545: step: 1432/530, loss: 0.0033416440710425377 2023-01-24 07:11:46.151780: step: 1436/530, loss: 0.004756961949169636 2023-01-24 07:11:47.206953: step: 1440/530, loss: 0.0018819908145815134 2023-01-24 07:11:48.260079: step: 1444/530, loss: 0.002732961205765605 2023-01-24 07:11:49.310027: step: 1448/530, loss: 0.002800561022013426 2023-01-24 07:11:50.357985: step: 1452/530, loss: 0.0005214640987105668 2023-01-24 07:11:51.432230: step: 1456/530, loss: 0.006584409158676863 2023-01-24 07:11:52.474166: step: 1460/530, loss: 0.0034163668751716614 2023-01-24 07:11:53.531689: step: 1464/530, loss: 0.009226624853909016 2023-01-24 07:11:54.583001: step: 1468/530, loss: 0.00355134648270905 2023-01-24 07:11:55.630991: step: 1472/530, loss: 0.0009333228226751089 2023-01-24 07:11:56.671821: step: 1476/530, loss: 0.0017866671551018953 2023-01-24 07:11:57.714327: step: 1480/530, loss: 0.015849852934479713 2023-01-24 07:11:58.766644: step: 1484/530, loss: 0.0033516413532197475 2023-01-24 07:11:59.818861: step: 1488/530, loss: 0.0004385552601888776 2023-01-24 07:12:00.879502: step: 1492/530, loss: 0.003435111604630947 2023-01-24 07:12:01.928596: step: 1496/530, loss: 0.0068300343118608 2023-01-24 07:12:02.982978: step: 1500/530, loss: 0.0062282937578856945 2023-01-24 07:12:04.030166: step: 1504/530, loss: 0.007188333664089441 2023-01-24 07:12:05.061560: step: 1508/530, loss: 0.0021044963505119085 2023-01-24 07:12:06.100855: step: 1512/530, loss: 0.0014146534958854318 2023-01-24 07:12:07.140238: step: 1516/530, loss: 0.000188202437129803 2023-01-24 07:12:08.177148: step: 1520/530, loss: 0.0015249266289174557 2023-01-24 07:12:09.213579: step: 1524/530, loss: 0.019841352477669716 2023-01-24 07:12:10.262689: step: 1528/530, loss: 0.013087257742881775 2023-01-24 07:12:11.304670: step: 1532/530, loss: 0.0031631398014724255 2023-01-24 07:12:12.349194: step: 1536/530, loss: 0.004450693726539612 2023-01-24 07:12:13.394158: step: 1540/530, loss: 0.00632547028362751 2023-01-24 07:12:14.436892: step: 1544/530, loss: 0.0056480467319488525 2023-01-24 07:12:15.467842: step: 1548/530, loss: 0.017980292439460754 2023-01-24 07:12:16.506218: step: 1552/530, loss: 0.006080025341361761 2023-01-24 07:12:17.573720: step: 1556/530, loss: 0.002057814970612526 2023-01-24 07:12:18.615657: step: 1560/530, loss: 0.00877632386982441 2023-01-24 07:12:19.659617: step: 1564/530, loss: 1.4071784789848607e-05 2023-01-24 07:12:20.703221: step: 1568/530, loss: 0.003770629409700632 2023-01-24 07:12:21.735174: step: 1572/530, loss: 0.001053656218573451 2023-01-24 07:12:22.792486: step: 1576/530, loss: 0.0025587636046111584 2023-01-24 07:12:23.833600: step: 1580/530, loss: 0.005507788620889187 2023-01-24 07:12:24.880377: step: 1584/530, loss: 0.01527484506368637 2023-01-24 07:12:25.921127: step: 1588/530, loss: 0.01617465354502201 2023-01-24 07:12:26.963425: step: 1592/530, loss: 0.0035356669686734676 2023-01-24 07:12:28.013962: step: 1596/530, loss: 0.002311212010681629 2023-01-24 07:12:29.046085: step: 1600/530, loss: 0.0016364060575142503 2023-01-24 07:12:30.074535: step: 1604/530, loss: 0.0013877179007977247 2023-01-24 07:12:31.143320: step: 1608/530, loss: 0.0070881107822060585 2023-01-24 07:12:32.191633: step: 1612/530, loss: 1.250940294994507e-05 2023-01-24 07:12:33.244105: step: 1616/530, loss: 0.01038957666605711 2023-01-24 07:12:34.297077: step: 1620/530, loss: 0.001286824350245297 2023-01-24 07:12:35.358376: step: 1624/530, loss: 0.009222668595612049 2023-01-24 07:12:36.408109: step: 1628/530, loss: 0.0006454787217080593 2023-01-24 07:12:37.457918: step: 1632/530, loss: 0.006494362372905016 2023-01-24 07:12:38.492035: step: 1636/530, loss: 0.0015890697250142694 2023-01-24 07:12:39.541822: step: 1640/530, loss: 0.0045647588558495045 2023-01-24 07:12:40.579162: step: 1644/530, loss: 0.0002089084155159071 2023-01-24 07:12:41.634256: step: 1648/530, loss: 0.004456041846424341 2023-01-24 07:12:42.672827: step: 1652/530, loss: 0.00011728770914487541 2023-01-24 07:12:43.706902: step: 1656/530, loss: 0.002299683867022395 2023-01-24 07:12:44.742260: step: 1660/530, loss: 0.0023643369786441326 2023-01-24 07:12:45.771141: step: 1664/530, loss: 0.0036206389777362347 2023-01-24 07:12:46.833137: step: 1668/530, loss: 0.006230282597243786 2023-01-24 07:12:47.872995: step: 1672/530, loss: 0.0019537578336894512 2023-01-24 07:12:48.916613: step: 1676/530, loss: 6.323368870653212e-05 2023-01-24 07:12:49.978476: step: 1680/530, loss: 0.005761615000665188 2023-01-24 07:12:51.008460: step: 1684/530, loss: 0.00046067178482189775 2023-01-24 07:12:52.046898: step: 1688/530, loss: 0.0036656286101788282 2023-01-24 07:12:53.102291: step: 1692/530, loss: 0.012993012554943562 2023-01-24 07:12:54.142273: step: 1696/530, loss: 0.002271597972139716 2023-01-24 07:12:55.179786: step: 1700/530, loss: 0.0034315655939280987 2023-01-24 07:12:56.211120: step: 1704/530, loss: 0.0003701582318171859 2023-01-24 07:12:57.249706: step: 1708/530, loss: 0.014921503141522408 2023-01-24 07:12:58.277950: step: 1712/530, loss: 0.0035794973373413086 2023-01-24 07:12:59.301413: step: 1716/530, loss: 0.013946876861155033 2023-01-24 07:13:00.331575: step: 1720/530, loss: 0.004493516869843006 2023-01-24 07:13:01.370058: step: 1724/530, loss: 0.000817067688331008 2023-01-24 07:13:02.416540: step: 1728/530, loss: 0.006036113481968641 2023-01-24 07:13:03.471753: step: 1732/530, loss: 0.004596680868417025 2023-01-24 07:13:04.507895: step: 1736/530, loss: 0.0007401639595627785 2023-01-24 07:13:05.557903: step: 1740/530, loss: 0.006351632997393608 2023-01-24 07:13:06.606201: step: 1744/530, loss: 8.505427103955299e-05 2023-01-24 07:13:07.661345: step: 1748/530, loss: 0.00013968886923976243 2023-01-24 07:13:08.718760: step: 1752/530, loss: 0.004467634949833155 2023-01-24 07:13:09.754549: step: 1756/530, loss: 0.005428646225482225 2023-01-24 07:13:10.804949: step: 1760/530, loss: 0.027409780770540237 2023-01-24 07:13:11.840997: step: 1764/530, loss: 0.0029004737734794617 2023-01-24 07:13:12.865838: step: 1768/530, loss: 3.3422054457332706e-06 2023-01-24 07:13:13.917533: step: 1772/530, loss: 0.0032002448569983244 2023-01-24 07:13:14.964716: step: 1776/530, loss: 0.006825991906225681 2023-01-24 07:13:16.017483: step: 1780/530, loss: 0.014038383960723877 2023-01-24 07:13:17.064717: step: 1784/530, loss: 0.003744417568668723 2023-01-24 07:13:18.106414: step: 1788/530, loss: 0.004952542949467897 2023-01-24 07:13:19.151581: step: 1792/530, loss: 0.003103705821558833 2023-01-24 07:13:20.195641: step: 1796/530, loss: 0.01318169105798006 2023-01-24 07:13:21.234440: step: 1800/530, loss: 0.0002455712528899312 2023-01-24 07:13:22.270237: step: 1804/530, loss: 0.0026007883716374636 2023-01-24 07:13:23.332427: step: 1808/530, loss: 0.0029576849192380905 2023-01-24 07:13:24.374462: step: 1812/530, loss: 0.003828586544841528 2023-01-24 07:13:25.406010: step: 1816/530, loss: 0.004853245336562395 2023-01-24 07:13:26.434365: step: 1820/530, loss: 0.003916988614946604 2023-01-24 07:13:27.485628: step: 1824/530, loss: 0.0003066852514166385 2023-01-24 07:13:28.524638: step: 1828/530, loss: 0.004145803861320019 2023-01-24 07:13:29.573661: step: 1832/530, loss: 0.0013616053620353341 2023-01-24 07:13:30.629971: step: 1836/530, loss: 0.005522761959582567 2023-01-24 07:13:31.680012: step: 1840/530, loss: 0.0035444784443825483 2023-01-24 07:13:32.729240: step: 1844/530, loss: 0.0006922088796272874 2023-01-24 07:13:33.765326: step: 1848/530, loss: 0.00549279572442174 2023-01-24 07:13:34.806997: step: 1852/530, loss: 0.005062986630946398 2023-01-24 07:13:35.869149: step: 1856/530, loss: 0.0011594189563766122 2023-01-24 07:13:36.890309: step: 1860/530, loss: 8.112152136163786e-05 2023-01-24 07:13:37.938708: step: 1864/530, loss: 0.030368462204933167 2023-01-24 07:13:38.983629: step: 1868/530, loss: 0.005716988351196051 2023-01-24 07:13:40.011709: step: 1872/530, loss: 0.009531802497804165 2023-01-24 07:13:41.048966: step: 1876/530, loss: 0.003937490750104189 2023-01-24 07:13:42.076525: step: 1880/530, loss: 0.0015087856445461512 2023-01-24 07:13:43.111343: step: 1884/530, loss: 0.008050847798585892 2023-01-24 07:13:44.177559: step: 1888/530, loss: 0.013968897983431816 2023-01-24 07:13:45.233089: step: 1892/530, loss: 0.008272671140730381 2023-01-24 07:13:46.282176: step: 1896/530, loss: 0.0004494102322496474 2023-01-24 07:13:47.325354: step: 1900/530, loss: 0.0029197088442742825 2023-01-24 07:13:48.356858: step: 1904/530, loss: 0.0011335788294672966 2023-01-24 07:13:49.393218: step: 1908/530, loss: 0.020606601610779762 2023-01-24 07:13:50.431634: step: 1912/530, loss: 0.0009659072384238243 2023-01-24 07:13:51.468765: step: 1916/530, loss: 0.005238627549260855 2023-01-24 07:13:52.530639: step: 1920/530, loss: 0.03141063451766968 2023-01-24 07:13:53.583568: step: 1924/530, loss: 0.004119644407182932 2023-01-24 07:13:54.617605: step: 1928/530, loss: 0.004491072613745928 2023-01-24 07:13:55.662138: step: 1932/530, loss: 0.003926880192011595 2023-01-24 07:13:56.695150: step: 1936/530, loss: 0.0037270341999828815 2023-01-24 07:13:57.731021: step: 1940/530, loss: 0.00832485593855381 2023-01-24 07:13:58.779389: step: 1944/530, loss: 0.0034805391915142536 2023-01-24 07:13:59.840046: step: 1948/530, loss: 0.007315187249332666 2023-01-24 07:14:00.857528: step: 1952/530, loss: 0.007283097133040428 2023-01-24 07:14:01.906899: step: 1956/530, loss: 0.0072958446107804775 2023-01-24 07:14:02.991663: step: 1960/530, loss: 0.0042175170965492725 2023-01-24 07:14:04.021952: step: 1964/530, loss: 5.311781569616869e-05 2023-01-24 07:14:05.053495: step: 1968/530, loss: 0.0035744302440434694 2023-01-24 07:14:06.094477: step: 1972/530, loss: 0.0010876110754907131 2023-01-24 07:14:07.143212: step: 1976/530, loss: 0.002590608550235629 2023-01-24 07:14:08.199470: step: 1980/530, loss: 0.00675234803929925 2023-01-24 07:14:09.261983: step: 1984/530, loss: 0.02603055350482464 2023-01-24 07:14:10.297617: step: 1988/530, loss: 0.005563122685998678 2023-01-24 07:14:11.334594: step: 1992/530, loss: 0.00038442268851213157 2023-01-24 07:14:12.367406: step: 1996/530, loss: 0.000415379909100011 2023-01-24 07:14:13.394199: step: 2000/530, loss: 0.007721236906945705 2023-01-24 07:14:14.421327: step: 2004/530, loss: 0.005578874610364437 2023-01-24 07:14:15.472073: step: 2008/530, loss: 0.001538212993182242 2023-01-24 07:14:16.519132: step: 2012/530, loss: 0.0018273445311933756 2023-01-24 07:14:17.573452: step: 2016/530, loss: 0.0002353592572035268 2023-01-24 07:14:18.618825: step: 2020/530, loss: 0.003976296167820692 2023-01-24 07:14:19.655703: step: 2024/530, loss: 0.0030448297038674355 2023-01-24 07:14:20.726182: step: 2028/530, loss: 0.006004220340400934 2023-01-24 07:14:21.772239: step: 2032/530, loss: 0.0221035648137331 2023-01-24 07:14:22.810009: step: 2036/530, loss: 5.662008697981946e-05 2023-01-24 07:14:23.858666: step: 2040/530, loss: 0.008959939703345299 2023-01-24 07:14:24.892678: step: 2044/530, loss: 0.002308865077793598 2023-01-24 07:14:25.941846: step: 2048/530, loss: 0.004059710539877415 2023-01-24 07:14:26.999385: step: 2052/530, loss: 0.004756842274218798 2023-01-24 07:14:28.048687: step: 2056/530, loss: 0.0013233455829322338 2023-01-24 07:14:29.093897: step: 2060/530, loss: 0.008637331426143646 2023-01-24 07:14:30.149058: step: 2064/530, loss: 0.0036857964005321264 2023-01-24 07:14:31.187555: step: 2068/530, loss: 0.00605457928031683 2023-01-24 07:14:32.220291: step: 2072/530, loss: 0.011533870361745358 2023-01-24 07:14:33.256296: step: 2076/530, loss: 0.01579107902944088 2023-01-24 07:14:34.313292: step: 2080/530, loss: 0.0031185075640678406 2023-01-24 07:14:35.356823: step: 2084/530, loss: 0.0025394295807927847 2023-01-24 07:14:36.410500: step: 2088/530, loss: 0.002315706806257367 2023-01-24 07:14:37.476447: step: 2092/530, loss: 0.001849551685154438 2023-01-24 07:14:38.536761: step: 2096/530, loss: 0.010271499864757061 2023-01-24 07:14:39.575331: step: 2100/530, loss: 0.0006917126011103392 2023-01-24 07:14:40.604162: step: 2104/530, loss: 0.004060756415128708 2023-01-24 07:14:41.642803: step: 2108/530, loss: 0.0023847725242376328 2023-01-24 07:14:42.674493: step: 2112/530, loss: 0.002044428139925003 2023-01-24 07:14:43.728294: step: 2116/530, loss: 0.0037294221110641956 2023-01-24 07:14:44.776149: step: 2120/530, loss: 0.00868659932166338 ================================================== Loss: 0.005 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37029128959276014, 'r': 0.3105668880455408, 'f1': 0.3378095975232198}, 'combined': 0.24891233501710933, 'stategy': 1, 'epoch': 11} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3757979351116226, 'r': 0.389614035667197, 'f1': 0.3825812913410743}, 'combined': 0.296546264101694, 'stategy': 1, 'epoch': 11} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3907643182557762, 'r': 0.32551335050149094, 'f1': 0.3551667406092872}, 'combined': 0.2617018088700011, 'stategy': 1, 'epoch': 11} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37268956361895444, 'r': 0.3689215625161893, 'f1': 0.37079599077839626}, 'combined': 0.2874112464406708, 'stategy': 1, 'epoch': 11} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3806063888240557, 'r': 0.3257181809481008, 'f1': 0.35102961423241125}, 'combined': 0.25865339996072406, 'stategy': 1, 'epoch': 11} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3628740170616423, 'r': 0.3625404931489018, 'f1': 0.36270717843310823}, 'combined': 0.28114144931178725, 'stategy': 1, 'epoch': 11} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 11} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5, 'r': 0.41304347826086957, 'f1': 0.45238095238095233}, 'combined': 0.22619047619047616, 'stategy': 1, 'epoch': 11} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 11} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37704166666666666, 'r': 0.32195208728652747, 'f1': 0.3473259979529171}, 'combined': 0.25592441954425466, 'stategy': 1, 'epoch': 6} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37621134584593835, 'r': 0.3907342102995499, 'f1': 0.3833352757492428}, 'combined': 0.29713069220754706, 'stategy': 1, 'epoch': 6} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 6} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38720415311180817, 'r': 0.33283393047371745, 'f1': 0.35796628848907985}, 'combined': 0.26376463362353253, 'stategy': 1, 'epoch': 8} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36421427197230394, 'r': 0.3625404931489018, 'f1': 0.3633754551322019}, 'combined': 0.28165944369098905, 'stategy': 1, 'epoch': 8} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 8} ****************************** Epoch: 12 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 07:17:09.702839: step: 4/530, loss: 0.0002098134864354506 2023-01-24 07:17:10.736148: step: 8/530, loss: 0.033779583871364594 2023-01-24 07:17:11.771893: step: 12/530, loss: 0.0023955267388373613 2023-01-24 07:17:12.811145: step: 16/530, loss: 0.000597143720369786 2023-01-24 07:17:13.856085: step: 20/530, loss: 0.0015304861590266228 2023-01-24 07:17:14.897862: step: 24/530, loss: 0.004038474056869745 2023-01-24 07:17:15.948006: step: 28/530, loss: 0.0035547122824937105 2023-01-24 07:17:17.005453: step: 32/530, loss: 8.435960626229644e-05 2023-01-24 07:17:18.038916: step: 36/530, loss: 6.203541943250457e-06 2023-01-24 07:17:19.101803: step: 40/530, loss: 0.006693084258586168 2023-01-24 07:17:20.160308: step: 44/530, loss: 0.013135098852217197 2023-01-24 07:17:21.225049: step: 48/530, loss: 0.0016470348928123713 2023-01-24 07:17:22.284955: step: 52/530, loss: 0.0039216866716742516 2023-01-24 07:17:23.327395: step: 56/530, loss: 9.481578672421165e-06 2023-01-24 07:17:24.384223: step: 60/530, loss: 0.0037431931123137474 2023-01-24 07:17:25.416675: step: 64/530, loss: 0.007498991210013628 2023-01-24 07:17:26.447886: step: 68/530, loss: 0.002700318116694689 2023-01-24 07:17:27.483527: step: 72/530, loss: 0.008197540417313576 2023-01-24 07:17:28.527267: step: 76/530, loss: 0.0007971164304763079 2023-01-24 07:17:29.544756: step: 80/530, loss: 0.0027596834115684032 2023-01-24 07:17:30.579563: step: 84/530, loss: 0.009794579818844795 2023-01-24 07:17:31.614143: step: 88/530, loss: 0.0028697459492832422 2023-01-24 07:17:32.652833: step: 92/530, loss: 0.009943623095750809 2023-01-24 07:17:33.719325: step: 96/530, loss: 0.03528591990470886 2023-01-24 07:17:34.757632: step: 100/530, loss: 0.0034879918675869703 2023-01-24 07:17:35.801216: step: 104/530, loss: 0.00262234965339303 2023-01-24 07:17:36.860791: step: 108/530, loss: 0.0032907037530094385 2023-01-24 07:17:37.923199: step: 112/530, loss: 0.00034220938687212765 2023-01-24 07:17:38.962998: step: 116/530, loss: 2.608080285426695e-05 2023-01-24 07:17:40.000417: step: 120/530, loss: 0.006654891185462475 2023-01-24 07:17:41.043460: step: 124/530, loss: 0.003869660198688507 2023-01-24 07:17:42.077420: step: 128/530, loss: 0.0020381638314574957 2023-01-24 07:17:43.122442: step: 132/530, loss: 0.0001978184300241992 2023-01-24 07:17:44.169410: step: 136/530, loss: 0.00815041083842516 2023-01-24 07:17:45.215184: step: 140/530, loss: 0.0018543227342888713 2023-01-24 07:17:46.270014: step: 144/530, loss: 0.0017679610755294561 2023-01-24 07:17:47.355032: step: 148/530, loss: 0.002873451681807637 2023-01-24 07:17:48.410948: step: 152/530, loss: 0.0010104554239660501 2023-01-24 07:17:49.454655: step: 156/530, loss: 0.001551167108118534 2023-01-24 07:17:50.516057: step: 160/530, loss: 0.0031594280153512955 2023-01-24 07:17:51.560928: step: 164/530, loss: 0.011970771476626396 2023-01-24 07:17:52.627355: step: 168/530, loss: 0.009992629289627075 2023-01-24 07:17:53.663336: step: 172/530, loss: 0.004959688056260347 2023-01-24 07:17:54.708945: step: 176/530, loss: 0.001493844436481595 2023-01-24 07:17:55.791659: step: 180/530, loss: 0.007817437872290611 2023-01-24 07:17:56.823562: step: 184/530, loss: 0.002572344383224845 2023-01-24 07:17:57.866932: step: 188/530, loss: 0.0009903431637212634 2023-01-24 07:17:58.915653: step: 192/530, loss: 0.0005465737194754183 2023-01-24 07:17:59.960203: step: 196/530, loss: 0.002872624434530735 2023-01-24 07:18:01.008026: step: 200/530, loss: 0.0024414220824837685 2023-01-24 07:18:02.059629: step: 204/530, loss: 0.0009540935861878097 2023-01-24 07:18:03.108389: step: 208/530, loss: 0.0010491018183529377 2023-01-24 07:18:04.156069: step: 212/530, loss: 0.0054084244184195995 2023-01-24 07:18:05.201396: step: 216/530, loss: 2.3314871214097366e-05 2023-01-24 07:18:06.261469: step: 220/530, loss: 0.005042777396738529 2023-01-24 07:18:07.311292: step: 224/530, loss: 0.001870562438853085 2023-01-24 07:18:08.367437: step: 228/530, loss: 0.010852418839931488 2023-01-24 07:18:09.418507: step: 232/530, loss: 0.006877579260617495 2023-01-24 07:18:10.456758: step: 236/530, loss: 0.0007135175983421504 2023-01-24 07:18:11.499545: step: 240/530, loss: 0.0014545349404215813 2023-01-24 07:18:12.564328: step: 244/530, loss: 0.0016862108604982495 2023-01-24 07:18:13.630103: step: 248/530, loss: 0.0029115641955286264 2023-01-24 07:18:14.676441: step: 252/530, loss: 0.0021626609377563 2023-01-24 07:18:15.729201: step: 256/530, loss: 0.005136611871421337 2023-01-24 07:18:16.766109: step: 260/530, loss: 0.012904365547001362 2023-01-24 07:18:17.817443: step: 264/530, loss: 0.005243342369794846 2023-01-24 07:18:18.873617: step: 268/530, loss: 3.0413202694035135e-06 2023-01-24 07:18:19.929565: step: 272/530, loss: 0.005616612732410431 2023-01-24 07:18:20.990333: step: 276/530, loss: 0.0077189975418150425 2023-01-24 07:18:22.038991: step: 280/530, loss: 0.0020084225106984377 2023-01-24 07:18:23.061769: step: 284/530, loss: 0.000200699592824094 2023-01-24 07:18:24.107684: step: 288/530, loss: 0.0007427338277921081 2023-01-24 07:18:25.149267: step: 292/530, loss: 0.0035736786667257547 2023-01-24 07:18:26.213902: step: 296/530, loss: 0.0026529652532190084 2023-01-24 07:18:27.262523: step: 300/530, loss: 0.0012337294174358249 2023-01-24 07:18:28.317592: step: 304/530, loss: 0.00526558980345726 2023-01-24 07:18:29.363517: step: 308/530, loss: 0.002192672109231353 2023-01-24 07:18:30.415742: step: 312/530, loss: 0.0008886989089660347 2023-01-24 07:18:31.470352: step: 316/530, loss: 0.003497776575386524 2023-01-24 07:18:32.518192: step: 320/530, loss: 0.0018555395072326064 2023-01-24 07:18:33.563248: step: 324/530, loss: 0.004081949591636658 2023-01-24 07:18:34.618137: step: 328/530, loss: 0.0022255147341638803 2023-01-24 07:18:35.669276: step: 332/530, loss: 0.00015214842278510332 2023-01-24 07:18:36.736515: step: 336/530, loss: 0.0017819913337007165 2023-01-24 07:18:37.787739: step: 340/530, loss: 0.0015917300479486585 2023-01-24 07:18:38.839996: step: 344/530, loss: 0.00018158002058044076 2023-01-24 07:18:39.877540: step: 348/530, loss: 0.00040777577669359744 2023-01-24 07:18:40.935039: step: 352/530, loss: 0.0012022678274661303 2023-01-24 07:18:41.961209: step: 356/530, loss: 0.008302228525280952 2023-01-24 07:18:43.008445: step: 360/530, loss: 0.002529502846300602 2023-01-24 07:18:44.055774: step: 364/530, loss: 0.0023683158215135336 2023-01-24 07:18:45.103120: step: 368/530, loss: 0.015279468148946762 2023-01-24 07:18:46.152648: step: 372/530, loss: 0.0036307775881141424 2023-01-24 07:18:47.218019: step: 376/530, loss: 0.003783815773203969 2023-01-24 07:18:48.258252: step: 380/530, loss: 0.004744145553559065 2023-01-24 07:18:49.311046: step: 384/530, loss: 0.001663829549215734 2023-01-24 07:18:50.378396: step: 388/530, loss: 0.0013454323634505272 2023-01-24 07:18:51.424072: step: 392/530, loss: 0.002568910364061594 2023-01-24 07:18:52.472275: step: 396/530, loss: 0.011700435541570187 2023-01-24 07:18:53.519856: step: 400/530, loss: 0.0002411395835224539 2023-01-24 07:18:54.575711: step: 404/530, loss: 0.007561087608337402 2023-01-24 07:18:55.608916: step: 408/530, loss: 7.613570573994366e-07 2023-01-24 07:18:56.648498: step: 412/530, loss: 6.0423910326790065e-05 2023-01-24 07:18:57.706227: step: 416/530, loss: 0.005288333166390657 2023-01-24 07:18:58.753950: step: 420/530, loss: 0.0037153270095586777 2023-01-24 07:18:59.790320: step: 424/530, loss: 0.004138066899031401 2023-01-24 07:19:00.833982: step: 428/530, loss: 0.011536558158695698 2023-01-24 07:19:01.872089: step: 432/530, loss: 0.000436519825598225 2023-01-24 07:19:02.946197: step: 436/530, loss: 0.006147042382508516 2023-01-24 07:19:03.997814: step: 440/530, loss: 0.0058008343912661076 2023-01-24 07:19:05.029998: step: 444/530, loss: 5.1854538469342515e-05 2023-01-24 07:19:06.084169: step: 448/530, loss: 0.0025187800638377666 2023-01-24 07:19:07.161288: step: 452/530, loss: 0.006841473747044802 2023-01-24 07:19:08.210197: step: 456/530, loss: 0.00014648000069428235 2023-01-24 07:19:09.251584: step: 460/530, loss: 6.161403871374205e-05 2023-01-24 07:19:10.296051: step: 464/530, loss: 0.004762462805956602 2023-01-24 07:19:11.348532: step: 468/530, loss: 0.004971724934875965 2023-01-24 07:19:12.418097: step: 472/530, loss: 0.0063550760969519615 2023-01-24 07:19:13.453700: step: 476/530, loss: 0.00108983158133924 2023-01-24 07:19:14.500867: step: 480/530, loss: 0.0016724548768252134 2023-01-24 07:19:15.543902: step: 484/530, loss: 0.00010766657942440361 2023-01-24 07:19:16.586376: step: 488/530, loss: 0.011752878315746784 2023-01-24 07:19:17.649881: step: 492/530, loss: 0.0019836928695440292 2023-01-24 07:19:18.710002: step: 496/530, loss: 0.001976546598598361 2023-01-24 07:19:19.774360: step: 500/530, loss: 0.004593879450112581 2023-01-24 07:19:20.825580: step: 504/530, loss: 0.0018722822424024343 2023-01-24 07:19:21.887701: step: 508/530, loss: 0.0005927394377067685 2023-01-24 07:19:22.935694: step: 512/530, loss: 0.004643979016691446 2023-01-24 07:19:23.972503: step: 516/530, loss: 0.0007006069645285606 2023-01-24 07:19:25.014238: step: 520/530, loss: 0.004949643276631832 2023-01-24 07:19:26.070315: step: 524/530, loss: 0.009754087775945663 2023-01-24 07:19:27.120001: step: 528/530, loss: 0.004312986508011818 2023-01-24 07:19:28.164326: step: 532/530, loss: 0.009008606895804405 2023-01-24 07:19:29.207822: step: 536/530, loss: 0.0003606323734857142 2023-01-24 07:19:30.267545: step: 540/530, loss: 0.0027230042032897472 2023-01-24 07:19:31.311086: step: 544/530, loss: 0.013823960907757282 2023-01-24 07:19:32.373630: step: 548/530, loss: 0.015406623482704163 2023-01-24 07:19:33.422545: step: 552/530, loss: 0.0053239911794662476 2023-01-24 07:19:34.466789: step: 556/530, loss: 0.017090929672122 2023-01-24 07:19:35.530807: step: 560/530, loss: 0.005778525024652481 2023-01-24 07:19:36.580026: step: 564/530, loss: 0.006856540683656931 2023-01-24 07:19:37.636281: step: 568/530, loss: 0.003494675038382411 2023-01-24 07:19:38.678279: step: 572/530, loss: 0.0002908333844970912 2023-01-24 07:19:39.724544: step: 576/530, loss: 0.00804196111857891 2023-01-24 07:19:40.770978: step: 580/530, loss: 0.003090738086029887 2023-01-24 07:19:41.817391: step: 584/530, loss: 0.004739857278764248 2023-01-24 07:19:42.872167: step: 588/530, loss: 0.005519860424101353 2023-01-24 07:19:43.915247: step: 592/530, loss: 0.0008785635000094771 2023-01-24 07:19:44.969008: step: 596/530, loss: 0.008111746981739998 2023-01-24 07:19:46.020701: step: 600/530, loss: 0.014484434388577938 2023-01-24 07:19:47.069398: step: 604/530, loss: 0.005458177998661995 2023-01-24 07:19:48.115685: step: 608/530, loss: 0.002368542132899165 2023-01-24 07:19:49.165137: step: 612/530, loss: 0.0012129952665418386 2023-01-24 07:19:50.211620: step: 616/530, loss: 0.00016289466293528676 2023-01-24 07:19:51.257059: step: 620/530, loss: 0.0018954677507281303 2023-01-24 07:19:52.309801: step: 624/530, loss: 0.007410240825265646 2023-01-24 07:19:53.367407: step: 628/530, loss: 0.0035863411612808704 2023-01-24 07:19:54.419886: step: 632/530, loss: 0.00589687330648303 2023-01-24 07:19:55.475047: step: 636/530, loss: 0.0027452362701296806 2023-01-24 07:19:56.512587: step: 640/530, loss: 0.0008080213447101414 2023-01-24 07:19:57.561052: step: 644/530, loss: 0.0007217864622361958 2023-01-24 07:19:58.610937: step: 648/530, loss: 0.005689879413694143 2023-01-24 07:19:59.666604: step: 652/530, loss: 5.123640221427195e-05 2023-01-24 07:20:00.720708: step: 656/530, loss: 0.004865794442594051 2023-01-24 07:20:01.767042: step: 660/530, loss: 3.063065742026083e-05 2023-01-24 07:20:02.825413: step: 664/530, loss: 0.0009470180375501513 2023-01-24 07:20:03.887013: step: 668/530, loss: 0.002904303604736924 2023-01-24 07:20:04.943142: step: 672/530, loss: 0.006766879931092262 2023-01-24 07:20:05.973892: step: 676/530, loss: 0.0010938975028693676 2023-01-24 07:20:07.005080: step: 680/530, loss: 0.0005955899832770228 2023-01-24 07:20:08.061010: step: 684/530, loss: 0.011389659717679024 2023-01-24 07:20:09.104143: step: 688/530, loss: 0.0029171837959438562 2023-01-24 07:20:10.135356: step: 692/530, loss: 0.00016324837633874267 2023-01-24 07:20:11.179161: step: 696/530, loss: 0.0028112668078392744 2023-01-24 07:20:12.206624: step: 700/530, loss: 0.0013409480452537537 2023-01-24 07:20:13.255087: step: 704/530, loss: 0.008898143656551838 2023-01-24 07:20:14.306283: step: 708/530, loss: 0.004181708209216595 2023-01-24 07:20:15.353910: step: 712/530, loss: 0.0019403608748689294 2023-01-24 07:20:16.391495: step: 716/530, loss: 0.004969300702214241 2023-01-24 07:20:17.434230: step: 720/530, loss: 0.00036568247014656663 2023-01-24 07:20:18.492646: step: 724/530, loss: 0.0012061306042596698 2023-01-24 07:20:19.556030: step: 728/530, loss: 0.0020278675947338343 2023-01-24 07:20:20.596132: step: 732/530, loss: 0.001116099301725626 2023-01-24 07:20:21.636717: step: 736/530, loss: 0.0037191968876868486 2023-01-24 07:20:22.682860: step: 740/530, loss: 0.008039727807044983 2023-01-24 07:20:23.722873: step: 744/530, loss: 2.126537037838716e-05 2023-01-24 07:20:24.772929: step: 748/530, loss: 0.002352700103074312 2023-01-24 07:20:25.798588: step: 752/530, loss: 0.023162314668297768 2023-01-24 07:20:26.862789: step: 756/530, loss: 0.003155795158818364 2023-01-24 07:20:27.915853: step: 760/530, loss: 0.0060104867443442345 2023-01-24 07:20:28.968040: step: 764/530, loss: 0.006539924070239067 2023-01-24 07:20:30.008773: step: 768/530, loss: 0.031132902950048447 2023-01-24 07:20:31.064213: step: 772/530, loss: 7.505480607505888e-05 2023-01-24 07:20:32.131102: step: 776/530, loss: 0.012613949365913868 2023-01-24 07:20:33.186056: step: 780/530, loss: 0.01499087642878294 2023-01-24 07:20:34.238703: step: 784/530, loss: 0.010055623017251492 2023-01-24 07:20:35.275603: step: 788/530, loss: 0.001072186278179288 2023-01-24 07:20:36.311442: step: 792/530, loss: 0.002134459326043725 2023-01-24 07:20:37.366514: step: 796/530, loss: 0.0011044758139178157 2023-01-24 07:20:38.421506: step: 800/530, loss: 0.00104897515848279 2023-01-24 07:20:39.453364: step: 804/530, loss: 0.003274880815297365 2023-01-24 07:20:40.496712: step: 808/530, loss: 0.00865128356963396 2023-01-24 07:20:41.536560: step: 812/530, loss: 0.006183304358273745 2023-01-24 07:20:42.580824: step: 816/530, loss: 0.00017106109589803964 2023-01-24 07:20:43.623660: step: 820/530, loss: 0.00031705936999060214 2023-01-24 07:20:44.655565: step: 824/530, loss: 0.0022580043878406286 2023-01-24 07:20:45.712159: step: 828/530, loss: 9.106863581109792e-05 2023-01-24 07:20:46.748172: step: 832/530, loss: 0.0025899119209498167 2023-01-24 07:20:47.796190: step: 836/530, loss: 0.004209454637020826 2023-01-24 07:20:48.849052: step: 840/530, loss: 0.0011600167490541935 2023-01-24 07:20:49.889920: step: 844/530, loss: 0.012773072347044945 2023-01-24 07:20:50.931523: step: 848/530, loss: 6.810516788391396e-05 2023-01-24 07:20:51.978114: step: 852/530, loss: 0.0033851061016321182 2023-01-24 07:20:53.022364: step: 856/530, loss: 1.8227445252705365e-05 2023-01-24 07:20:54.088122: step: 860/530, loss: 0.0021093892864882946 2023-01-24 07:20:55.146093: step: 864/530, loss: 0.0023472122848033905 2023-01-24 07:20:56.192353: step: 868/530, loss: 0.003328170860186219 2023-01-24 07:20:57.234821: step: 872/530, loss: 0.0007086084224283695 2023-01-24 07:20:58.260776: step: 876/530, loss: 0.0012577767483890057 2023-01-24 07:20:59.289616: step: 880/530, loss: 0.002273960504680872 2023-01-24 07:21:00.321640: step: 884/530, loss: 0.0019835445564240217 2023-01-24 07:21:01.379985: step: 888/530, loss: 0.00939200259745121 2023-01-24 07:21:02.425451: step: 892/530, loss: 0.001002413802780211 2023-01-24 07:21:03.477298: step: 896/530, loss: 0.002918391954153776 2023-01-24 07:21:04.521931: step: 900/530, loss: 0.006270183715969324 2023-01-24 07:21:05.538838: step: 904/530, loss: 0.0003226775152143091 2023-01-24 07:21:06.581626: step: 908/530, loss: 0.0002985780010931194 2023-01-24 07:21:07.634977: step: 912/530, loss: 0.00126753025688231 2023-01-24 07:21:08.674877: step: 916/530, loss: 0.002424656180664897 2023-01-24 07:21:09.710405: step: 920/530, loss: 0.001331451116129756 2023-01-24 07:21:10.745842: step: 924/530, loss: 0.0037289857864379883 2023-01-24 07:21:11.816850: step: 928/530, loss: 0.008709922432899475 2023-01-24 07:21:12.855652: step: 932/530, loss: 4.713838643510826e-05 2023-01-24 07:21:13.907064: step: 936/530, loss: 0.0006879171123728156 2023-01-24 07:21:14.954927: step: 940/530, loss: 0.0015554639976471663 2023-01-24 07:21:15.990186: step: 944/530, loss: 0.006880404427647591 2023-01-24 07:21:17.032537: step: 948/530, loss: 0.002029820578172803 2023-01-24 07:21:18.076327: step: 952/530, loss: 0.005209110211580992 2023-01-24 07:21:19.139784: step: 956/530, loss: 0.006262167356908321 2023-01-24 07:21:20.201332: step: 960/530, loss: 0.0005445873248390853 2023-01-24 07:21:21.249419: step: 964/530, loss: 0.009287801571190357 2023-01-24 07:21:22.282007: step: 968/530, loss: 0.0017832937883213162 2023-01-24 07:21:23.335935: step: 972/530, loss: 0.0066197956912219524 2023-01-24 07:21:24.377684: step: 976/530, loss: 0.0031681323889642954 2023-01-24 07:21:25.434349: step: 980/530, loss: 0.00193797389511019 2023-01-24 07:21:26.472890: step: 984/530, loss: 0.0006818838883191347 2023-01-24 07:21:27.528841: step: 988/530, loss: 0.005947432946413755 2023-01-24 07:21:28.586986: step: 992/530, loss: 0.00014374639431480318 2023-01-24 07:21:29.618948: step: 996/530, loss: 0.0027578489389270544 2023-01-24 07:21:30.681253: step: 1000/530, loss: 0.00670988904312253 2023-01-24 07:21:31.743932: step: 1004/530, loss: 0.0037533906288444996 2023-01-24 07:21:32.790965: step: 1008/530, loss: 0.007830151356756687 2023-01-24 07:21:33.825922: step: 1012/530, loss: 0.0010340377921238542 2023-01-24 07:21:34.877536: step: 1016/530, loss: 0.0038095011841505766 2023-01-24 07:21:35.908138: step: 1020/530, loss: 0.00020850585133302957 2023-01-24 07:21:36.943431: step: 1024/530, loss: 0.0 2023-01-24 07:21:37.985730: step: 1028/530, loss: 0.014278216287493706 2023-01-24 07:21:39.036908: step: 1032/530, loss: 0.001539278426207602 2023-01-24 07:21:40.066770: step: 1036/530, loss: 0.004220576956868172 2023-01-24 07:21:41.119532: step: 1040/530, loss: 0.006350742653012276 2023-01-24 07:21:42.173467: step: 1044/530, loss: 0.002821509260684252 2023-01-24 07:21:43.231865: step: 1048/530, loss: 0.002168116858229041 2023-01-24 07:21:44.272698: step: 1052/530, loss: 0.0009608911350369453 2023-01-24 07:21:45.317916: step: 1056/530, loss: 0.0005167686031199992 2023-01-24 07:21:46.378536: step: 1060/530, loss: 0.00890722218900919 2023-01-24 07:21:47.425030: step: 1064/530, loss: 0.002377914497628808 2023-01-24 07:21:48.481647: step: 1068/530, loss: 0.005166775081306696 2023-01-24 07:21:49.539475: step: 1072/530, loss: 0.004172053653746843 2023-01-24 07:21:50.624213: step: 1076/530, loss: 0.0006449891370721161 2023-01-24 07:21:51.659265: step: 1080/530, loss: 0.001498655998148024 2023-01-24 07:21:52.711301: step: 1084/530, loss: 0.005240730941295624 2023-01-24 07:21:53.757198: step: 1088/530, loss: 0.0029189996421337128 2023-01-24 07:21:54.801634: step: 1092/530, loss: 0.0036901573184877634 2023-01-24 07:21:55.840345: step: 1096/530, loss: 0.0030313222669065 2023-01-24 07:21:56.879985: step: 1100/530, loss: 0.0019233659841120243 2023-01-24 07:21:57.935732: step: 1104/530, loss: 0.0004474167653825134 2023-01-24 07:21:59.000352: step: 1108/530, loss: 0.00304612098261714 2023-01-24 07:22:00.054347: step: 1112/530, loss: 0.008172928355634212 2023-01-24 07:22:01.118328: step: 1116/530, loss: 0.0007721254951320589 2023-01-24 07:22:02.169786: step: 1120/530, loss: 9.270858572563156e-05 2023-01-24 07:22:03.241440: step: 1124/530, loss: 0.0010874532163143158 2023-01-24 07:22:04.324788: step: 1128/530, loss: 0.009353571571409702 2023-01-24 07:22:05.367637: step: 1132/530, loss: 0.007798335049301386 2023-01-24 07:22:06.405670: step: 1136/530, loss: 1.560855162097141e-05 2023-01-24 07:22:07.438313: step: 1140/530, loss: 0.0004388349479995668 2023-01-24 07:22:08.499579: step: 1144/530, loss: 0.0017336965538561344 2023-01-24 07:22:09.545436: step: 1148/530, loss: 0.0002440254029352218 2023-01-24 07:22:10.571629: step: 1152/530, loss: 0.013340502977371216 2023-01-24 07:22:11.613511: step: 1156/530, loss: 0.025634698569774628 2023-01-24 07:22:12.670246: step: 1160/530, loss: 0.008832289837300777 2023-01-24 07:22:13.722088: step: 1164/530, loss: 0.0037085632793605328 2023-01-24 07:22:14.747440: step: 1168/530, loss: 0.002268877113237977 2023-01-24 07:22:15.797122: step: 1172/530, loss: 0.002775707747787237 2023-01-24 07:22:16.871112: step: 1176/530, loss: 0.005364735145121813 2023-01-24 07:22:17.911745: step: 1180/530, loss: 0.0016359073342755437 2023-01-24 07:22:18.943944: step: 1184/530, loss: 0.00252917455509305 2023-01-24 07:22:19.985578: step: 1188/530, loss: 0.0025797623675316572 2023-01-24 07:22:21.034490: step: 1192/530, loss: 0.0 2023-01-24 07:22:22.107667: step: 1196/530, loss: 0.007662640418857336 2023-01-24 07:22:23.163854: step: 1200/530, loss: 0.005358402151614428 2023-01-24 07:22:24.210716: step: 1204/530, loss: 0.0046693007461726665 2023-01-24 07:22:25.261945: step: 1208/530, loss: 0.006806109566241503 2023-01-24 07:22:26.305924: step: 1212/530, loss: 0.003967630676925182 2023-01-24 07:22:27.333200: step: 1216/530, loss: 0.001612030086107552 2023-01-24 07:22:28.383320: step: 1220/530, loss: 0.0044658915139734745 2023-01-24 07:22:29.426001: step: 1224/530, loss: 0.004679975565522909 2023-01-24 07:22:30.462152: step: 1228/530, loss: 8.977941615739837e-05 2023-01-24 07:22:31.478283: step: 1232/530, loss: 0.0017979200929403305 2023-01-24 07:22:32.527588: step: 1236/530, loss: 0.0020674855913966894 2023-01-24 07:22:33.590851: step: 1240/530, loss: 0.0010735800024122 2023-01-24 07:22:34.620113: step: 1244/530, loss: 0.0045592705719172955 2023-01-24 07:22:35.666421: step: 1248/530, loss: 0.00034399895230308175 2023-01-24 07:22:36.711284: step: 1252/530, loss: 0.0008495797519572079 2023-01-24 07:22:37.758621: step: 1256/530, loss: 0.0054959505796432495 2023-01-24 07:22:38.816684: step: 1260/530, loss: 0.0004950312431901693 2023-01-24 07:22:39.862073: step: 1264/530, loss: 0.008217941038310528 2023-01-24 07:22:40.897637: step: 1268/530, loss: 0.007245768792927265 2023-01-24 07:22:41.949334: step: 1272/530, loss: 0.0027825292199850082 2023-01-24 07:22:42.988733: step: 1276/530, loss: 0.005645498633384705 2023-01-24 07:22:44.039767: step: 1280/530, loss: 0.0021553447004407644 2023-01-24 07:22:45.088926: step: 1284/530, loss: 0.003945991396903992 2023-01-24 07:22:46.125234: step: 1288/530, loss: 0.004809791687875986 2023-01-24 07:22:47.168756: step: 1292/530, loss: 0.002229788340628147 2023-01-24 07:22:48.205419: step: 1296/530, loss: 0.005427020136266947 2023-01-24 07:22:49.242823: step: 1300/530, loss: 0.004163031466305256 2023-01-24 07:22:50.277280: step: 1304/530, loss: 0.0010832385160028934 2023-01-24 07:22:51.336764: step: 1308/530, loss: 0.003033717628568411 2023-01-24 07:22:52.387138: step: 1312/530, loss: 0.014169587753713131 2023-01-24 07:22:53.438379: step: 1316/530, loss: 0.009973904117941856 2023-01-24 07:22:54.484900: step: 1320/530, loss: 0.006365509703755379 2023-01-24 07:22:55.515717: step: 1324/530, loss: 0.004413762129843235 2023-01-24 07:22:56.597705: step: 1328/530, loss: 0.003817374352365732 2023-01-24 07:22:57.649016: step: 1332/530, loss: 0.00264952564612031 2023-01-24 07:22:58.698067: step: 1336/530, loss: 0.0036176862195134163 2023-01-24 07:22:59.743298: step: 1340/530, loss: 0.001303567667491734 2023-01-24 07:23:00.780236: step: 1344/530, loss: 0.008924799039959908 2023-01-24 07:23:01.815914: step: 1348/530, loss: 0.009997577406466007 2023-01-24 07:23:02.865292: step: 1352/530, loss: 0.005217531230300665 2023-01-24 07:23:03.914509: step: 1356/530, loss: 0.004641849081963301 2023-01-24 07:23:04.969086: step: 1360/530, loss: 0.0008019140805117786 2023-01-24 07:23:06.022164: step: 1364/530, loss: 0.003105561016127467 2023-01-24 07:23:07.079536: step: 1368/530, loss: 0.004437734838575125 2023-01-24 07:23:08.129798: step: 1372/530, loss: 0.001108279568143189 2023-01-24 07:23:09.180097: step: 1376/530, loss: 0.0011244243942201138 2023-01-24 07:23:10.240067: step: 1380/530, loss: 0.0003110711113549769 2023-01-24 07:23:11.273440: step: 1384/530, loss: 0.0006829272606410086 2023-01-24 07:23:12.316207: step: 1388/530, loss: 0.0016583200776949525 2023-01-24 07:23:13.350648: step: 1392/530, loss: 0.001666699186898768 2023-01-24 07:23:14.392572: step: 1396/530, loss: 0.0020556470844894648 2023-01-24 07:23:15.425817: step: 1400/530, loss: 0.0001240190613316372 2023-01-24 07:23:16.471718: step: 1404/530, loss: 3.0134942790027708e-05 2023-01-24 07:23:17.520110: step: 1408/530, loss: 0.009231225587427616 2023-01-24 07:23:18.568752: step: 1412/530, loss: 0.0013545748079195619 2023-01-24 07:23:19.597901: step: 1416/530, loss: 2.4635108275106177e-05 2023-01-24 07:23:20.640725: step: 1420/530, loss: 0.013833350501954556 2023-01-24 07:23:21.685270: step: 1424/530, loss: 0.0015261200023815036 2023-01-24 07:23:22.722674: step: 1428/530, loss: 0.006960385479032993 2023-01-24 07:23:23.771217: step: 1432/530, loss: 1.0679212891773204e-06 2023-01-24 07:23:24.802314: step: 1436/530, loss: 0.010158493183553219 2023-01-24 07:23:25.838712: step: 1440/530, loss: 0.00017221782763954252 2023-01-24 07:23:26.873433: step: 1444/530, loss: 0.0034154686145484447 2023-01-24 07:23:27.921032: step: 1448/530, loss: 0.00013024620420765132 2023-01-24 07:23:28.971240: step: 1452/530, loss: 0.03434533625841141 2023-01-24 07:23:30.006666: step: 1456/530, loss: 0.00020123642752878368 2023-01-24 07:23:31.045682: step: 1460/530, loss: 0.010088873095810413 2023-01-24 07:23:32.100201: step: 1464/530, loss: 0.004612664692103863 2023-01-24 07:23:33.164615: step: 1468/530, loss: 0.03448980674147606 2023-01-24 07:23:34.193764: step: 1472/530, loss: 0.0001364069030387327 2023-01-24 07:23:35.231096: step: 1476/530, loss: 0.006621548905968666 2023-01-24 07:23:36.275181: step: 1480/530, loss: 0.0016558353090658784 2023-01-24 07:23:37.322523: step: 1484/530, loss: 0.0005234894924797118 2023-01-24 07:23:38.372164: step: 1488/530, loss: 0.010724452324211597 2023-01-24 07:23:39.418639: step: 1492/530, loss: 0.00606974633410573 2023-01-24 07:23:40.457524: step: 1496/530, loss: 0.00652778334915638 2023-01-24 07:23:41.493785: step: 1500/530, loss: 0.0005637799040414393 2023-01-24 07:23:42.550212: step: 1504/530, loss: 0.001750711351633072 2023-01-24 07:23:43.573327: step: 1508/530, loss: 0.008610162883996964 2023-01-24 07:23:44.616354: step: 1512/530, loss: 0.00014456934877671301 2023-01-24 07:23:45.672101: step: 1516/530, loss: 0.0009633276495151222 2023-01-24 07:23:46.710348: step: 1520/530, loss: 0.0002715626615099609 2023-01-24 07:23:47.756141: step: 1524/530, loss: 0.016622448340058327 2023-01-24 07:23:48.803453: step: 1528/530, loss: 0.018680144101381302 2023-01-24 07:23:49.847811: step: 1532/530, loss: 0.00033977319253608584 2023-01-24 07:23:50.890782: step: 1536/530, loss: 0.006149570923298597 2023-01-24 07:23:51.930377: step: 1540/530, loss: 0.005944901145994663 2023-01-24 07:23:52.963032: step: 1544/530, loss: 0.0068020387552678585 2023-01-24 07:23:53.999448: step: 1548/530, loss: 0.006000378634780645 2023-01-24 07:23:55.050290: step: 1552/530, loss: 0.005835102871060371 2023-01-24 07:23:56.081604: step: 1556/530, loss: 0.001768456189893186 2023-01-24 07:23:57.132237: step: 1560/530, loss: 0.0017500862013548613 2023-01-24 07:23:58.181660: step: 1564/530, loss: 0.004923265427350998 2023-01-24 07:23:59.230431: step: 1568/530, loss: 0.0028214200865477324 2023-01-24 07:24:00.259684: step: 1572/530, loss: 2.5458388336119242e-05 2023-01-24 07:24:01.299694: step: 1576/530, loss: 0.0007640895782969892 2023-01-24 07:24:02.331288: step: 1580/530, loss: 0.0015298749785870314 2023-01-24 07:24:03.382704: step: 1584/530, loss: 0.0024504277389496565 2023-01-24 07:24:04.410575: step: 1588/530, loss: 0.0002578197745606303 2023-01-24 07:24:05.459255: step: 1592/530, loss: 0.006138334050774574 2023-01-24 07:24:06.494358: step: 1596/530, loss: 0.000377841352019459 2023-01-24 07:24:07.528917: step: 1600/530, loss: 0.01051326934248209 2023-01-24 07:24:08.564510: step: 1604/530, loss: 0.0025168282445520163 2023-01-24 07:24:09.630111: step: 1608/530, loss: 0.0026044489350169897 2023-01-24 07:24:10.676889: step: 1612/530, loss: 0.00027407993911765516 2023-01-24 07:24:11.712069: step: 1616/530, loss: 0.012971087358891964 2023-01-24 07:24:12.745112: step: 1620/530, loss: 0.00045866359141655266 2023-01-24 07:24:13.788418: step: 1624/530, loss: 0.001111815683543682 2023-01-24 07:24:14.824491: step: 1628/530, loss: 0.004980051424354315 2023-01-24 07:24:15.863648: step: 1632/530, loss: 0.0003353085194248706 2023-01-24 07:24:16.905892: step: 1636/530, loss: 0.0007205993169918656 2023-01-24 07:24:17.959651: step: 1640/530, loss: 0.004817973356693983 2023-01-24 07:24:18.988662: step: 1644/530, loss: 0.002096210839226842 2023-01-24 07:24:20.029283: step: 1648/530, loss: 0.0009020436555147171 2023-01-24 07:24:21.078957: step: 1652/530, loss: 0.0016669457545503974 2023-01-24 07:24:22.121333: step: 1656/530, loss: 0.0023536181543022394 2023-01-24 07:24:23.160238: step: 1660/530, loss: 0.002634019125252962 2023-01-24 07:24:24.192836: step: 1664/530, loss: 0.0004650855262298137 2023-01-24 07:24:25.218516: step: 1668/530, loss: 3.0767869247938506e-06 2023-01-24 07:24:26.254240: step: 1672/530, loss: 0.0020296969451010227 2023-01-24 07:24:27.295080: step: 1676/530, loss: 0.010251333005726337 2023-01-24 07:24:28.348803: step: 1680/530, loss: 0.0019116174662485719 2023-01-24 07:24:29.392193: step: 1684/530, loss: 0.002041993662714958 2023-01-24 07:24:30.422751: step: 1688/530, loss: 0.0005865368293598294 2023-01-24 07:24:31.468413: step: 1692/530, loss: 0.006311272270977497 2023-01-24 07:24:32.518689: step: 1696/530, loss: 0.001400873064994812 2023-01-24 07:24:33.553995: step: 1700/530, loss: 0.00434342073276639 2023-01-24 07:24:34.602467: step: 1704/530, loss: 0.025829633697867393 2023-01-24 07:24:35.668016: step: 1708/530, loss: 0.0006744025740772486 2023-01-24 07:24:36.712506: step: 1712/530, loss: 0.03393099457025528 2023-01-24 07:24:37.751766: step: 1716/530, loss: 0.0016020622570067644 2023-01-24 07:24:38.790955: step: 1720/530, loss: 0.0051536038517951965 2023-01-24 07:24:39.832803: step: 1724/530, loss: 0.0013604526175186038 2023-01-24 07:24:40.874566: step: 1728/530, loss: 0.002191638108342886 2023-01-24 07:24:41.909383: step: 1732/530, loss: 0.004143086262047291 2023-01-24 07:24:42.939565: step: 1736/530, loss: 0.001980945933610201 2023-01-24 07:24:43.979764: step: 1740/530, loss: 0.0033146373461931944 2023-01-24 07:24:45.032330: step: 1744/530, loss: 0.0008635398116894066 2023-01-24 07:24:46.084338: step: 1748/530, loss: 0.0007993154576979578 2023-01-24 07:24:47.119473: step: 1752/530, loss: 0.007476922124624252 2023-01-24 07:24:48.141315: step: 1756/530, loss: 0.0017271970864385366 2023-01-24 07:24:49.187432: step: 1760/530, loss: 0.0036569773219525814 2023-01-24 07:24:50.239478: step: 1764/530, loss: 0.012102874927222729 2023-01-24 07:24:51.285522: step: 1768/530, loss: 0.0029134931974112988 2023-01-24 07:24:52.323852: step: 1772/530, loss: 0.004788354970514774 2023-01-24 07:24:53.377515: step: 1776/530, loss: 0.005316424183547497 2023-01-24 07:24:54.412413: step: 1780/530, loss: 0.0001454366574762389 2023-01-24 07:24:55.464791: step: 1784/530, loss: 0.0022293354850262403 2023-01-24 07:24:56.525420: step: 1788/530, loss: 0.002906629117205739 2023-01-24 07:24:57.558354: step: 1792/530, loss: 0.0021648481488227844 2023-01-24 07:24:58.600082: step: 1796/530, loss: 0.004671917762607336 2023-01-24 07:24:59.643803: step: 1800/530, loss: 0.0009187126997858286 2023-01-24 07:25:00.692202: step: 1804/530, loss: 2.7696472898242064e-05 2023-01-24 07:25:01.732707: step: 1808/530, loss: 3.3388175779691665e-06 2023-01-24 07:25:02.779882: step: 1812/530, loss: 0.0053504277020692825 2023-01-24 07:25:03.827966: step: 1816/530, loss: 0.017988860607147217 2023-01-24 07:25:04.883521: step: 1820/530, loss: 0.014643198810517788 2023-01-24 07:25:05.915250: step: 1824/530, loss: 0.0002301150670973584 2023-01-24 07:25:06.970821: step: 1828/530, loss: 0.0004803269694093615 2023-01-24 07:25:08.023668: step: 1832/530, loss: 0.002894968492910266 2023-01-24 07:25:09.061023: step: 1836/530, loss: 0.0004744551260955632 2023-01-24 07:25:10.096893: step: 1840/530, loss: 0.006309863179922104 2023-01-24 07:25:11.132820: step: 1844/530, loss: 0.0023878691717982292 2023-01-24 07:25:12.170196: step: 1848/530, loss: 0.004327582661062479 2023-01-24 07:25:13.227445: step: 1852/530, loss: 0.0008615344413556159 2023-01-24 07:25:14.267513: step: 1856/530, loss: 0.0060831839218735695 2023-01-24 07:25:15.306873: step: 1860/530, loss: 0.009197462350130081 2023-01-24 07:25:16.366725: step: 1864/530, loss: 0.011733553372323513 2023-01-24 07:25:17.421312: step: 1868/530, loss: 0.0011479125823825598 2023-01-24 07:25:18.484079: step: 1872/530, loss: 0.0035104809794574976 2023-01-24 07:25:19.536318: step: 1876/530, loss: 0.0014737641904503107 2023-01-24 07:25:20.573904: step: 1880/530, loss: 0.0024089596699923277 2023-01-24 07:25:21.609970: step: 1884/530, loss: 0.0022961804643273354 2023-01-24 07:25:22.651046: step: 1888/530, loss: 0.00016385501658078283 2023-01-24 07:25:23.700459: step: 1892/530, loss: 0.00033712349249981344 2023-01-24 07:25:24.743184: step: 1896/530, loss: 0.003500109538435936 2023-01-24 07:25:25.767095: step: 1900/530, loss: 0.0007390539976768196 2023-01-24 07:25:26.803848: step: 1904/530, loss: 0.0025128498673439026 2023-01-24 07:25:27.834049: step: 1908/530, loss: 0.0035820286720991135 2023-01-24 07:25:28.887937: step: 1912/530, loss: 0.002480883616954088 2023-01-24 07:25:29.940523: step: 1916/530, loss: 0.00043412024388089776 2023-01-24 07:25:30.981733: step: 1920/530, loss: 0.004388145636767149 2023-01-24 07:25:32.029485: step: 1924/530, loss: 0.004806217737495899 2023-01-24 07:25:33.090742: step: 1928/530, loss: 0.001881759730167687 2023-01-24 07:25:34.122808: step: 1932/530, loss: 0.0013274835655465722 2023-01-24 07:25:35.165069: step: 1936/530, loss: 0.004924659617245197 2023-01-24 07:25:36.230380: step: 1940/530, loss: 0.0043535600416362286 2023-01-24 07:25:37.291147: step: 1944/530, loss: 0.0009400070994161069 2023-01-24 07:25:38.326595: step: 1948/530, loss: 0.0029635753016918898 2023-01-24 07:25:39.383548: step: 1952/530, loss: 0.016656367108225822 2023-01-24 07:25:40.422471: step: 1956/530, loss: 0.007154458202421665 2023-01-24 07:25:41.464461: step: 1960/530, loss: 0.004404411185532808 2023-01-24 07:25:42.526463: step: 1964/530, loss: 0.019092516973614693 2023-01-24 07:25:43.571548: step: 1968/530, loss: 0.0008912922930903733 2023-01-24 07:25:44.614748: step: 1972/530, loss: 0.007620178163051605 2023-01-24 07:25:45.655629: step: 1976/530, loss: 0.009262746199965477 2023-01-24 07:25:46.692482: step: 1980/530, loss: 0.001222970080561936 2023-01-24 07:25:47.743877: step: 1984/530, loss: 0.02876569703221321 2023-01-24 07:25:48.796956: step: 1988/530, loss: 0.012764384038746357 2023-01-24 07:25:49.834034: step: 1992/530, loss: 0.0068854037672281265 2023-01-24 07:25:50.871918: step: 1996/530, loss: 0.0028152288869023323 2023-01-24 07:25:51.911427: step: 2000/530, loss: 0.008710321970283985 2023-01-24 07:25:52.954524: step: 2004/530, loss: 0.010089727118611336 2023-01-24 07:25:54.000875: step: 2008/530, loss: 0.0015571370022371411 2023-01-24 07:25:55.065421: step: 2012/530, loss: 0.0030157379806041718 2023-01-24 07:25:56.103220: step: 2016/530, loss: 0.003949727397412062 2023-01-24 07:25:57.149236: step: 2020/530, loss: 0.012688472867012024 2023-01-24 07:25:58.181975: step: 2024/530, loss: 0.007030210457742214 2023-01-24 07:25:59.250178: step: 2028/530, loss: 0.0010272155050188303 2023-01-24 07:26:00.306224: step: 2032/530, loss: 0.001649027573876083 2023-01-24 07:26:01.335803: step: 2036/530, loss: 0.001951180980540812 2023-01-24 07:26:02.368989: step: 2040/530, loss: 0.01001209206879139 2023-01-24 07:26:03.415695: step: 2044/530, loss: 0.012277515605092049 2023-01-24 07:26:04.450968: step: 2048/530, loss: 0.0004959240322932601 2023-01-24 07:26:05.487621: step: 2052/530, loss: 0.0002777222834993154 2023-01-24 07:26:06.532813: step: 2056/530, loss: 0.00783250480890274 2023-01-24 07:26:07.584897: step: 2060/530, loss: 0.008940855041146278 2023-01-24 07:26:08.630788: step: 2064/530, loss: 0.006159218028187752 2023-01-24 07:26:09.670781: step: 2068/530, loss: 0.005878178868442774 2023-01-24 07:26:10.695911: step: 2072/530, loss: 0.0003231469017919153 2023-01-24 07:26:11.744935: step: 2076/530, loss: 0.0013630922185257077 2023-01-24 07:26:12.780350: step: 2080/530, loss: 0.0007030994165688753 2023-01-24 07:26:13.817345: step: 2084/530, loss: 1.783264087862335e-05 2023-01-24 07:26:14.845736: step: 2088/530, loss: 0.003977149724960327 2023-01-24 07:26:15.883042: step: 2092/530, loss: 0.004377401899546385 2023-01-24 07:26:16.927005: step: 2096/530, loss: 0.004633416887372732 2023-01-24 07:26:17.959596: step: 2100/530, loss: 0.011995643377304077 2023-01-24 07:26:19.010520: step: 2104/530, loss: 0.0018599849427118897 2023-01-24 07:26:20.058525: step: 2108/530, loss: 0.00544124748557806 2023-01-24 07:26:21.102260: step: 2112/530, loss: 0.0022559345234185457 2023-01-24 07:26:22.157045: step: 2116/530, loss: 0.0004722154699265957 2023-01-24 07:26:23.195315: step: 2120/530, loss: 0.0026975416112691164 ================================================== Loss: 0.004 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37786862527716186, 'r': 0.32337523719165084, 'f1': 0.3485046012269939}, 'combined': 0.2567928640619955, 'stategy': 1, 'epoch': 12} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37377987703702326, 'r': 0.38889597500543227, 'f1': 0.3811881268521715}, 'combined': 0.2954663949763244, 'stategy': 1, 'epoch': 12} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.39184271364795925, 'r': 0.33310348332881545, 'f1': 0.3600934065934066}, 'combined': 0.265331983805668, 'stategy': 1, 'epoch': 12} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3731503814117339, 'r': 0.3686917831044246, 'f1': 0.3709076837888247}, 'combined': 0.2874978218841608, 'stategy': 1, 'epoch': 12} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38265397258058376, 'r': 0.33473146368054857, 'f1': 0.3570920675296541}, 'combined': 0.26312047081132406, 'stategy': 1, 'epoch': 12} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36080409985833045, 'r': 0.3604724784430195, 'f1': 0.36063821291586684}, 'combined': 0.27953775355201166, 'stategy': 1, 'epoch': 12} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 12} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5, 'r': 0.41304347826086957, 'f1': 0.45238095238095233}, 'combined': 0.22619047619047616, 'stategy': 1, 'epoch': 12} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 12} New best chinese model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37786862527716186, 'r': 0.32337523719165084, 'f1': 0.3485046012269939}, 'combined': 0.2567928640619955, 'stategy': 1, 'epoch': 12} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37377987703702326, 'r': 0.38889597500543227, 'f1': 0.3811881268521715}, 'combined': 0.2954663949763244, 'stategy': 1, 'epoch': 12} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 12} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38720415311180817, 'r': 0.33283393047371745, 'f1': 0.35796628848907985}, 'combined': 0.26376463362353253, 'stategy': 1, 'epoch': 8} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36421427197230394, 'r': 0.3625404931489018, 'f1': 0.3633754551322019}, 'combined': 0.28165944369098905, 'stategy': 1, 'epoch': 8} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 8} ****************************** Epoch: 13 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 07:28:51.987274: step: 4/530, loss: 0.0015571422409266233 2023-01-24 07:28:53.022308: step: 8/530, loss: 0.030922045931220055 2023-01-24 07:28:54.059055: step: 12/530, loss: 1.8962708054459654e-05 2023-01-24 07:28:55.094718: step: 16/530, loss: 0.0021634192671626806 2023-01-24 07:28:56.132831: step: 20/530, loss: 0.0017400651704519987 2023-01-24 07:28:57.184011: step: 24/530, loss: 0.0016387642826884985 2023-01-24 07:28:58.217437: step: 28/530, loss: 0.0032358199823647738 2023-01-24 07:28:59.261253: step: 32/530, loss: 0.014631346799433231 2023-01-24 07:29:00.287618: step: 36/530, loss: 4.699534838437103e-05 2023-01-24 07:29:01.318566: step: 40/530, loss: 0.005617233458906412 2023-01-24 07:29:02.360683: step: 44/530, loss: 0.011924831196665764 2023-01-24 07:29:03.416841: step: 48/530, loss: 0.011535929515957832 2023-01-24 07:29:04.457669: step: 52/530, loss: 0.0016216832445934415 2023-01-24 07:29:05.492045: step: 56/530, loss: 0.004749161656945944 2023-01-24 07:29:06.532205: step: 60/530, loss: 0.004102516453713179 2023-01-24 07:29:07.573503: step: 64/530, loss: 0.013086911290884018 2023-01-24 07:29:08.604960: step: 68/530, loss: 0.0016393022378906608 2023-01-24 07:29:09.647673: step: 72/530, loss: 0.024492744356393814 2023-01-24 07:29:10.680759: step: 76/530, loss: 0.0016527425032109022 2023-01-24 07:29:11.732445: step: 80/530, loss: 0.0040021478198468685 2023-01-24 07:29:12.777883: step: 84/530, loss: 0.003007357008755207 2023-01-24 07:29:13.822702: step: 88/530, loss: 0.028197692707180977 2023-01-24 07:29:14.863099: step: 92/530, loss: 0.0030906435567885637 2023-01-24 07:29:15.901864: step: 96/530, loss: 0.07146855443716049 2023-01-24 07:29:16.944114: step: 100/530, loss: 0.01033016201108694 2023-01-24 07:29:18.008123: step: 104/530, loss: 0.0035208845511078835 2023-01-24 07:29:19.057067: step: 108/530, loss: 0.006997973658144474 2023-01-24 07:29:20.091019: step: 112/530, loss: 0.0059784636832773685 2023-01-24 07:29:21.143439: step: 116/530, loss: 0.0007764868787489831 2023-01-24 07:29:22.184733: step: 120/530, loss: 8.146424806909636e-05 2023-01-24 07:29:23.227101: step: 124/530, loss: 0.001662105438299477 2023-01-24 07:29:24.296666: step: 128/530, loss: 0.0019530060235410929 2023-01-24 07:29:25.325240: step: 132/530, loss: 0.0004900959902442992 2023-01-24 07:29:26.375822: step: 136/530, loss: 0.009724903851747513 2023-01-24 07:29:27.402049: step: 140/530, loss: 0.0027151990216225386 2023-01-24 07:29:28.441299: step: 144/530, loss: 0.011689571663737297 2023-01-24 07:29:29.472281: step: 148/530, loss: 2.2507805624627508e-05 2023-01-24 07:29:30.507534: step: 152/530, loss: 0.027585100382566452 2023-01-24 07:29:31.548595: step: 156/530, loss: 0.012612810358405113 2023-01-24 07:29:32.589545: step: 160/530, loss: 5.1878818339901045e-05 2023-01-24 07:29:33.627937: step: 164/530, loss: 0.00010572845349088311 2023-01-24 07:29:34.690554: step: 168/530, loss: 0.00020160217536613345 2023-01-24 07:29:35.750451: step: 172/530, loss: 0.00018560784519650042 2023-01-24 07:29:36.798310: step: 176/530, loss: 0.0031576049514114857 2023-01-24 07:29:37.850186: step: 180/530, loss: 0.00018232775619253516 2023-01-24 07:29:38.906454: step: 184/530, loss: 0.00476881442591548 2023-01-24 07:29:39.962079: step: 188/530, loss: 0.003823744598776102 2023-01-24 07:29:41.025093: step: 192/530, loss: 0.004184453282505274 2023-01-24 07:29:42.090112: step: 196/530, loss: 0.0010865589138120413 2023-01-24 07:29:43.123617: step: 200/530, loss: 0.004469935782253742 2023-01-24 07:29:44.173382: step: 204/530, loss: 0.005355439148843288 2023-01-24 07:29:45.200168: step: 208/530, loss: 0.00020306215446908027 2023-01-24 07:29:46.247791: step: 212/530, loss: 5.8835062191064935e-06 2023-01-24 07:29:47.291836: step: 216/530, loss: 0.0001871240237960592 2023-01-24 07:29:48.324105: step: 220/530, loss: 0.003004108788445592 2023-01-24 07:29:49.352575: step: 224/530, loss: 0.0036614355631172657 2023-01-24 07:29:50.389529: step: 228/530, loss: 0.00044466930557973683 2023-01-24 07:29:51.447418: step: 232/530, loss: 0.006003792863339186 2023-01-24 07:29:52.490124: step: 236/530, loss: 0.0056213694624602795 2023-01-24 07:29:53.529636: step: 240/530, loss: 0.00015426550817210227 2023-01-24 07:29:54.591821: step: 244/530, loss: 0.010886418633162975 2023-01-24 07:29:55.635113: step: 248/530, loss: 0.0052109649404883385 2023-01-24 07:29:56.669638: step: 252/530, loss: 0.0008735673618502915 2023-01-24 07:29:57.745662: step: 256/530, loss: 0.0027040031272917986 2023-01-24 07:29:58.790829: step: 260/530, loss: 0.0026758236344903708 2023-01-24 07:29:59.846539: step: 264/530, loss: 0.005143734626471996 2023-01-24 07:30:00.891351: step: 268/530, loss: 0.00439074169844389 2023-01-24 07:30:01.943448: step: 272/530, loss: 0.007239020429551601 2023-01-24 07:30:02.991562: step: 276/530, loss: 0.0026030123699456453 2023-01-24 07:30:04.040737: step: 280/530, loss: 0.012737544253468513 2023-01-24 07:30:05.086645: step: 284/530, loss: 0.0033456054516136646 2023-01-24 07:30:06.125014: step: 288/530, loss: 0.002196643501520157 2023-01-24 07:30:07.190595: step: 292/530, loss: 0.024431556463241577 2023-01-24 07:30:08.242312: step: 296/530, loss: 0.0022198008373379707 2023-01-24 07:30:09.299293: step: 300/530, loss: 0.0013652290217578411 2023-01-24 07:30:10.347810: step: 304/530, loss: 0.0040387618355453014 2023-01-24 07:30:11.410368: step: 308/530, loss: 0.00270672794431448 2023-01-24 07:30:12.473422: step: 312/530, loss: 0.006156936287879944 2023-01-24 07:30:13.523080: step: 316/530, loss: 0.0027480567805469036 2023-01-24 07:30:14.587960: step: 320/530, loss: 0.009938803501427174 2023-01-24 07:30:15.635470: step: 324/530, loss: 0.0029265740886330605 2023-01-24 07:30:16.698833: step: 328/530, loss: 0.00048030042671598494 2023-01-24 07:30:17.776163: step: 332/530, loss: 0.00372222438454628 2023-01-24 07:30:18.821092: step: 336/530, loss: 0.0003657924826256931 2023-01-24 07:30:19.870515: step: 340/530, loss: 0.011882190592586994 2023-01-24 07:30:20.905347: step: 344/530, loss: 0.003404736053198576 2023-01-24 07:30:21.975443: step: 348/530, loss: 0.0014219387667253613 2023-01-24 07:30:23.020327: step: 352/530, loss: 0.004031968303024769 2023-01-24 07:30:24.053353: step: 356/530, loss: 0.00036041345447301865 2023-01-24 07:30:25.104061: step: 360/530, loss: 0.005119792185723782 2023-01-24 07:30:26.150273: step: 364/530, loss: 0.0006487190839834511 2023-01-24 07:30:27.200566: step: 368/530, loss: 0.005295685958117247 2023-01-24 07:30:28.240608: step: 372/530, loss: 0.005596744827926159 2023-01-24 07:30:29.280820: step: 376/530, loss: 0.00036253826692700386 2023-01-24 07:30:30.323602: step: 380/530, loss: 0.0029514955822378397 2023-01-24 07:30:31.356120: step: 384/530, loss: 0.0002344045788049698 2023-01-24 07:30:32.394474: step: 388/530, loss: 0.006339217536151409 2023-01-24 07:30:33.468430: step: 392/530, loss: 0.001686254283413291 2023-01-24 07:30:34.514854: step: 396/530, loss: 0.0006472884560935199 2023-01-24 07:30:35.543780: step: 400/530, loss: 0.0028015095740556717 2023-01-24 07:30:36.581450: step: 404/530, loss: 0.0003446325717959553 2023-01-24 07:30:37.631353: step: 408/530, loss: 0.0030051255598664284 2023-01-24 07:30:38.661267: step: 412/530, loss: 0.0007342534954659641 2023-01-24 07:30:39.713006: step: 416/530, loss: 0.002018393948674202 2023-01-24 07:30:40.765922: step: 420/530, loss: 0.002326158806681633 2023-01-24 07:30:41.808461: step: 424/530, loss: 0.003065238008275628 2023-01-24 07:30:42.849237: step: 428/530, loss: 0.0031415680423378944 2023-01-24 07:30:43.922585: step: 432/530, loss: 0.0014777034521102905 2023-01-24 07:30:44.948435: step: 436/530, loss: 0.028326740488409996 2023-01-24 07:30:45.992463: step: 440/530, loss: 0.001052691601216793 2023-01-24 07:30:47.020195: step: 444/530, loss: 2.937482531706337e-05 2023-01-24 07:30:48.073887: step: 448/530, loss: 0.0043033454567193985 2023-01-24 07:30:49.124329: step: 452/530, loss: 0.0016315453685820103 2023-01-24 07:30:50.164701: step: 456/530, loss: 0.0039023798890411854 2023-01-24 07:30:51.227123: step: 460/530, loss: 0.001634332467801869 2023-01-24 07:30:52.272753: step: 464/530, loss: 0.0034528980031609535 2023-01-24 07:30:53.340584: step: 468/530, loss: 0.0026262092869728804 2023-01-24 07:30:54.382695: step: 472/530, loss: 0.0005942652933299541 2023-01-24 07:30:55.418559: step: 476/530, loss: 0.0017140927957370877 2023-01-24 07:30:56.450731: step: 480/530, loss: 0.00020897998183500022 2023-01-24 07:30:57.494698: step: 484/530, loss: 0.00015195251035038382 2023-01-24 07:30:58.545156: step: 488/530, loss: 0.008661547675728798 2023-01-24 07:30:59.593643: step: 492/530, loss: 0.006288343574851751 2023-01-24 07:31:00.641113: step: 496/530, loss: 1.9588105715229176e-05 2023-01-24 07:31:01.677091: step: 500/530, loss: 0.002119549550116062 2023-01-24 07:31:02.707911: step: 504/530, loss: 0.0059881326742470264 2023-01-24 07:31:03.756747: step: 508/530, loss: 0.01731732115149498 2023-01-24 07:31:04.795419: step: 512/530, loss: 0.00010866344382520765 2023-01-24 07:31:05.835640: step: 516/530, loss: 0.005246803164482117 2023-01-24 07:31:06.877038: step: 520/530, loss: 5.6141274399124086e-05 2023-01-24 07:31:07.928859: step: 524/530, loss: 0.003649590304121375 2023-01-24 07:31:08.984503: step: 528/530, loss: 0.015118328854441643 2023-01-24 07:31:10.023273: step: 532/530, loss: 0.001896945759654045 2023-01-24 07:31:11.085407: step: 536/530, loss: 0.0010516990441828966 2023-01-24 07:31:12.125523: step: 540/530, loss: 0.004235134460031986 2023-01-24 07:31:13.168577: step: 544/530, loss: 0.0001383834023727104 2023-01-24 07:31:14.220963: step: 548/530, loss: 0.005883309990167618 2023-01-24 07:31:15.256064: step: 552/530, loss: 0.003881060052663088 2023-01-24 07:31:16.299441: step: 556/530, loss: 0.002632217714563012 2023-01-24 07:31:17.339169: step: 560/530, loss: 0.0011256864527240396 2023-01-24 07:31:18.394336: step: 564/530, loss: 0.004862012807279825 2023-01-24 07:31:19.445623: step: 568/530, loss: 3.28724090650212e-05 2023-01-24 07:31:20.473889: step: 572/530, loss: 0.002916815457865596 2023-01-24 07:31:21.518420: step: 576/530, loss: 0.019314512610435486 2023-01-24 07:31:22.571063: step: 580/530, loss: 0.027455750852823257 2023-01-24 07:31:23.631791: step: 584/530, loss: 0.002586080925539136 2023-01-24 07:31:24.692371: step: 588/530, loss: 0.024136962369084358 2023-01-24 07:31:25.741605: step: 592/530, loss: 0.002513302257284522 2023-01-24 07:31:26.793428: step: 596/530, loss: 0.006390607450157404 2023-01-24 07:31:27.842657: step: 600/530, loss: 0.014459188096225262 2023-01-24 07:31:28.899327: step: 604/530, loss: 0.000182782590854913 2023-01-24 07:31:29.938899: step: 608/530, loss: 0.0016076830215752125 2023-01-24 07:31:30.978023: step: 612/530, loss: 0.00020894815679639578 2023-01-24 07:31:32.027841: step: 616/530, loss: 0.004454677924513817 2023-01-24 07:31:33.067408: step: 620/530, loss: 0.0024761175736784935 2023-01-24 07:31:34.116390: step: 624/530, loss: 0.00029460518271662295 2023-01-24 07:31:35.160501: step: 628/530, loss: 0.005864573642611504 2023-01-24 07:31:36.202619: step: 632/530, loss: 0.01079725194722414 2023-01-24 07:31:37.242950: step: 636/530, loss: 0.00878931488841772 2023-01-24 07:31:38.288257: step: 640/530, loss: 0.0002955848758574575 2023-01-24 07:31:39.324091: step: 644/530, loss: 0.00409247912466526 2023-01-24 07:31:40.363578: step: 648/530, loss: 0.0009163686190731823 2023-01-24 07:31:41.420991: step: 652/530, loss: 0.004951812792569399 2023-01-24 07:31:42.459509: step: 656/530, loss: 0.0007211221382021904 2023-01-24 07:31:43.506374: step: 660/530, loss: 0.015389836393296719 2023-01-24 07:31:44.554122: step: 664/530, loss: 0.0035710122901946306 2023-01-24 07:31:45.581476: step: 668/530, loss: 0.0041391681879758835 2023-01-24 07:31:46.621996: step: 672/530, loss: 0.001492330222390592 2023-01-24 07:31:47.669868: step: 676/530, loss: 0.0006232345476746559 2023-01-24 07:31:48.703304: step: 680/530, loss: 0.00012105554924346507 2023-01-24 07:31:49.734395: step: 684/530, loss: 0.007195714395493269 2023-01-24 07:31:50.771219: step: 688/530, loss: 0.004221584182232618 2023-01-24 07:31:51.799147: step: 692/530, loss: 0.00195950735360384 2023-01-24 07:31:52.855515: step: 696/530, loss: 0.00378425233066082 2023-01-24 07:31:53.906004: step: 700/530, loss: 0.000283784611383453 2023-01-24 07:31:54.939005: step: 704/530, loss: 0.007826127111911774 2023-01-24 07:31:55.979377: step: 708/530, loss: 0.0004190918989479542 2023-01-24 07:31:57.021653: step: 712/530, loss: 0.0010957118356600404 2023-01-24 07:31:58.048028: step: 716/530, loss: 0.0013870338443666697 2023-01-24 07:31:59.091647: step: 720/530, loss: 0.014821946620941162 2023-01-24 07:32:00.137512: step: 724/530, loss: 0.0030724769458174706 2023-01-24 07:32:01.176901: step: 728/530, loss: 0.003331148996949196 2023-01-24 07:32:02.224141: step: 732/530, loss: 0.0018085388001054525 2023-01-24 07:32:03.257076: step: 736/530, loss: 0.0015410431660711765 2023-01-24 07:32:04.292207: step: 740/530, loss: 0.0004999007796868682 2023-01-24 07:32:05.340088: step: 744/530, loss: 0.007473272737115622 2023-01-24 07:32:06.397374: step: 748/530, loss: 0.0010935214813798666 2023-01-24 07:32:07.443810: step: 752/530, loss: 7.650296174688265e-05 2023-01-24 07:32:08.494723: step: 756/530, loss: 0.001337980735115707 2023-01-24 07:32:09.544354: step: 760/530, loss: 0.0056527829729020596 2023-01-24 07:32:10.604360: step: 764/530, loss: 3.669329089461826e-05 2023-01-24 07:32:11.640781: step: 768/530, loss: 0.008626979775726795 2023-01-24 07:32:12.693782: step: 772/530, loss: 0.0051635438576340675 2023-01-24 07:32:13.744714: step: 776/530, loss: 0.008310437202453613 2023-01-24 07:32:14.779270: step: 780/530, loss: 0.0001906199031509459 2023-01-24 07:32:15.840316: step: 784/530, loss: 0.002033921657130122 2023-01-24 07:32:16.875900: step: 788/530, loss: 0.0045344773679971695 2023-01-24 07:32:17.926756: step: 792/530, loss: 0.05590024217963219 2023-01-24 07:32:18.954099: step: 796/530, loss: 1.7934558854904026e-05 2023-01-24 07:32:20.003298: step: 800/530, loss: 0.0006921774474903941 2023-01-24 07:32:21.055221: step: 804/530, loss: 0.004721867851912975 2023-01-24 07:32:22.083563: step: 808/530, loss: 0.003283181693404913 2023-01-24 07:32:23.117265: step: 812/530, loss: 0.004787980578839779 2023-01-24 07:32:24.164380: step: 816/530, loss: 0.02432870678603649 2023-01-24 07:32:25.195979: step: 820/530, loss: 0.000611655879765749 2023-01-24 07:32:26.243176: step: 824/530, loss: 0.002131052315235138 2023-01-24 07:32:27.282849: step: 828/530, loss: 0.0027392380870878696 2023-01-24 07:32:28.323650: step: 832/530, loss: 0.022219443693757057 2023-01-24 07:32:29.366017: step: 836/530, loss: 0.00564951915293932 2023-01-24 07:32:30.404538: step: 840/530, loss: 0.0034556053578853607 2023-01-24 07:32:31.446876: step: 844/530, loss: 0.0027208374813199043 2023-01-24 07:32:32.494737: step: 848/530, loss: 0.005269872955977917 2023-01-24 07:32:33.538259: step: 852/530, loss: 0.01046881452202797 2023-01-24 07:32:34.592184: step: 856/530, loss: 0.005150248762220144 2023-01-24 07:32:35.638584: step: 860/530, loss: 0.00027264413074590266 2023-01-24 07:32:36.686756: step: 864/530, loss: 0.002326930407434702 2023-01-24 07:32:37.739064: step: 868/530, loss: 0.0020518675446510315 2023-01-24 07:32:38.786590: step: 872/530, loss: 2.2392792743630707e-05 2023-01-24 07:32:39.837320: step: 876/530, loss: 0.020775049924850464 2023-01-24 07:32:40.882007: step: 880/530, loss: 0.004205694422125816 2023-01-24 07:32:41.920390: step: 884/530, loss: 0.006371791008859873 2023-01-24 07:32:42.941439: step: 888/530, loss: 0.00424738647416234 2023-01-24 07:32:43.984245: step: 892/530, loss: 8.481772965751588e-06 2023-01-24 07:32:45.032197: step: 896/530, loss: 0.0003902267199009657 2023-01-24 07:32:46.085897: step: 900/530, loss: 0.008825684897601604 2023-01-24 07:32:47.131997: step: 904/530, loss: 0.004071269650012255 2023-01-24 07:32:48.184943: step: 908/530, loss: 0.004793594591319561 2023-01-24 07:32:49.233433: step: 912/530, loss: 0.003112341742962599 2023-01-24 07:32:50.266518: step: 916/530, loss: 0.015471885912120342 2023-01-24 07:32:51.335767: step: 920/530, loss: 0.0035965389106422663 2023-01-24 07:32:52.382260: step: 924/530, loss: 0.001437822007574141 2023-01-24 07:32:53.422412: step: 928/530, loss: 0.004162083379924297 2023-01-24 07:32:54.459386: step: 932/530, loss: 0.001630387851037085 2023-01-24 07:32:55.514227: step: 936/530, loss: 0.0011927802115678787 2023-01-24 07:32:56.554883: step: 940/530, loss: 0.001629486447200179 2023-01-24 07:32:57.608206: step: 944/530, loss: 0.0002522141730878502 2023-01-24 07:32:58.651853: step: 948/530, loss: 0.004102247301489115 2023-01-24 07:32:59.707424: step: 952/530, loss: 0.00547128776088357 2023-01-24 07:33:00.747931: step: 956/530, loss: 0.004373923409730196 2023-01-24 07:33:01.784263: step: 960/530, loss: 0.006631750147789717 2023-01-24 07:33:02.834596: step: 964/530, loss: 0.0028928297106176615 2023-01-24 07:33:03.870833: step: 968/530, loss: 0.002853579353541136 2023-01-24 07:33:04.919162: step: 972/530, loss: 0.04011954739689827 2023-01-24 07:33:05.973012: step: 976/530, loss: 0.01069098711013794 2023-01-24 07:33:07.022868: step: 980/530, loss: 0.0030946913175284863 2023-01-24 07:33:08.072377: step: 984/530, loss: 0.0003545731015037745 2023-01-24 07:33:09.128544: step: 988/530, loss: 0.006341470871120691 2023-01-24 07:33:10.179680: step: 992/530, loss: 0.00206725369207561 2023-01-24 07:33:11.221649: step: 996/530, loss: 0.00016413701814599335 2023-01-24 07:33:12.261209: step: 1000/530, loss: 0.006029443349689245 2023-01-24 07:33:13.305237: step: 1004/530, loss: 0.0014888123841956258 2023-01-24 07:33:14.338344: step: 1008/530, loss: 0.0010760299628600478 2023-01-24 07:33:15.391971: step: 1012/530, loss: 0.00012965213682036847 2023-01-24 07:33:16.438555: step: 1016/530, loss: 0.0073159015737473965 2023-01-24 07:33:17.481694: step: 1020/530, loss: 0.03320840001106262 2023-01-24 07:33:18.534884: step: 1024/530, loss: 0.001997166546061635 2023-01-24 07:33:19.600946: step: 1028/530, loss: 0.0015836649108678102 2023-01-24 07:33:20.630928: step: 1032/530, loss: 0.0006292597972787917 2023-01-24 07:33:21.681683: step: 1036/530, loss: 0.004962176084518433 2023-01-24 07:33:22.727970: step: 1040/530, loss: 0.002139468677341938 2023-01-24 07:33:23.779047: step: 1044/530, loss: 0.00261810515075922 2023-01-24 07:33:24.838243: step: 1048/530, loss: 0.00012861681170761585 2023-01-24 07:33:25.896160: step: 1052/530, loss: 0.009888764470815659 2023-01-24 07:33:26.948294: step: 1056/530, loss: 0.002490539336577058 2023-01-24 07:33:27.995424: step: 1060/530, loss: 0.0007864373619668186 2023-01-24 07:33:29.039032: step: 1064/530, loss: 0.0013424664502963424 2023-01-24 07:33:30.079266: step: 1068/530, loss: 0.0022708941251039505 2023-01-24 07:33:31.128544: step: 1072/530, loss: 0.0012711402960121632 2023-01-24 07:33:32.166088: step: 1076/530, loss: 0.0021786584984511137 2023-01-24 07:33:33.233783: step: 1080/530, loss: 0.013784159906208515 2023-01-24 07:33:34.276449: step: 1084/530, loss: 0.00919702835381031 2023-01-24 07:33:35.325707: step: 1088/530, loss: 0.003673143684864044 2023-01-24 07:33:36.376687: step: 1092/530, loss: 0.0008947818423621356 2023-01-24 07:33:37.428491: step: 1096/530, loss: 0.00632647518068552 2023-01-24 07:33:38.473751: step: 1100/530, loss: 0.0008677636506035924 2023-01-24 07:33:39.510802: step: 1104/530, loss: 0.003444284200668335 2023-01-24 07:33:40.558303: step: 1108/530, loss: 0.002046301495283842 2023-01-24 07:33:41.613732: step: 1112/530, loss: 0.004305703099817038 2023-01-24 07:33:42.646811: step: 1116/530, loss: 0.0027629919350147247 2023-01-24 07:33:43.684698: step: 1120/530, loss: 0.0011827803682535887 2023-01-24 07:33:44.716736: step: 1124/530, loss: 0.0020097398664802313 2023-01-24 07:33:45.750637: step: 1128/530, loss: 0.007096866611391306 2023-01-24 07:33:46.798212: step: 1132/530, loss: 0.0035088739823549986 2023-01-24 07:33:47.844356: step: 1136/530, loss: 0.048875074833631516 2023-01-24 07:33:48.892067: step: 1140/530, loss: 0.004634476266801357 2023-01-24 07:33:49.922154: step: 1144/530, loss: 0.006554277613759041 2023-01-24 07:33:50.994773: step: 1148/530, loss: 0.008395140990614891 2023-01-24 07:33:52.026825: step: 1152/530, loss: 0.020909395068883896 2023-01-24 07:33:53.068369: step: 1156/530, loss: 0.009959312155842781 2023-01-24 07:33:54.116149: step: 1160/530, loss: 0.00084947410505265 2023-01-24 07:33:55.149335: step: 1164/530, loss: 0.0018255636096000671 2023-01-24 07:33:56.192910: step: 1168/530, loss: 0.0016596734058111906 2023-01-24 07:33:57.237019: step: 1172/530, loss: 0.010130630806088448 2023-01-24 07:33:58.286528: step: 1176/530, loss: 0.012636475265026093 2023-01-24 07:33:59.332908: step: 1180/530, loss: 0.001632831641472876 2023-01-24 07:34:00.380705: step: 1184/530, loss: 0.0021776848006993532 2023-01-24 07:34:01.444847: step: 1188/530, loss: 0.004113419447094202 2023-01-24 07:34:02.467353: step: 1192/530, loss: 0.001228248467668891 2023-01-24 07:34:03.503363: step: 1196/530, loss: 0.0026793447323143482 2023-01-24 07:34:04.543142: step: 1200/530, loss: 0.0011773507576435804 2023-01-24 07:34:05.574058: step: 1204/530, loss: 0.006706334184855223 2023-01-24 07:34:06.615910: step: 1208/530, loss: 0.0030336366035044193 2023-01-24 07:34:07.653454: step: 1212/530, loss: 0.00010942178778350353 2023-01-24 07:34:08.713034: step: 1216/530, loss: 0.0059114741161465645 2023-01-24 07:34:09.761135: step: 1220/530, loss: 0.0011902586556971073 2023-01-24 07:34:10.789993: step: 1224/530, loss: 0.00015489596989937127 2023-01-24 07:34:11.856338: step: 1228/530, loss: 0.003276297589763999 2023-01-24 07:34:12.941081: step: 1232/530, loss: 0.009583234786987305 2023-01-24 07:34:13.981761: step: 1236/530, loss: 0.0025826788041740656 2023-01-24 07:34:15.027260: step: 1240/530, loss: 0.0003689672448672354 2023-01-24 07:34:16.084573: step: 1244/530, loss: 0.012525648809969425 2023-01-24 07:34:17.155163: step: 1248/530, loss: 0.0009635971509851515 2023-01-24 07:34:18.217569: step: 1252/530, loss: 0.011210901662707329 2023-01-24 07:34:19.268627: step: 1256/530, loss: 0.0628322884440422 2023-01-24 07:34:20.322791: step: 1260/530, loss: 0.00035624243901111186 2023-01-24 07:34:21.380237: step: 1264/530, loss: 0.008533705957233906 2023-01-24 07:34:22.427385: step: 1268/530, loss: 0.0076182191260159016 2023-01-24 07:34:23.489533: step: 1272/530, loss: 0.01421476248651743 2023-01-24 07:34:24.552077: step: 1276/530, loss: 0.0002834429033100605 2023-01-24 07:34:25.590903: step: 1280/530, loss: 0.0006229953723959625 2023-01-24 07:34:26.631606: step: 1284/530, loss: 0.03549204766750336 2023-01-24 07:34:27.653999: step: 1288/530, loss: 0.005786415189504623 2023-01-24 07:34:28.700432: step: 1292/530, loss: 0.005944854114204645 2023-01-24 07:34:29.753870: step: 1296/530, loss: 0.006631250958889723 2023-01-24 07:34:30.803201: step: 1300/530, loss: 0.00032243935856968164 2023-01-24 07:34:31.848339: step: 1304/530, loss: 0.00040961033664643764 2023-01-24 07:34:32.878368: step: 1308/530, loss: 5.458933810587041e-05 2023-01-24 07:34:33.925868: step: 1312/530, loss: 0.006803466472774744 2023-01-24 07:34:34.975765: step: 1316/530, loss: 0.019153432920575142 2023-01-24 07:34:36.014610: step: 1320/530, loss: 0.005157252307981253 2023-01-24 07:34:37.055032: step: 1324/530, loss: 0.002538437256589532 2023-01-24 07:34:38.102675: step: 1328/530, loss: 0.007687521632760763 2023-01-24 07:34:39.176011: step: 1332/530, loss: 0.003714543767273426 2023-01-24 07:34:40.231308: step: 1336/530, loss: 0.0004724572936538607 2023-01-24 07:34:41.250228: step: 1340/530, loss: 0.011397608555853367 2023-01-24 07:34:42.285545: step: 1344/530, loss: 0.0017039562808349729 2023-01-24 07:34:43.317526: step: 1348/530, loss: 0.00597368786111474 2023-01-24 07:34:44.346527: step: 1352/530, loss: 0.0006003369344398379 2023-01-24 07:34:45.389499: step: 1356/530, loss: 0.0037561943754553795 2023-01-24 07:34:46.429256: step: 1360/530, loss: 0.0009858902776613832 2023-01-24 07:34:47.464224: step: 1364/530, loss: 0.0031159569043666124 2023-01-24 07:34:48.511596: step: 1368/530, loss: 0.010406256653368473 2023-01-24 07:34:49.553379: step: 1372/530, loss: 0.0011819112114608288 2023-01-24 07:34:50.587942: step: 1376/530, loss: 0.0020991957280784845 2023-01-24 07:34:51.629361: step: 1380/530, loss: 1.8438924598740414e-05 2023-01-24 07:34:52.669003: step: 1384/530, loss: 0.011804255656898022 2023-01-24 07:34:53.699563: step: 1388/530, loss: 0.00108500593341887 2023-01-24 07:34:54.741011: step: 1392/530, loss: 0.0072795734740793705 2023-01-24 07:34:55.778803: step: 1396/530, loss: 0.009046620689332485 2023-01-24 07:34:56.822025: step: 1400/530, loss: 0.0010546050034463406 2023-01-24 07:34:57.855209: step: 1404/530, loss: 0.0017449066508561373 2023-01-24 07:34:58.879458: step: 1408/530, loss: 0.0054543218575417995 2023-01-24 07:34:59.914057: step: 1412/530, loss: 0.003199639730155468 2023-01-24 07:35:00.945268: step: 1416/530, loss: 0.01098174974322319 2023-01-24 07:35:01.988079: step: 1420/530, loss: 0.0005343706579878926 2023-01-24 07:35:03.020460: step: 1424/530, loss: 0.002258996246382594 2023-01-24 07:35:04.054845: step: 1428/530, loss: 0.0041306097991764545 2023-01-24 07:35:05.114216: step: 1432/530, loss: 0.0025656200014054775 2023-01-24 07:35:06.160494: step: 1436/530, loss: 0.00023132514616008848 2023-01-24 07:35:07.214852: step: 1440/530, loss: 0.015931788831949234 2023-01-24 07:35:08.272248: step: 1444/530, loss: 0.003699875669553876 2023-01-24 07:35:09.322456: step: 1448/530, loss: 0.00031317255343310535 2023-01-24 07:35:10.373200: step: 1452/530, loss: 0.004651620052754879 2023-01-24 07:35:11.414611: step: 1456/530, loss: 0.0044815391302108765 2023-01-24 07:35:12.448767: step: 1460/530, loss: 0.006552047561854124 2023-01-24 07:35:13.478291: step: 1464/530, loss: 0.014346626587212086 2023-01-24 07:35:14.527519: step: 1468/530, loss: 0.007444246206432581 2023-01-24 07:35:15.562474: step: 1472/530, loss: 0.000994421192444861 2023-01-24 07:35:16.600479: step: 1476/530, loss: 0.00458028819411993 2023-01-24 07:35:17.632738: step: 1480/530, loss: 0.017577188089489937 2023-01-24 07:35:18.702364: step: 1484/530, loss: 0.008681370876729488 2023-01-24 07:35:19.737381: step: 1488/530, loss: 0.005712204147130251 2023-01-24 07:35:20.782239: step: 1492/530, loss: 0.0025118859484791756 2023-01-24 07:35:21.820024: step: 1496/530, loss: 0.0019111614674329758 2023-01-24 07:35:22.857261: step: 1500/530, loss: 0.015634384006261826 2023-01-24 07:35:23.899821: step: 1504/530, loss: 6.193132139742374e-05 2023-01-24 07:35:24.937176: step: 1508/530, loss: 0.0022996177431195974 2023-01-24 07:35:25.973255: step: 1512/530, loss: 0.000562844390515238 2023-01-24 07:35:27.005238: step: 1516/530, loss: 0.0022139009088277817 2023-01-24 07:35:28.045078: step: 1520/530, loss: 0.004894523415714502 2023-01-24 07:35:29.084683: step: 1524/530, loss: 0.002735221991315484 2023-01-24 07:35:30.120754: step: 1528/530, loss: 0.0003832722140941769 2023-01-24 07:35:31.154214: step: 1532/530, loss: 5.590159707935527e-05 2023-01-24 07:35:32.217260: step: 1536/530, loss: 0.0008702100603841245 2023-01-24 07:35:33.260117: step: 1540/530, loss: 0.0027145619969815016 2023-01-24 07:35:34.286007: step: 1544/530, loss: 0.009531828574836254 2023-01-24 07:35:35.314615: step: 1548/530, loss: 0.0027640785556286573 2023-01-24 07:35:36.360784: step: 1552/530, loss: 0.0012578010791912675 2023-01-24 07:35:37.400642: step: 1556/530, loss: 0.0012349880998954177 2023-01-24 07:35:38.465090: step: 1560/530, loss: 0.007865747436881065 2023-01-24 07:35:39.511542: step: 1564/530, loss: 6.35531687294133e-05 2023-01-24 07:35:40.559922: step: 1568/530, loss: 0.002713732188567519 2023-01-24 07:35:41.591956: step: 1572/530, loss: 0.012991324067115784 2023-01-24 07:35:42.628277: step: 1576/530, loss: 0.0036734689492732286 2023-01-24 07:35:43.677683: step: 1580/530, loss: 0.003625119337812066 2023-01-24 07:35:44.720243: step: 1584/530, loss: 0.006219614762812853 2023-01-24 07:35:45.761234: step: 1588/530, loss: 0.004824534524232149 2023-01-24 07:35:46.817576: step: 1592/530, loss: 0.001988767646253109 2023-01-24 07:35:47.852785: step: 1596/530, loss: 0.0018592308042570949 2023-01-24 07:35:48.892506: step: 1600/530, loss: 0.00017500405374448746 2023-01-24 07:35:49.940295: step: 1604/530, loss: 0.0003702268295455724 2023-01-24 07:35:50.984903: step: 1608/530, loss: 0.0009201056091114879 2023-01-24 07:35:52.030727: step: 1612/530, loss: 0.002125175204128027 2023-01-24 07:35:53.079989: step: 1616/530, loss: 0.0005968852783553302 2023-01-24 07:35:54.150518: step: 1620/530, loss: 0.004435297567397356 2023-01-24 07:35:55.187496: step: 1624/530, loss: 0.0012423850130289793 2023-01-24 07:35:56.221016: step: 1628/530, loss: 0.003851365763694048 2023-01-24 07:35:57.262195: step: 1632/530, loss: 0.002519437577575445 2023-01-24 07:35:58.310179: step: 1636/530, loss: 0.0018792204791679978 2023-01-24 07:35:59.358951: step: 1640/530, loss: 0.010292806662619114 2023-01-24 07:36:00.398276: step: 1644/530, loss: 0.00264140241779387 2023-01-24 07:36:01.430706: step: 1648/530, loss: 0.01529796700924635 2023-01-24 07:36:02.467419: step: 1652/530, loss: 7.053388253552839e-05 2023-01-24 07:36:03.513485: step: 1656/530, loss: 0.002264065435156226 2023-01-24 07:36:04.561881: step: 1660/530, loss: 0.008241772651672363 2023-01-24 07:36:05.607867: step: 1664/530, loss: 0.0135966707020998 2023-01-24 07:36:06.672738: step: 1668/530, loss: 0.001481459359638393 2023-01-24 07:36:07.713833: step: 1672/530, loss: 0.001255618641152978 2023-01-24 07:36:08.748432: step: 1676/530, loss: 1.674937993811909e-05 2023-01-24 07:36:09.781336: step: 1680/530, loss: 0.000871616299264133 2023-01-24 07:36:10.819888: step: 1684/530, loss: 0.006060166284441948 2023-01-24 07:36:11.862049: step: 1688/530, loss: 0.002602911554276943 2023-01-24 07:36:12.903699: step: 1692/530, loss: 0.008479427546262741 2023-01-24 07:36:13.944708: step: 1696/530, loss: 0.004388756118714809 2023-01-24 07:36:14.991475: step: 1700/530, loss: 0.0019102790392935276 2023-01-24 07:36:16.012005: step: 1704/530, loss: 0.0028448302764445543 2023-01-24 07:36:17.048722: step: 1708/530, loss: 0.001294395886361599 2023-01-24 07:36:18.099976: step: 1712/530, loss: 0.0010381778702139854 2023-01-24 07:36:19.142436: step: 1716/530, loss: 5.277915988699533e-05 2023-01-24 07:36:20.181507: step: 1720/530, loss: 0.00370697770267725 2023-01-24 07:36:21.231059: step: 1724/530, loss: 0.00488363578915596 2023-01-24 07:36:22.275626: step: 1728/530, loss: 0.00016378391592297703 2023-01-24 07:36:23.317106: step: 1732/530, loss: 0.00869457982480526 2023-01-24 07:36:24.374071: step: 1736/530, loss: 0.0037480397149920464 2023-01-24 07:36:25.417637: step: 1740/530, loss: 0.0014802840305492282 2023-01-24 07:36:26.451555: step: 1744/530, loss: 0.004918827209621668 2023-01-24 07:36:27.494451: step: 1748/530, loss: 0.00018765602726489305 2023-01-24 07:36:28.524834: step: 1752/530, loss: 0.003437806386500597 2023-01-24 07:36:29.568464: step: 1756/530, loss: 0.008813544176518917 2023-01-24 07:36:30.615302: step: 1760/530, loss: 0.0030842965934425592 2023-01-24 07:36:31.665121: step: 1764/530, loss: 0.0016851763939484954 2023-01-24 07:36:32.699636: step: 1768/530, loss: 0.005564452148973942 2023-01-24 07:36:33.750944: step: 1772/530, loss: 0.001565176760777831 2023-01-24 07:36:34.795242: step: 1776/530, loss: 0.0032003254164010286 2023-01-24 07:36:35.829277: step: 1780/530, loss: 0.00029246561462059617 2023-01-24 07:36:36.872766: step: 1784/530, loss: 0.003704949514940381 2023-01-24 07:36:37.907902: step: 1788/530, loss: 0.0005255469004623592 2023-01-24 07:36:38.942100: step: 1792/530, loss: 7.619876851094887e-05 2023-01-24 07:36:39.986630: step: 1796/530, loss: 7.677255780436099e-05 2023-01-24 07:36:41.032932: step: 1800/530, loss: 0.007118364796042442 2023-01-24 07:36:42.057183: step: 1804/530, loss: 0.012570079416036606 2023-01-24 07:36:43.098057: step: 1808/530, loss: 0.0025873431004583836 2023-01-24 07:36:44.122799: step: 1812/530, loss: 0.008247978053987026 2023-01-24 07:36:45.183597: step: 1816/530, loss: 0.002031999407336116 2023-01-24 07:36:46.219065: step: 1820/530, loss: 0.00504956254735589 2023-01-24 07:36:47.251036: step: 1824/530, loss: 0.00272430875338614 2023-01-24 07:36:48.285449: step: 1828/530, loss: 0.013086101971566677 2023-01-24 07:36:49.335585: step: 1832/530, loss: 0.004631635267287493 2023-01-24 07:36:50.391345: step: 1836/530, loss: 0.0031072490382939577 2023-01-24 07:36:51.412641: step: 1840/530, loss: 0.0022203095722943544 2023-01-24 07:36:52.462774: step: 1844/530, loss: 0.0038919190410524607 2023-01-24 07:36:53.503919: step: 1848/530, loss: 0.008435151539742947 2023-01-24 07:36:54.547589: step: 1852/530, loss: 0.0022114517632871866 2023-01-24 07:36:55.625755: step: 1856/530, loss: 0.005317586474120617 2023-01-24 07:36:56.662464: step: 1860/530, loss: 0.003897308837622404 2023-01-24 07:36:57.693399: step: 1864/530, loss: 0.0029801796190440655 2023-01-24 07:36:58.749999: step: 1868/530, loss: 0.003196819219738245 2023-01-24 07:36:59.781997: step: 1872/530, loss: 0.01514542754739523 2023-01-24 07:37:00.828740: step: 1876/530, loss: 0.012041516602039337 2023-01-24 07:37:01.883909: step: 1880/530, loss: 0.0013830275274813175 2023-01-24 07:37:02.935022: step: 1884/530, loss: 0.0024755746126174927 2023-01-24 07:37:03.975529: step: 1888/530, loss: 0.00011815586185548455 2023-01-24 07:37:05.016828: step: 1892/530, loss: 0.0077399080619215965 2023-01-24 07:37:06.060091: step: 1896/530, loss: 0.0023121931590139866 2023-01-24 07:37:07.090516: step: 1900/530, loss: 0.002192003885284066 2023-01-24 07:37:08.139186: step: 1904/530, loss: 0.006345229689031839 2023-01-24 07:37:09.212129: step: 1908/530, loss: 0.003066601697355509 2023-01-24 07:37:10.268360: step: 1912/530, loss: 0.000866037153173238 2023-01-24 07:37:11.306814: step: 1916/530, loss: 0.004744301084429026 2023-01-24 07:37:12.355739: step: 1920/530, loss: 0.004265100695192814 2023-01-24 07:37:13.411566: step: 1924/530, loss: 0.007012082729488611 2023-01-24 07:37:14.449417: step: 1928/530, loss: 0.0028661706019192934 2023-01-24 07:37:15.494925: step: 1932/530, loss: 0.004779900424182415 2023-01-24 07:37:16.530589: step: 1936/530, loss: 0.0011881329119205475 2023-01-24 07:37:17.580131: step: 1940/530, loss: 0.0048606423661112785 2023-01-24 07:37:18.620859: step: 1944/530, loss: 0.0021390379406511784 2023-01-24 07:37:19.681142: step: 1948/530, loss: 0.0009323130361735821 2023-01-24 07:37:20.712219: step: 1952/530, loss: 0.007452195044606924 2023-01-24 07:37:21.759808: step: 1956/530, loss: 0.008301799185574055 2023-01-24 07:37:22.813990: step: 1960/530, loss: 0.0032623056322336197 2023-01-24 07:37:23.867139: step: 1964/530, loss: 0.01720890775322914 2023-01-24 07:37:24.926513: step: 1968/530, loss: 0.0022893399000167847 2023-01-24 07:37:25.957568: step: 1972/530, loss: 0.000980921322479844 2023-01-24 07:37:26.997747: step: 1976/530, loss: 0.007523497100919485 2023-01-24 07:37:28.050555: step: 1980/530, loss: 0.001996350474655628 2023-01-24 07:37:29.099173: step: 1984/530, loss: 0.0012559270253404975 2023-01-24 07:37:30.156531: step: 1988/530, loss: 0.0014231265522539616 2023-01-24 07:37:31.201962: step: 1992/530, loss: 0.0010474895825609565 2023-01-24 07:37:32.228685: step: 1996/530, loss: 2.2794338292442262e-06 2023-01-24 07:37:33.269543: step: 2000/530, loss: 0.005295241251587868 2023-01-24 07:37:34.321941: step: 2004/530, loss: 0.005369522608816624 2023-01-24 07:37:35.371761: step: 2008/530, loss: 0.011288786306977272 2023-01-24 07:37:36.407834: step: 2012/530, loss: 0.0031512388959527016 2023-01-24 07:37:37.440556: step: 2016/530, loss: 0.013702718541026115 2023-01-24 07:37:38.473954: step: 2020/530, loss: 0.0023090012837201357 2023-01-24 07:37:39.523810: step: 2024/530, loss: 0.009029623121023178 2023-01-24 07:37:40.563202: step: 2028/530, loss: 0.0007019104668870568 2023-01-24 07:37:41.583216: step: 2032/530, loss: 3.0366447845153743e-06 2023-01-24 07:37:42.614029: step: 2036/530, loss: 0.011007311753928661 2023-01-24 07:37:43.643024: step: 2040/530, loss: 0.0033145921770483255 2023-01-24 07:37:44.692854: step: 2044/530, loss: 0.007975262589752674 2023-01-24 07:37:45.730160: step: 2048/530, loss: 0.005696276668459177 2023-01-24 07:37:46.764635: step: 2052/530, loss: 0.0048665269277989864 2023-01-24 07:37:47.818763: step: 2056/530, loss: 0.010040553286671638 2023-01-24 07:37:48.843952: step: 2060/530, loss: 0.004857656545937061 2023-01-24 07:37:49.888371: step: 2064/530, loss: 0.0018951552920043468 2023-01-24 07:37:50.936076: step: 2068/530, loss: 0.017786642536520958 2023-01-24 07:37:51.986758: step: 2072/530, loss: 0.0007790344534441829 2023-01-24 07:37:53.023447: step: 2076/530, loss: 0.0 2023-01-24 07:37:54.072423: step: 2080/530, loss: 0.021734651178121567 2023-01-24 07:37:55.125850: step: 2084/530, loss: 0.00227438029833138 2023-01-24 07:37:56.167673: step: 2088/530, loss: 0.002077819313853979 2023-01-24 07:37:57.206565: step: 2092/530, loss: 0.008677537553012371 2023-01-24 07:37:58.235905: step: 2096/530, loss: 0.01600026711821556 2023-01-24 07:37:59.285653: step: 2100/530, loss: 0.0011597075499594212 2023-01-24 07:38:00.321286: step: 2104/530, loss: 1.347493252978893e-05 2023-01-24 07:38:01.353008: step: 2108/530, loss: 0.006810830440372229 2023-01-24 07:38:02.398097: step: 2112/530, loss: 0.005150188226252794 2023-01-24 07:38:03.425692: step: 2116/530, loss: 0.010339801199734211 2023-01-24 07:38:04.468727: step: 2120/530, loss: 0.00022283566067926586 ================================================== Loss: 0.005 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3701296909492274, 'r': 0.31815702087286524, 'f1': 0.34218112244897964}, 'combined': 0.25213345864661657, 'stategy': 1, 'epoch': 13} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3768783872392822, 'r': 0.3907342102995499, 'f1': 0.38368124621472044}, 'combined': 0.2973988607023192, 'stategy': 1, 'epoch': 13} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3936708108964207, 'r': 0.3368985497424777, 'f1': 0.3630788051416886}, 'combined': 0.2675317511570337, 'stategy': 1, 'epoch': 13} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3717670621108563, 'r': 0.3686917831044246, 'f1': 0.37022303647218635}, 'combined': 0.286967138318154, 'stategy': 1, 'epoch': 13} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38297703353635176, 'r': 0.33283393047371745, 'f1': 0.35614920073025197}, 'combined': 0.26242572685386983, 'stategy': 1, 'epoch': 13} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3629184752942302, 'r': 0.36391916961949006, 'f1': 0.3634181335897248}, 'combined': 0.281692524600648, 'stategy': 1, 'epoch': 13} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 13} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5, 'r': 0.41304347826086957, 'f1': 0.45238095238095233}, 'combined': 0.22619047619047616, 'stategy': 1, 'epoch': 13} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 13} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37786862527716186, 'r': 0.32337523719165084, 'f1': 0.3485046012269939}, 'combined': 0.2567928640619955, 'stategy': 1, 'epoch': 12} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37377987703702326, 'r': 0.38889597500543227, 'f1': 0.3811881268521715}, 'combined': 0.2954663949763244, 'stategy': 1, 'epoch': 12} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 12} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38720415311180817, 'r': 0.33283393047371745, 'f1': 0.35796628848907985}, 'combined': 0.26376463362353253, 'stategy': 1, 'epoch': 8} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36421427197230394, 'r': 0.3625404931489018, 'f1': 0.3633754551322019}, 'combined': 0.28165944369098905, 'stategy': 1, 'epoch': 8} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 8} ****************************** Epoch: 14 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 07:40:28.076496: step: 4/530, loss: 0.0016346677439287305 2023-01-24 07:40:29.143620: step: 8/530, loss: 0.003675297601148486 2023-01-24 07:40:30.181869: step: 12/530, loss: 8.963190339272842e-05 2023-01-24 07:40:31.209945: step: 16/530, loss: 0.00565005699172616 2023-01-24 07:40:32.248170: step: 20/530, loss: 0.009837971068918705 2023-01-24 07:40:33.276016: step: 24/530, loss: 0.0021390339825302362 2023-01-24 07:40:34.329163: step: 28/530, loss: 0.007885076105594635 2023-01-24 07:40:35.373819: step: 32/530, loss: 0.002843404421582818 2023-01-24 07:40:36.421664: step: 36/530, loss: 0.00521209929138422 2023-01-24 07:40:37.463052: step: 40/530, loss: 0.003777820384129882 2023-01-24 07:40:38.511579: step: 44/530, loss: 0.0025085266679525375 2023-01-24 07:40:39.556619: step: 48/530, loss: 0.004044826608151197 2023-01-24 07:40:40.605864: step: 52/530, loss: 0.018876822665333748 2023-01-24 07:40:41.651373: step: 56/530, loss: 0.005854184273630381 2023-01-24 07:40:42.678857: step: 60/530, loss: 0.0013494621962308884 2023-01-24 07:40:43.738632: step: 64/530, loss: 0.021728720515966415 2023-01-24 07:40:44.762565: step: 68/530, loss: 4.5802142267348245e-05 2023-01-24 07:40:45.818806: step: 72/530, loss: 0.004853399936109781 2023-01-24 07:40:46.854782: step: 76/530, loss: 0.0018106414936482906 2023-01-24 07:40:47.906955: step: 80/530, loss: 0.0008266663062386215 2023-01-24 07:40:48.937353: step: 84/530, loss: 0.005835749674588442 2023-01-24 07:40:49.971626: step: 88/530, loss: 0.004660235717892647 2023-01-24 07:40:51.019340: step: 92/530, loss: 0.009952348656952381 2023-01-24 07:40:52.080978: step: 96/530, loss: 0.007610968314111233 2023-01-24 07:40:53.116064: step: 100/530, loss: 0.0013420917093753815 2023-01-24 07:40:54.158633: step: 104/530, loss: 0.0026530746836215258 2023-01-24 07:40:55.207244: step: 108/530, loss: 0.003011272056028247 2023-01-24 07:40:56.246438: step: 112/530, loss: 0.02391926944255829 2023-01-24 07:40:57.290007: step: 116/530, loss: 0.00021972099784761667 2023-01-24 07:40:58.328243: step: 120/530, loss: 0.002886492758989334 2023-01-24 07:40:59.363847: step: 124/530, loss: 0.006241063587367535 2023-01-24 07:41:00.404680: step: 128/530, loss: 0.00011348125553922728 2023-01-24 07:41:01.438895: step: 132/530, loss: 0.006708416156470776 2023-01-24 07:41:02.483375: step: 136/530, loss: 0.024093803018331528 2023-01-24 07:41:03.526966: step: 140/530, loss: 0.00023168597545009106 2023-01-24 07:41:04.569980: step: 144/530, loss: 0.0026332861743867397 2023-01-24 07:41:05.604495: step: 148/530, loss: 0.0036725481040775776 2023-01-24 07:41:06.651189: step: 152/530, loss: 0.004245490301400423 2023-01-24 07:41:07.709711: step: 156/530, loss: 0.0014050767058506608 2023-01-24 07:41:08.751111: step: 160/530, loss: 0.019012991338968277 2023-01-24 07:41:09.785238: step: 164/530, loss: 0.00023355062876362354 2023-01-24 07:41:10.828456: step: 168/530, loss: 0.041325975209474564 2023-01-24 07:41:11.886350: step: 172/530, loss: 0.0006953369593247771 2023-01-24 07:41:12.916615: step: 176/530, loss: 0.043282415717840195 2023-01-24 07:41:13.952067: step: 180/530, loss: 0.00044354505371302366 2023-01-24 07:41:14.990028: step: 184/530, loss: 0.0016363575123250484 2023-01-24 07:41:16.031933: step: 188/530, loss: 0.0019133525202050805 2023-01-24 07:41:17.078538: step: 192/530, loss: 0.005224434658885002 2023-01-24 07:41:18.128314: step: 196/530, loss: 0.0006499649025499821 2023-01-24 07:41:19.172473: step: 200/530, loss: 0.0036496578250080347 2023-01-24 07:41:20.211899: step: 204/530, loss: 0.0025979732163250446 2023-01-24 07:41:21.267032: step: 208/530, loss: 0.0006325413123704493 2023-01-24 07:41:22.317055: step: 212/530, loss: 0.024446314200758934 2023-01-24 07:41:23.354686: step: 216/530, loss: 0.000326610985212028 2023-01-24 07:41:24.404070: step: 220/530, loss: 0.0028669715393334627 2023-01-24 07:41:25.439197: step: 224/530, loss: 0.01616206020116806 2023-01-24 07:41:26.473470: step: 228/530, loss: 0.003300365526229143 2023-01-24 07:41:27.516713: step: 232/530, loss: 0.0007692713406868279 2023-01-24 07:41:28.566810: step: 236/530, loss: 0.006896074861288071 2023-01-24 07:41:29.599680: step: 240/530, loss: 0.0038489573635160923 2023-01-24 07:41:30.629910: step: 244/530, loss: 0.003974266815930605 2023-01-24 07:41:31.665285: step: 248/530, loss: 0.0008489040192216635 2023-01-24 07:41:32.708278: step: 252/530, loss: 0.005472026765346527 2023-01-24 07:41:33.738131: step: 256/530, loss: 3.281903673268971e-07 2023-01-24 07:41:34.786892: step: 260/530, loss: 0.030663231387734413 2023-01-24 07:41:35.832097: step: 264/530, loss: 0.0011019647354260087 2023-01-24 07:41:36.880114: step: 268/530, loss: 0.009593290276825428 2023-01-24 07:41:37.913134: step: 272/530, loss: 0.0049520437605679035 2023-01-24 07:41:38.966394: step: 276/530, loss: 0.003528180532157421 2023-01-24 07:41:40.006066: step: 280/530, loss: 0.001853889785706997 2023-01-24 07:41:41.030602: step: 284/530, loss: 0.0008176437695510685 2023-01-24 07:41:42.084388: step: 288/530, loss: 0.0020257695578038692 2023-01-24 07:41:43.129287: step: 292/530, loss: 0.001921321265399456 2023-01-24 07:41:44.179639: step: 296/530, loss: 0.010214938782155514 2023-01-24 07:41:45.234499: step: 300/530, loss: 0.002811092184856534 2023-01-24 07:41:46.270187: step: 304/530, loss: 0.00010787619248731062 2023-01-24 07:41:47.315281: step: 308/530, loss: 0.0029250311199575663 2023-01-24 07:41:48.360707: step: 312/530, loss: 0.0023454746697098017 2023-01-24 07:41:49.398842: step: 316/530, loss: 0.012640808708965778 2023-01-24 07:41:50.456681: step: 320/530, loss: 0.0015858152182772756 2023-01-24 07:41:51.502941: step: 324/530, loss: 0.0035949964076280594 2023-01-24 07:41:52.548618: step: 328/530, loss: 0.005279530771076679 2023-01-24 07:41:53.597985: step: 332/530, loss: 0.008063623681664467 2023-01-24 07:41:54.642000: step: 336/530, loss: 0.000725615827832371 2023-01-24 07:41:55.699390: step: 340/530, loss: 0.00016533599409740418 2023-01-24 07:41:56.762577: step: 344/530, loss: 0.0020527879241853952 2023-01-24 07:41:57.798270: step: 348/530, loss: 0.00041898328345268965 2023-01-24 07:41:58.844476: step: 352/530, loss: 0.0023069726303219795 2023-01-24 07:41:59.898461: step: 356/530, loss: 0.006121960002928972 2023-01-24 07:42:00.928198: step: 360/530, loss: 1.2996922123420518e-05 2023-01-24 07:42:01.964341: step: 364/530, loss: 2.8845883207395673e-05 2023-01-24 07:42:03.002972: step: 368/530, loss: 0.0035502160899341106 2023-01-24 07:42:04.048759: step: 372/530, loss: 0.00973084382712841 2023-01-24 07:42:05.097581: step: 376/530, loss: 0.0008423366816714406 2023-01-24 07:42:06.139933: step: 380/530, loss: 0.0028338225092738867 2023-01-24 07:42:07.182774: step: 384/530, loss: 0.0005899100797250867 2023-01-24 07:42:08.243614: step: 388/530, loss: 0.010503212921321392 2023-01-24 07:42:09.285975: step: 392/530, loss: 0.00513524329289794 2023-01-24 07:42:10.319180: step: 396/530, loss: 0.016411567106842995 2023-01-24 07:42:11.350597: step: 400/530, loss: 0.00012324421550147235 2023-01-24 07:42:12.400191: step: 404/530, loss: 0.005968338809907436 2023-01-24 07:42:13.447080: step: 408/530, loss: 0.0038618259131908417 2023-01-24 07:42:14.484392: step: 412/530, loss: 0.009258364327251911 2023-01-24 07:42:15.538548: step: 416/530, loss: 0.021530913189053535 2023-01-24 07:42:16.583793: step: 420/530, loss: 0.007830331102013588 2023-01-24 07:42:17.631851: step: 424/530, loss: 0.007883569225668907 2023-01-24 07:42:18.683786: step: 428/530, loss: 0.01603441871702671 2023-01-24 07:42:19.722584: step: 432/530, loss: 0.008814103901386261 2023-01-24 07:42:20.763056: step: 436/530, loss: 0.0035951256286352873 2023-01-24 07:42:21.807734: step: 440/530, loss: 0.00854410044848919 2023-01-24 07:42:22.861113: step: 444/530, loss: 0.0014864866388961673 2023-01-24 07:42:23.919091: step: 448/530, loss: 0.002587459748610854 2023-01-24 07:42:24.951554: step: 452/530, loss: 0.00239950162358582 2023-01-24 07:42:25.980453: step: 456/530, loss: 4.5807395508745685e-05 2023-01-24 07:42:26.998049: step: 460/530, loss: 0.0013485102681443095 2023-01-24 07:42:28.034627: step: 464/530, loss: 0.0008352117147296667 2023-01-24 07:42:29.088046: step: 468/530, loss: 0.01152646541595459 2023-01-24 07:42:30.130344: step: 472/530, loss: 0.021400773897767067 2023-01-24 07:42:31.172671: step: 476/530, loss: 0.0020851807203143835 2023-01-24 07:42:32.240078: step: 480/530, loss: 0.006133920978754759 2023-01-24 07:42:33.289018: step: 484/530, loss: 0.021603532135486603 2023-01-24 07:42:34.341734: step: 488/530, loss: 0.001309685525484383 2023-01-24 07:42:35.393814: step: 492/530, loss: 0.0016548128332942724 2023-01-24 07:42:36.429432: step: 496/530, loss: 8.88724607648328e-05 2023-01-24 07:42:37.465954: step: 500/530, loss: 0.0006548142991960049 2023-01-24 07:42:38.518847: step: 504/530, loss: 0.0004508278507273644 2023-01-24 07:42:39.562316: step: 508/530, loss: 0.0 2023-01-24 07:42:40.615408: step: 512/530, loss: 0.006211565341800451 2023-01-24 07:42:41.653037: step: 516/530, loss: 0.0003564735525287688 2023-01-24 07:42:42.694104: step: 520/530, loss: 0.0068017481826245785 2023-01-24 07:42:43.744672: step: 524/530, loss: 0.00040756972157396376 2023-01-24 07:42:44.775304: step: 528/530, loss: 0.0023978622630238533 2023-01-24 07:42:45.804569: step: 532/530, loss: 0.005935546476393938 2023-01-24 07:42:46.851451: step: 536/530, loss: 0.017470233142375946 2023-01-24 07:42:47.895764: step: 540/530, loss: 0.009147955104708672 2023-01-24 07:42:48.929809: step: 544/530, loss: 0.0031279607210308313 2023-01-24 07:42:49.965955: step: 548/530, loss: 0.0004049708950333297 2023-01-24 07:42:51.013455: step: 552/530, loss: 0.0024942634627223015 2023-01-24 07:42:52.064060: step: 556/530, loss: 0.012339996173977852 2023-01-24 07:42:53.105924: step: 560/530, loss: 0.0007899929187260568 2023-01-24 07:42:54.149573: step: 564/530, loss: 0.0006798647809773684 2023-01-24 07:42:55.199864: step: 568/530, loss: 0.0012958283768966794 2023-01-24 07:42:56.244866: step: 572/530, loss: 0.005314614158123732 2023-01-24 07:42:57.294007: step: 576/530, loss: 1.1772711332014296e-05 2023-01-24 07:42:58.321376: step: 580/530, loss: 0.0008427457069046795 2023-01-24 07:42:59.369736: step: 584/530, loss: 0.0007043863879516721 2023-01-24 07:43:00.420811: step: 588/530, loss: 0.006046108435839415 2023-01-24 07:43:01.447568: step: 592/530, loss: 0.0016927807591855526 2023-01-24 07:43:02.501503: step: 596/530, loss: 0.009806297719478607 2023-01-24 07:43:03.548315: step: 600/530, loss: 0.0049317367374897 2023-01-24 07:43:04.597303: step: 604/530, loss: 0.0012931310338899493 2023-01-24 07:43:05.640122: step: 608/530, loss: 0.02182329073548317 2023-01-24 07:43:06.680822: step: 612/530, loss: 0.0027955302502959967 2023-01-24 07:43:07.722995: step: 616/530, loss: 0.0018680758075788617 2023-01-24 07:43:08.752190: step: 620/530, loss: 0.00029663185705430806 2023-01-24 07:43:09.790817: step: 624/530, loss: 0.002389618894085288 2023-01-24 07:43:10.837053: step: 628/530, loss: 0.006171109154820442 2023-01-24 07:43:11.894258: step: 632/530, loss: 0.0007514026365242898 2023-01-24 07:43:12.937383: step: 636/530, loss: 0.003579250071197748 2023-01-24 07:43:13.991820: step: 640/530, loss: 0.0014014053158462048 2023-01-24 07:43:15.038373: step: 644/530, loss: 0.0031395924743264914 2023-01-24 07:43:16.084808: step: 648/530, loss: 0.001203692751005292 2023-01-24 07:43:17.136123: step: 652/530, loss: 0.002001269022002816 2023-01-24 07:43:18.162539: step: 656/530, loss: 0.0008503199787810445 2023-01-24 07:43:19.200002: step: 660/530, loss: 0.0016651725163683295 2023-01-24 07:43:20.243724: step: 664/530, loss: 0.0044419714249670506 2023-01-24 07:43:21.275444: step: 668/530, loss: 0.0044181267730891705 2023-01-24 07:43:22.325792: step: 672/530, loss: 0.0015515610575675964 2023-01-24 07:43:23.380331: step: 676/530, loss: 1.1240268577239476e-05 2023-01-24 07:43:24.414242: step: 680/530, loss: 0.0005631298990920186 2023-01-24 07:43:25.466046: step: 684/530, loss: 0.0015676140319555998 2023-01-24 07:43:26.506999: step: 688/530, loss: 0.0007023405050858855 2023-01-24 07:43:27.556216: step: 692/530, loss: 0.00863282848149538 2023-01-24 07:43:28.592172: step: 696/530, loss: 0.0004379982710815966 2023-01-24 07:43:29.644734: step: 700/530, loss: 0.005205802619457245 2023-01-24 07:43:30.673584: step: 704/530, loss: 0.003251198213547468 2023-01-24 07:43:31.707140: step: 708/530, loss: 0.0013841241598129272 2023-01-24 07:43:32.743457: step: 712/530, loss: 0.003165752161294222 2023-01-24 07:43:33.803526: step: 716/530, loss: 0.0013279749546200037 2023-01-24 07:43:34.845153: step: 720/530, loss: 0.0034479363821446896 2023-01-24 07:43:35.914762: step: 724/530, loss: 0.0029910055454820395 2023-01-24 07:43:36.950041: step: 728/530, loss: 0.0004792314430233091 2023-01-24 07:43:38.015248: step: 732/530, loss: 0.0015904501779004931 2023-01-24 07:43:39.046836: step: 736/530, loss: 0.006513257510960102 2023-01-24 07:43:40.098762: step: 740/530, loss: 0.00045964971650391817 2023-01-24 07:43:41.135089: step: 744/530, loss: 1.1577099030546378e-06 2023-01-24 07:43:42.178451: step: 748/530, loss: 0.00016964190581347793 2023-01-24 07:43:43.230088: step: 752/530, loss: 0.00014626690244767815 2023-01-24 07:43:44.278935: step: 756/530, loss: 0.0017723914934322238 2023-01-24 07:43:45.331059: step: 760/530, loss: 0.0031594065949320793 2023-01-24 07:43:46.373089: step: 764/530, loss: 0.0025188724976032972 2023-01-24 07:43:47.407672: step: 768/530, loss: 0.0005355093744583428 2023-01-24 07:43:48.470080: step: 772/530, loss: 0.0029823577497154474 2023-01-24 07:43:49.520598: step: 776/530, loss: 0.0007006157538853586 2023-01-24 07:43:50.568725: step: 780/530, loss: 0.001940453890711069 2023-01-24 07:43:51.611671: step: 784/530, loss: 0.0003366061137057841 2023-01-24 07:43:52.664601: step: 788/530, loss: 0.002615744946524501 2023-01-24 07:43:53.717547: step: 792/530, loss: 0.003225903259590268 2023-01-24 07:43:54.758049: step: 796/530, loss: 0.0014087334275245667 2023-01-24 07:43:55.798860: step: 800/530, loss: 0.0014808470150455832 2023-01-24 07:43:56.845320: step: 804/530, loss: 0.00101218291092664 2023-01-24 07:43:57.892075: step: 808/530, loss: 0.000100733719591517 2023-01-24 07:43:58.938854: step: 812/530, loss: 0.00043810647912323475 2023-01-24 07:43:59.981596: step: 816/530, loss: 0.0033638705499470234 2023-01-24 07:44:01.028427: step: 820/530, loss: 0.0016776984557509422 2023-01-24 07:44:02.055792: step: 824/530, loss: 0.0011634697439149022 2023-01-24 07:44:03.138227: step: 828/530, loss: 0.006496155634522438 2023-01-24 07:44:04.180192: step: 832/530, loss: 0.009308735840022564 2023-01-24 07:44:05.253454: step: 836/530, loss: 0.001778215984813869 2023-01-24 07:44:06.307665: step: 840/530, loss: 0.0025846268981695175 2023-01-24 07:44:07.354508: step: 844/530, loss: 0.031112458556890488 2023-01-24 07:44:08.391194: step: 848/530, loss: 0.0006541639450006187 2023-01-24 07:44:09.436427: step: 852/530, loss: 0.00017527453019283712 2023-01-24 07:44:10.483210: step: 856/530, loss: 0.0044852364808321 2023-01-24 07:44:11.531093: step: 860/530, loss: 0.005102625582367182 2023-01-24 07:44:12.590816: step: 864/530, loss: 0.0032032590825110674 2023-01-24 07:44:13.650549: step: 868/530, loss: 0.004433238413184881 2023-01-24 07:44:14.681356: step: 872/530, loss: 0.0007703463779762387 2023-01-24 07:44:15.726371: step: 876/530, loss: 0.003734318073838949 2023-01-24 07:44:16.773310: step: 880/530, loss: 0.011195659637451172 2023-01-24 07:44:17.810064: step: 884/530, loss: 0.010753174312412739 2023-01-24 07:44:18.839460: step: 888/530, loss: 0.0008762682555243373 2023-01-24 07:44:19.902543: step: 892/530, loss: 0.004485843703150749 2023-01-24 07:44:20.945216: step: 896/530, loss: 0.0036895328667014837 2023-01-24 07:44:21.990661: step: 900/530, loss: 0.00019181902462150902 2023-01-24 07:44:23.030442: step: 904/530, loss: 0.0001848454267019406 2023-01-24 07:44:24.077012: step: 908/530, loss: 0.0006472284439951181 2023-01-24 07:44:25.130170: step: 912/530, loss: 0.0056353467516601086 2023-01-24 07:44:26.192323: step: 916/530, loss: 4.909193648927612e-06 2023-01-24 07:44:27.228608: step: 920/530, loss: 0.016644641757011414 2023-01-24 07:44:28.253173: step: 924/530, loss: 0.0016755490796640515 2023-01-24 07:44:29.279263: step: 928/530, loss: 8.314847218571231e-05 2023-01-24 07:44:30.333064: step: 932/530, loss: 0.003018605289980769 2023-01-24 07:44:31.387996: step: 936/530, loss: 0.004783610347658396 2023-01-24 07:44:32.410817: step: 940/530, loss: 0.0028378639835864305 2023-01-24 07:44:33.479384: step: 944/530, loss: 0.008646524511277676 2023-01-24 07:44:34.526869: step: 948/530, loss: 0.0016284373123198748 2023-01-24 07:44:35.552201: step: 952/530, loss: 0.006739044561982155 2023-01-24 07:44:36.605701: step: 956/530, loss: 0.0017372049624100327 2023-01-24 07:44:37.642349: step: 960/530, loss: 0.003786595305427909 2023-01-24 07:44:38.678156: step: 964/530, loss: 0.00020437585772015154 2023-01-24 07:44:39.725468: step: 968/530, loss: 0.0005733373109251261 2023-01-24 07:44:40.765526: step: 972/530, loss: 7.953478780109435e-05 2023-01-24 07:44:41.804586: step: 976/530, loss: 0.0005118280532769859 2023-01-24 07:44:42.849688: step: 980/530, loss: 0.004252298269420862 2023-01-24 07:44:43.890194: step: 984/530, loss: 0.0030935704708099365 2023-01-24 07:44:44.928207: step: 988/530, loss: 0.006477537099272013 2023-01-24 07:44:45.982242: step: 992/530, loss: 0.013364238664507866 2023-01-24 07:44:47.021795: step: 996/530, loss: 0.0014077663654461503 2023-01-24 07:44:48.060347: step: 1000/530, loss: 0.003003102960065007 2023-01-24 07:44:49.100809: step: 1004/530, loss: 0.0015073404647409916 2023-01-24 07:44:50.145624: step: 1008/530, loss: 0.0008681311155669391 2023-01-24 07:44:51.180524: step: 1012/530, loss: 0.002079136436805129 2023-01-24 07:44:52.211385: step: 1016/530, loss: 0.0004659243568312377 2023-01-24 07:44:53.259842: step: 1020/530, loss: 0.005345776677131653 2023-01-24 07:44:54.289010: step: 1024/530, loss: 0.0021580331958830357 2023-01-24 07:44:55.318447: step: 1028/530, loss: 0.007207970600575209 2023-01-24 07:44:56.350364: step: 1032/530, loss: 2.518750261515379e-05 2023-01-24 07:44:57.380254: step: 1036/530, loss: 0.005891777109354734 2023-01-24 07:44:58.415213: step: 1040/530, loss: 0.01195522677153349 2023-01-24 07:44:59.452536: step: 1044/530, loss: 0.00037829522625543177 2023-01-24 07:45:00.487526: step: 1048/530, loss: 0.0003775592485908419 2023-01-24 07:45:01.517042: step: 1052/530, loss: 0.0024395822547376156 2023-01-24 07:45:02.550340: step: 1056/530, loss: 0.0011896878713741899 2023-01-24 07:45:03.631205: step: 1060/530, loss: 0.0027918650303035975 2023-01-24 07:45:04.674663: step: 1064/530, loss: 0.00016347611381206661 2023-01-24 07:45:05.711671: step: 1068/530, loss: 0.0054471734911203384 2023-01-24 07:45:06.755408: step: 1072/530, loss: 0.0013330650981515646 2023-01-24 07:45:07.806096: step: 1076/530, loss: 0.0008108783513307571 2023-01-24 07:45:08.841870: step: 1080/530, loss: 0.002921827370300889 2023-01-24 07:45:09.911465: step: 1084/530, loss: 0.0006199057679623365 2023-01-24 07:45:10.946362: step: 1088/530, loss: 0.007223739754408598 2023-01-24 07:45:12.010161: step: 1092/530, loss: 0.00037254771450534463 2023-01-24 07:45:13.059848: step: 1096/530, loss: 0.006985718384385109 2023-01-24 07:45:14.097181: step: 1100/530, loss: 0.00378967821598053 2023-01-24 07:45:15.135720: step: 1104/530, loss: 0.009589145891368389 2023-01-24 07:45:16.200651: step: 1108/530, loss: 2.0393277736729942e-05 2023-01-24 07:45:17.246718: step: 1112/530, loss: 0.0083364462479949 2023-01-24 07:45:18.282862: step: 1116/530, loss: 0.0023572510108351707 2023-01-24 07:45:19.339005: step: 1120/530, loss: 0.00036582129541784525 2023-01-24 07:45:20.385266: step: 1124/530, loss: 0.009437032975256443 2023-01-24 07:45:21.440963: step: 1128/530, loss: 0.0021231600549072027 2023-01-24 07:45:22.502300: step: 1132/530, loss: 0.0014759768964722753 2023-01-24 07:45:23.566305: step: 1136/530, loss: 0.0016669026808813214 2023-01-24 07:45:24.626464: step: 1140/530, loss: 0.000987692386843264 2023-01-24 07:45:25.682349: step: 1144/530, loss: 0.0006102340994402766 2023-01-24 07:45:26.724170: step: 1148/530, loss: 0.0050750416703522205 2023-01-24 07:45:27.772779: step: 1152/530, loss: 0.004148300737142563 2023-01-24 07:45:28.826052: step: 1156/530, loss: 8.818758215056732e-05 2023-01-24 07:45:29.879911: step: 1160/530, loss: 0.00031680401298217475 2023-01-24 07:45:30.924780: step: 1164/530, loss: 0.005485094152390957 2023-01-24 07:45:31.959723: step: 1168/530, loss: 0.001176755758933723 2023-01-24 07:45:33.009845: step: 1172/530, loss: 0.01726360246539116 2023-01-24 07:45:34.056309: step: 1176/530, loss: 0.00626567006111145 2023-01-24 07:45:35.105135: step: 1180/530, loss: 0.005810895003378391 2023-01-24 07:45:36.140838: step: 1184/530, loss: 0.00011842435196740553 2023-01-24 07:45:37.201969: step: 1188/530, loss: 0.03415227681398392 2023-01-24 07:45:38.248060: step: 1192/530, loss: 0.004371089395135641 2023-01-24 07:45:39.292599: step: 1196/530, loss: 0.013393866829574108 2023-01-24 07:45:40.348756: step: 1200/530, loss: 0.003492301795631647 2023-01-24 07:45:41.391444: step: 1204/530, loss: 0.027621056884527206 2023-01-24 07:45:42.456468: step: 1208/530, loss: 0.006727175787091255 2023-01-24 07:45:43.509509: step: 1212/530, loss: 0.016643723472952843 2023-01-24 07:45:44.557037: step: 1216/530, loss: 0.0009906409541144967 2023-01-24 07:45:45.599417: step: 1220/530, loss: 0.002239114372059703 2023-01-24 07:45:46.635213: step: 1224/530, loss: 0.002180964918807149 2023-01-24 07:45:47.676873: step: 1228/530, loss: 0.007498615887016058 2023-01-24 07:45:48.718823: step: 1232/530, loss: 7.95206051407149e-06 2023-01-24 07:45:49.762634: step: 1236/530, loss: 0.0028945051599293947 2023-01-24 07:45:50.803354: step: 1240/530, loss: 0.0017162695294246078 2023-01-24 07:45:51.860690: step: 1244/530, loss: 0.0003706467105075717 2023-01-24 07:45:52.908278: step: 1248/530, loss: 0.0062610381282866 2023-01-24 07:45:53.952079: step: 1252/530, loss: 0.008994611911475658 2023-01-24 07:45:54.999694: step: 1256/530, loss: 0.001414175727404654 2023-01-24 07:45:56.037229: step: 1260/530, loss: 0.010115209966897964 2023-01-24 07:45:57.082618: step: 1264/530, loss: 0.002679947530850768 2023-01-24 07:45:58.123016: step: 1268/530, loss: 0.0018600476905703545 2023-01-24 07:45:59.161240: step: 1272/530, loss: 0.0004839859320782125 2023-01-24 07:46:00.207352: step: 1276/530, loss: 0.0006661342922598124 2023-01-24 07:46:01.264386: step: 1280/530, loss: 0.0004133051843382418 2023-01-24 07:46:02.310770: step: 1284/530, loss: 0.01169020589441061 2023-01-24 07:46:03.380949: step: 1288/530, loss: 0.0038833527360111475 2023-01-24 07:46:04.410890: step: 1292/530, loss: 0.0001987712166737765 2023-01-24 07:46:05.451665: step: 1296/530, loss: 0.004742329008877277 2023-01-24 07:46:06.495541: step: 1300/530, loss: 0.00645976047962904 2023-01-24 07:46:07.516172: step: 1304/530, loss: 0.0025145760737359524 2023-01-24 07:46:08.553867: step: 1308/530, loss: 0.00340718450024724 2023-01-24 07:46:09.583190: step: 1312/530, loss: 3.2552591164858313e-06 2023-01-24 07:46:10.620482: step: 1316/530, loss: 3.858712443616241e-05 2023-01-24 07:46:11.679927: step: 1320/530, loss: 0.10316751897335052 2023-01-24 07:46:12.715693: step: 1324/530, loss: 0.01041797362267971 2023-01-24 07:46:13.765288: step: 1328/530, loss: 0.021871104836463928 2023-01-24 07:46:14.804996: step: 1332/530, loss: 0.004269781522452831 2023-01-24 07:46:15.844597: step: 1336/530, loss: 0.0006900060107000172 2023-01-24 07:46:16.882676: step: 1340/530, loss: 0.007187479175627232 2023-01-24 07:46:17.906345: step: 1344/530, loss: 0.0028446244541555643 2023-01-24 07:46:18.979023: step: 1348/530, loss: 0.027358926832675934 2023-01-24 07:46:20.019471: step: 1352/530, loss: 0.0019490565173327923 2023-01-24 07:46:21.065768: step: 1356/530, loss: 0.01167477946728468 2023-01-24 07:46:22.123229: step: 1360/530, loss: 0.008325232192873955 2023-01-24 07:46:23.168660: step: 1364/530, loss: 0.006251713261008263 2023-01-24 07:46:24.231104: step: 1368/530, loss: 1.9401213648961857e-06 2023-01-24 07:46:25.284532: step: 1372/530, loss: 0.005534324795007706 2023-01-24 07:46:26.346955: step: 1376/530, loss: 0.01440263818949461 2023-01-24 07:46:27.402046: step: 1380/530, loss: 0.008540664799511433 2023-01-24 07:46:28.460703: step: 1384/530, loss: 0.0006516218418255448 2023-01-24 07:46:29.523578: step: 1388/530, loss: 0.02173752896487713 2023-01-24 07:46:30.564276: step: 1392/530, loss: 0.0027636161539703608 2023-01-24 07:46:31.594560: step: 1396/530, loss: 0.00596939492970705 2023-01-24 07:46:32.636659: step: 1400/530, loss: 0.010441185906529427 2023-01-24 07:46:33.675521: step: 1404/530, loss: 0.014863350428640842 2023-01-24 07:46:34.724611: step: 1408/530, loss: 0.001951046520844102 2023-01-24 07:46:35.777155: step: 1412/530, loss: 0.005583907011896372 2023-01-24 07:46:36.805278: step: 1416/530, loss: 0.002855088096112013 2023-01-24 07:46:37.833130: step: 1420/530, loss: 0.0049894885160028934 2023-01-24 07:46:38.877007: step: 1424/530, loss: 0.0006128315581008792 2023-01-24 07:46:39.907060: step: 1428/530, loss: 0.00333867478184402 2023-01-24 07:46:40.954136: step: 1432/530, loss: 0.016556404531002045 2023-01-24 07:46:42.003346: step: 1436/530, loss: 0.015891462564468384 2023-01-24 07:46:43.040479: step: 1440/530, loss: 0.0013385652564466 2023-01-24 07:46:44.072473: step: 1444/530, loss: 0.0011590908979997039 2023-01-24 07:46:45.104425: step: 1448/530, loss: 2.591070256130479e-07 2023-01-24 07:46:46.149518: step: 1452/530, loss: 0.0024300680961459875 2023-01-24 07:46:47.195522: step: 1456/530, loss: 0.0007945887045934796 2023-01-24 07:46:48.230487: step: 1460/530, loss: 0.0009450240177102387 2023-01-24 07:46:49.264107: step: 1464/530, loss: 0.01220585498958826 2023-01-24 07:46:50.290699: step: 1468/530, loss: 0.00014535269292537123 2023-01-24 07:46:51.322460: step: 1472/530, loss: 0.003059492679312825 2023-01-24 07:46:52.379449: step: 1476/530, loss: 0.005597684998065233 2023-01-24 07:46:53.413250: step: 1480/530, loss: 0.0032327519729733467 2023-01-24 07:46:54.459582: step: 1484/530, loss: 0.005534071940928698 2023-01-24 07:46:55.505353: step: 1488/530, loss: 0.009242421016097069 2023-01-24 07:46:56.541676: step: 1492/530, loss: 0.0017967646708711982 2023-01-24 07:46:57.563995: step: 1496/530, loss: 0.0014293482527136803 2023-01-24 07:46:58.613168: step: 1500/530, loss: 0.0018570758402347565 2023-01-24 07:46:59.649845: step: 1504/530, loss: 0.0012327064760029316 2023-01-24 07:47:00.701421: step: 1508/530, loss: 0.0006538216257467866 2023-01-24 07:47:01.746663: step: 1512/530, loss: 0.002998492680490017 2023-01-24 07:47:02.779163: step: 1516/530, loss: 0.0007727608899585903 2023-01-24 07:47:03.825114: step: 1520/530, loss: 0.0029330395627766848 2023-01-24 07:47:04.875786: step: 1524/530, loss: 0.00407476257532835 2023-01-24 07:47:05.918334: step: 1528/530, loss: 0.0021292457822710276 2023-01-24 07:47:06.951182: step: 1532/530, loss: 0.00473290029913187 2023-01-24 07:47:08.001841: step: 1536/530, loss: 0.007184077054262161 2023-01-24 07:47:09.049446: step: 1540/530, loss: 0.005728963762521744 2023-01-24 07:47:10.075031: step: 1544/530, loss: 0.00018021403229795396 2023-01-24 07:47:11.124817: step: 1548/530, loss: 0.03402888774871826 2023-01-24 07:47:12.162239: step: 1552/530, loss: 0.005641507916152477 2023-01-24 07:47:13.213574: step: 1556/530, loss: 0.006954981479793787 2023-01-24 07:47:14.260929: step: 1560/530, loss: 0.002068853471428156 2023-01-24 07:47:15.293030: step: 1564/530, loss: 7.593764166813344e-05 2023-01-24 07:47:16.362144: step: 1568/530, loss: 0.003554497379809618 2023-01-24 07:47:17.406410: step: 1572/530, loss: 0.0005778810009360313 2023-01-24 07:47:18.467354: step: 1576/530, loss: 0.0022768541239202023 2023-01-24 07:47:19.504291: step: 1580/530, loss: 0.0015208704862743616 2023-01-24 07:47:20.545922: step: 1584/530, loss: 0.005875979550182819 2023-01-24 07:47:21.586133: step: 1588/530, loss: 0.005047973711043596 2023-01-24 07:47:22.623575: step: 1592/530, loss: 0.011728701181709766 2023-01-24 07:47:23.676364: step: 1596/530, loss: 0.0011360831558704376 2023-01-24 07:47:24.717714: step: 1600/530, loss: 2.102630560329999e-06 2023-01-24 07:47:25.763414: step: 1604/530, loss: 0.003437940962612629 2023-01-24 07:47:26.806985: step: 1608/530, loss: 0.003398310160264373 2023-01-24 07:47:27.827116: step: 1612/530, loss: 4.358696605777368e-05 2023-01-24 07:47:28.876546: step: 1616/530, loss: 0.0004393762210384011 2023-01-24 07:47:29.959296: step: 1620/530, loss: 0.0056333960965275764 2023-01-24 07:47:31.006971: step: 1624/530, loss: 0.001232057809829712 2023-01-24 07:47:32.035978: step: 1628/530, loss: 0.005570483393967152 2023-01-24 07:47:33.080318: step: 1632/530, loss: 0.005351976025849581 2023-01-24 07:47:34.117496: step: 1636/530, loss: 0.0009466410847380757 2023-01-24 07:47:35.155950: step: 1640/530, loss: 0.0029156797099858522 2023-01-24 07:47:36.190908: step: 1644/530, loss: 0.00151121208909899 2023-01-24 07:47:37.245274: step: 1648/530, loss: 0.007095366716384888 2023-01-24 07:47:38.291330: step: 1652/530, loss: 0.0005021628458052874 2023-01-24 07:47:39.329090: step: 1656/530, loss: 8.454511407762766e-05 2023-01-24 07:47:40.392126: step: 1660/530, loss: 0.008493185043334961 2023-01-24 07:47:41.425560: step: 1664/530, loss: 0.0021600769832730293 2023-01-24 07:47:42.468871: step: 1668/530, loss: 0.004124830476939678 2023-01-24 07:47:43.511081: step: 1672/530, loss: 0.0038572305347770452 2023-01-24 07:47:44.538549: step: 1676/530, loss: 0.0003642990777734667 2023-01-24 07:47:45.592036: step: 1680/530, loss: 0.0005445689894258976 2023-01-24 07:47:46.625769: step: 1684/530, loss: 0.005153903737664223 2023-01-24 07:47:47.714288: step: 1688/530, loss: 0.007264290004968643 2023-01-24 07:47:48.758447: step: 1692/530, loss: 0.0027415661606937647 2023-01-24 07:47:49.803529: step: 1696/530, loss: 0.00010127613495569676 2023-01-24 07:47:50.849523: step: 1700/530, loss: 0.0060294982977211475 2023-01-24 07:47:51.891413: step: 1704/530, loss: 0.008547945879399776 2023-01-24 07:47:52.947019: step: 1708/530, loss: 0.00027285379474051297 2023-01-24 07:47:53.984506: step: 1712/530, loss: 0.0028091531712561846 2023-01-24 07:47:55.028737: step: 1716/530, loss: 6.0254136769799516e-05 2023-01-24 07:47:56.078655: step: 1720/530, loss: 0.003719775006175041 2023-01-24 07:47:57.126680: step: 1724/530, loss: 0.001921151066198945 2023-01-24 07:47:58.164461: step: 1728/530, loss: 0.0026825922541320324 2023-01-24 07:47:59.205547: step: 1732/530, loss: 0.00022626893769484013 2023-01-24 07:48:00.244853: step: 1736/530, loss: 0.0005456481594592333 2023-01-24 07:48:01.269555: step: 1740/530, loss: 0.00511472811922431 2023-01-24 07:48:02.310369: step: 1744/530, loss: 0.011158404871821404 2023-01-24 07:48:03.375479: step: 1748/530, loss: 5.462756234919652e-06 2023-01-24 07:48:04.419244: step: 1752/530, loss: 0.0012531798565760255 2023-01-24 07:48:05.454844: step: 1756/530, loss: 0.0013562203384935856 2023-01-24 07:48:06.490144: step: 1760/530, loss: 0.0006840457790531218 2023-01-24 07:48:07.532958: step: 1764/530, loss: 1.9554627215256914e-05 2023-01-24 07:48:08.570332: step: 1768/530, loss: 0.0064858742989599705 2023-01-24 07:48:09.610217: step: 1772/530, loss: 0.0017773398431017995 2023-01-24 07:48:10.634787: step: 1776/530, loss: 0.010962901636958122 2023-01-24 07:48:11.673737: step: 1780/530, loss: 0.0016993449535220861 2023-01-24 07:48:12.713239: step: 1784/530, loss: 0.000713059795089066 2023-01-24 07:48:13.767228: step: 1788/530, loss: 0.001429026946425438 2023-01-24 07:48:14.798342: step: 1792/530, loss: 0.0017729275859892368 2023-01-24 07:48:15.853573: step: 1796/530, loss: 0.006913549266755581 2023-01-24 07:48:16.899491: step: 1800/530, loss: 0.028466973453760147 2023-01-24 07:48:17.931523: step: 1804/530, loss: 0.005895878188312054 2023-01-24 07:48:18.971224: step: 1808/530, loss: 0.0002944791631307453 2023-01-24 07:48:20.021722: step: 1812/530, loss: 0.0014753293944522738 2023-01-24 07:48:21.054218: step: 1816/530, loss: 4.284674650989473e-05 2023-01-24 07:48:22.085563: step: 1820/530, loss: 0.004026878625154495 2023-01-24 07:48:23.112286: step: 1824/530, loss: 0.0038042047526687384 2023-01-24 07:48:24.140609: step: 1828/530, loss: 0.000867285649292171 2023-01-24 07:48:25.193393: step: 1832/530, loss: 0.004134317394345999 2023-01-24 07:48:26.236243: step: 1836/530, loss: 0.002293369034305215 2023-01-24 07:48:27.286420: step: 1840/530, loss: 0.006302934139966965 2023-01-24 07:48:28.315671: step: 1844/530, loss: 0.0001471473806304857 2023-01-24 07:48:29.357572: step: 1848/530, loss: 0.008634034544229507 2023-01-24 07:48:30.403772: step: 1852/530, loss: 0.0008669691160321236 2023-01-24 07:48:31.449251: step: 1856/530, loss: 0.0010020699119195342 2023-01-24 07:48:32.504879: step: 1860/530, loss: 0.0005832889582961798 2023-01-24 07:48:33.542441: step: 1864/530, loss: 0.010718967765569687 2023-01-24 07:48:34.583964: step: 1868/530, loss: 0.000633514893706888 2023-01-24 07:48:35.617404: step: 1872/530, loss: 0.0030884321313351393 2023-01-24 07:48:36.667750: step: 1876/530, loss: 0.004053754266351461 2023-01-24 07:48:37.706352: step: 1880/530, loss: 0.004757086746394634 2023-01-24 07:48:38.749271: step: 1884/530, loss: 0.012511016800999641 2023-01-24 07:48:39.774315: step: 1888/530, loss: 2.1465699319378473e-05 2023-01-24 07:48:40.799254: step: 1892/530, loss: 0.0010633196216076612 2023-01-24 07:48:41.850131: step: 1896/530, loss: 0.010909922420978546 2023-01-24 07:48:42.888605: step: 1900/530, loss: 0.0042119137942790985 2023-01-24 07:48:43.926225: step: 1904/530, loss: 0.0013723624870181084 2023-01-24 07:48:44.978864: step: 1908/530, loss: 5.691273327101953e-05 2023-01-24 07:48:46.013647: step: 1912/530, loss: 0.003312408924102783 2023-01-24 07:48:47.075455: step: 1916/530, loss: 0.0020297765731811523 2023-01-24 07:48:48.124287: step: 1920/530, loss: 0.018630992621183395 2023-01-24 07:48:49.167479: step: 1924/530, loss: 0.002299703424796462 2023-01-24 07:48:50.192916: step: 1928/530, loss: 0.01734558679163456 2023-01-24 07:48:51.231693: step: 1932/530, loss: 0.008692233823239803 2023-01-24 07:48:52.256029: step: 1936/530, loss: 0.009354210458695889 2023-01-24 07:48:53.294576: step: 1940/530, loss: 0.0015004929155111313 2023-01-24 07:48:54.338344: step: 1944/530, loss: 0.003547100583091378 2023-01-24 07:48:55.371822: step: 1948/530, loss: 0.0008395725744776428 2023-01-24 07:48:56.408333: step: 1952/530, loss: 0.007419206667691469 2023-01-24 07:48:57.451099: step: 1956/530, loss: 0.0030893306247889996 2023-01-24 07:48:58.503294: step: 1960/530, loss: 1.90397822734667e-05 2023-01-24 07:48:59.537376: step: 1964/530, loss: 0.0006726476131007075 2023-01-24 07:49:00.586495: step: 1968/530, loss: 0.002564217895269394 2023-01-24 07:49:01.617740: step: 1972/530, loss: 0.004953647032380104 2023-01-24 07:49:02.659272: step: 1976/530, loss: 0.00026036237250082195 2023-01-24 07:49:03.711386: step: 1980/530, loss: 0.003146646311506629 2023-01-24 07:49:04.774241: step: 1984/530, loss: 0.026527967303991318 2023-01-24 07:49:05.808070: step: 1988/530, loss: 0.003269575070589781 2023-01-24 07:49:06.866781: step: 1992/530, loss: 0.0112005565315485 2023-01-24 07:49:07.920449: step: 1996/530, loss: 0.0024370155297219753 2023-01-24 07:49:08.951315: step: 2000/530, loss: 0.0017816127510741353 2023-01-24 07:49:10.012273: step: 2004/530, loss: 0.0002463326964061707 2023-01-24 07:49:11.056934: step: 2008/530, loss: 0.025541674345731735 2023-01-24 07:49:12.091673: step: 2012/530, loss: 0.007038659881800413 2023-01-24 07:49:13.138504: step: 2016/530, loss: 0.0030720599461346865 2023-01-24 07:49:14.176976: step: 2020/530, loss: 0.01581084169447422 2023-01-24 07:49:15.218304: step: 2024/530, loss: 0.0034938957542181015 2023-01-24 07:49:16.271032: step: 2028/530, loss: 0.0050782994367182255 2023-01-24 07:49:17.324397: step: 2032/530, loss: 0.00661267526447773 2023-01-24 07:49:18.393999: step: 2036/530, loss: 0.0016580792143940926 2023-01-24 07:49:19.455256: step: 2040/530, loss: 0.0030666871462017298 2023-01-24 07:49:20.490165: step: 2044/530, loss: 0.00020061011309735477 2023-01-24 07:49:21.536141: step: 2048/530, loss: 0.0020251853857189417 2023-01-24 07:49:22.577911: step: 2052/530, loss: 0.0023325940128415823 2023-01-24 07:49:23.636894: step: 2056/530, loss: 0.004989034961909056 2023-01-24 07:49:24.676682: step: 2060/530, loss: 0.00042098373523913324 2023-01-24 07:49:25.705961: step: 2064/530, loss: 0.0002676958392839879 2023-01-24 07:49:26.751494: step: 2068/530, loss: 0.005194572266191244 2023-01-24 07:49:27.786660: step: 2072/530, loss: 0.011506150476634502 2023-01-24 07:49:28.814360: step: 2076/530, loss: 0.0025587156414985657 2023-01-24 07:49:29.870208: step: 2080/530, loss: 0.009145993739366531 2023-01-24 07:49:30.927834: step: 2084/530, loss: 0.008899924345314503 2023-01-24 07:49:31.968586: step: 2088/530, loss: 0.0058839889243245125 2023-01-24 07:49:33.015466: step: 2092/530, loss: 0.0015116475988179445 2023-01-24 07:49:34.060483: step: 2096/530, loss: 0.007068545091897249 2023-01-24 07:49:35.108154: step: 2100/530, loss: 0.004713758826255798 2023-01-24 07:49:36.159644: step: 2104/530, loss: 0.017527861520648003 2023-01-24 07:49:37.214389: step: 2108/530, loss: 0.006133155431598425 2023-01-24 07:49:38.282241: step: 2112/530, loss: 0.006350258830934763 2023-01-24 07:49:39.322471: step: 2116/530, loss: 0.0026042740792036057 2023-01-24 07:49:40.366649: step: 2120/530, loss: 0.00734981382265687 ================================================== Loss: 0.005 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37371404867256636, 'r': 0.32052893738140414, 'f1': 0.34508426966292133}, 'combined': 0.25427261975162624, 'stategy': 1, 'epoch': 14} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37292775203343065, 'r': 0.38869491802013817, 'f1': 0.3806481285381731}, 'combined': 0.2950478316898758, 'stategy': 1, 'epoch': 14} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3856567460317461, 'r': 0.32930841691515317, 'f1': 0.35526209972218165}, 'combined': 0.26177207347950227, 'stategy': 1, 'epoch': 14} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3726981128747585, 'r': 0.37030023898677755, 'f1': 0.3714953066091415}, 'combined': 0.28795329985971735, 'stategy': 1, 'epoch': 14} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3783300247486909, 'r': 0.329513247361763, 'f1': 0.3522382989039536}, 'combined': 0.2595440097187026, 'stategy': 1, 'epoch': 14} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3599945721881326, 'r': 0.36231071373713714, 'f1': 0.36114892949702726}, 'combined': 0.2799336199929111, 'stategy': 1, 'epoch': 14} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 14} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.475, 'r': 0.41304347826086957, 'f1': 0.44186046511627913}, 'combined': 0.22093023255813957, 'stategy': 1, 'epoch': 14} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 14} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37786862527716186, 'r': 0.32337523719165084, 'f1': 0.3485046012269939}, 'combined': 0.2567928640619955, 'stategy': 1, 'epoch': 12} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37377987703702326, 'r': 0.38889597500543227, 'f1': 0.3811881268521715}, 'combined': 0.2954663949763244, 'stategy': 1, 'epoch': 12} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 12} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38720415311180817, 'r': 0.33283393047371745, 'f1': 0.35796628848907985}, 'combined': 0.26376463362353253, 'stategy': 1, 'epoch': 8} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36421427197230394, 'r': 0.3625404931489018, 'f1': 0.3633754551322019}, 'combined': 0.28165944369098905, 'stategy': 1, 'epoch': 8} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 8} ****************************** Epoch: 15 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 07:52:04.643392: step: 4/530, loss: 0.006728241220116615 2023-01-24 07:52:05.697501: step: 8/530, loss: 0.01092079933732748 2023-01-24 07:52:06.752757: step: 12/530, loss: 0.003687224816530943 2023-01-24 07:52:07.774753: step: 16/530, loss: 0.0019325496396049857 2023-01-24 07:52:08.815368: step: 20/530, loss: 0.0032276909332722425 2023-01-24 07:52:09.838579: step: 24/530, loss: 0.0020119063556194305 2023-01-24 07:52:10.887978: step: 28/530, loss: 0.003910745959728956 2023-01-24 07:52:11.922401: step: 32/530, loss: 0.007735200226306915 2023-01-24 07:52:12.959508: step: 36/530, loss: 0.0019700652919709682 2023-01-24 07:52:13.994535: step: 40/530, loss: 0.007898872718214989 2023-01-24 07:52:15.037274: step: 44/530, loss: 0.0018007050966843963 2023-01-24 07:52:16.074877: step: 48/530, loss: 0.06393536180257797 2023-01-24 07:52:17.112178: step: 52/530, loss: 0.003908275160938501 2023-01-24 07:52:18.139677: step: 56/530, loss: 0.0007549480069428682 2023-01-24 07:52:19.195773: step: 60/530, loss: 0.005105209536850452 2023-01-24 07:52:20.242710: step: 64/530, loss: 0.0015098523581400514 2023-01-24 07:52:21.283558: step: 68/530, loss: 1.981997411348857e-05 2023-01-24 07:52:22.331417: step: 72/530, loss: 0.0007663294090889394 2023-01-24 07:52:23.372971: step: 76/530, loss: 0.0018295961199328303 2023-01-24 07:52:24.415973: step: 80/530, loss: 0.003032487351447344 2023-01-24 07:52:25.452349: step: 84/530, loss: 0.005615803878754377 2023-01-24 07:52:26.515679: step: 88/530, loss: 0.000449291430413723 2023-01-24 07:52:27.556371: step: 92/530, loss: 0.002229244913905859 2023-01-24 07:52:28.589658: step: 96/530, loss: 0.0018482328159734607 2023-01-24 07:52:29.632371: step: 100/530, loss: 0.007176647428423166 2023-01-24 07:52:30.666985: step: 104/530, loss: 0.0023082057014107704 2023-01-24 07:52:31.738845: step: 108/530, loss: 0.005674582906067371 2023-01-24 07:52:32.777083: step: 112/530, loss: 0.003943182993680239 2023-01-24 07:52:33.821440: step: 116/530, loss: 0.005425735376775265 2023-01-24 07:52:34.868377: step: 120/530, loss: 0.001288491184823215 2023-01-24 07:52:35.923829: step: 124/530, loss: 0.0022611620370298624 2023-01-24 07:52:36.966070: step: 128/530, loss: 0.000500692636705935 2023-01-24 07:52:38.025722: step: 132/530, loss: 9.355145448353142e-05 2023-01-24 07:52:39.058970: step: 136/530, loss: 0.009377521462738514 2023-01-24 07:52:40.116788: step: 140/530, loss: 0.0005079037509858608 2023-01-24 07:52:41.159607: step: 144/530, loss: 0.0032796585001051426 2023-01-24 07:52:42.194931: step: 148/530, loss: 0.00315141212195158 2023-01-24 07:52:43.258264: step: 152/530, loss: 0.0002355034666834399 2023-01-24 07:52:44.302153: step: 156/530, loss: 0.006104033440351486 2023-01-24 07:52:45.349122: step: 160/530, loss: 0.005844739731401205 2023-01-24 07:52:46.402020: step: 164/530, loss: 0.003568240674212575 2023-01-24 07:52:47.424022: step: 168/530, loss: 0.0025225516874343157 2023-01-24 07:52:48.470566: step: 172/530, loss: 0.00638723885640502 2023-01-24 07:52:49.508249: step: 176/530, loss: 0.0003313054039608687 2023-01-24 07:52:50.536897: step: 180/530, loss: 0.0011914032511413097 2023-01-24 07:52:51.566129: step: 184/530, loss: 0.0013044987572357059 2023-01-24 07:52:52.601633: step: 188/530, loss: 9.945756755769253e-05 2023-01-24 07:52:53.640995: step: 192/530, loss: 6.864780516480096e-06 2023-01-24 07:52:54.679308: step: 196/530, loss: 0.002715484704822302 2023-01-24 07:52:55.717700: step: 200/530, loss: 0.0010256976820528507 2023-01-24 07:52:56.767490: step: 204/530, loss: 2.1096932414366165e-06 2023-01-24 07:52:57.801259: step: 208/530, loss: 0.008246565237641335 2023-01-24 07:52:58.844921: step: 212/530, loss: 0.012566031888127327 2023-01-24 07:52:59.892162: step: 216/530, loss: 0.0030449607875198126 2023-01-24 07:53:00.943203: step: 220/530, loss: 0.0015749752055853605 2023-01-24 07:53:01.975988: step: 224/530, loss: 0.0020285595674067736 2023-01-24 07:53:03.013410: step: 228/530, loss: 0.0001254546077689156 2023-01-24 07:53:04.079307: step: 232/530, loss: 0.005158832296729088 2023-01-24 07:53:05.118822: step: 236/530, loss: 0.00013074540765956044 2023-01-24 07:53:06.162154: step: 240/530, loss: 0.0013885352527722716 2023-01-24 07:53:07.204892: step: 244/530, loss: 0.003860518801957369 2023-01-24 07:53:08.255583: step: 248/530, loss: 0.010055194608867168 2023-01-24 07:53:09.290827: step: 252/530, loss: 0.0008981186547316611 2023-01-24 07:53:10.339021: step: 256/530, loss: 0.002441010670736432 2023-01-24 07:53:11.384952: step: 260/530, loss: 0.015143767930567265 2023-01-24 07:53:12.447619: step: 264/530, loss: 0.0032985215075314045 2023-01-24 07:53:13.501372: step: 268/530, loss: 0.02295239083468914 2023-01-24 07:53:14.540630: step: 272/530, loss: 0.00016630797472316772 2023-01-24 07:53:15.590944: step: 276/530, loss: 0.0017587675247341394 2023-01-24 07:53:16.641400: step: 280/530, loss: 0.002919380320236087 2023-01-24 07:53:17.696227: step: 284/530, loss: 0.005225224420428276 2023-01-24 07:53:18.734522: step: 288/530, loss: 0.00294761685654521 2023-01-24 07:53:19.779094: step: 292/530, loss: 0.004382021725177765 2023-01-24 07:53:20.829296: step: 296/530, loss: 0.00557662034407258 2023-01-24 07:53:21.873969: step: 300/530, loss: 0.004200521856546402 2023-01-24 07:53:22.922457: step: 304/530, loss: 0.005391261074692011 2023-01-24 07:53:23.975143: step: 308/530, loss: 0.0035750262904912233 2023-01-24 07:53:25.009139: step: 312/530, loss: 0.012020302005112171 2023-01-24 07:53:26.037059: step: 316/530, loss: 0.0011893701739609241 2023-01-24 07:53:27.078922: step: 320/530, loss: 0.004335054196417332 2023-01-24 07:53:28.138649: step: 324/530, loss: 0.004338924307376146 2023-01-24 07:53:29.166382: step: 328/530, loss: 0.0004685973981395364 2023-01-24 07:53:30.208670: step: 332/530, loss: 0.0003985729708801955 2023-01-24 07:53:31.255375: step: 336/530, loss: 0.0013948632404208183 2023-01-24 07:53:32.294339: step: 340/530, loss: 0.006275718100368977 2023-01-24 07:53:33.334406: step: 344/530, loss: 0.001678474247455597 2023-01-24 07:53:34.388021: step: 348/530, loss: 0.013294276781380177 2023-01-24 07:53:35.438073: step: 352/530, loss: 0.0016472446732223034 2023-01-24 07:53:36.474412: step: 356/530, loss: 0.00019753299420699477 2023-01-24 07:53:37.519026: step: 360/530, loss: 0.00040297757368534803 2023-01-24 07:53:38.569655: step: 364/530, loss: 0.002236692002043128 2023-01-24 07:53:39.616426: step: 368/530, loss: 1.7517317246529274e-05 2023-01-24 07:53:40.666366: step: 372/530, loss: 0.0028147606644779444 2023-01-24 07:53:41.702510: step: 376/530, loss: 0.00019868843082804233 2023-01-24 07:53:42.768494: step: 380/530, loss: 0.0013912011636421084 2023-01-24 07:53:43.812659: step: 384/530, loss: 0.0004567632277030498 2023-01-24 07:53:44.855003: step: 388/530, loss: 0.0024846189189702272 2023-01-24 07:53:45.891596: step: 392/530, loss: 0.0014706613728776574 2023-01-24 07:53:46.927345: step: 396/530, loss: 0.0025192908942699432 2023-01-24 07:53:47.946939: step: 400/530, loss: 1.0619334716466255e-05 2023-01-24 07:53:48.980279: step: 404/530, loss: 0.005221816711127758 2023-01-24 07:53:50.019540: step: 408/530, loss: 0.0032732728868722916 2023-01-24 07:53:51.055720: step: 412/530, loss: 0.0005614410038106143 2023-01-24 07:53:52.116868: step: 416/530, loss: 0.0005032513290643692 2023-01-24 07:53:53.166364: step: 420/530, loss: 0.00025666714645922184 2023-01-24 07:53:54.197178: step: 424/530, loss: 1.5104700651136227e-05 2023-01-24 07:53:55.249786: step: 428/530, loss: 0.004815563093870878 2023-01-24 07:53:56.292620: step: 432/530, loss: 0.007909965701401234 2023-01-24 07:53:57.336475: step: 436/530, loss: 0.008411350660026073 2023-01-24 07:53:58.379118: step: 440/530, loss: 0.006662989035248756 2023-01-24 07:53:59.443857: step: 444/530, loss: 0.0008969720802269876 2023-01-24 07:54:00.516461: step: 448/530, loss: 0.0075895884074270725 2023-01-24 07:54:01.552337: step: 452/530, loss: 0.00031008778023533523 2023-01-24 07:54:02.599753: step: 456/530, loss: 0.0025365797337144613 2023-01-24 07:54:03.652574: step: 460/530, loss: 0.0006420926656574011 2023-01-24 07:54:04.699155: step: 464/530, loss: 0.00015697900380473584 2023-01-24 07:54:05.730012: step: 468/530, loss: 0.0003105918294750154 2023-01-24 07:54:06.781155: step: 472/530, loss: 0.003746391274034977 2023-01-24 07:54:07.822592: step: 476/530, loss: 0.0019301745342090726 2023-01-24 07:54:08.867539: step: 480/530, loss: 0.001170346513390541 2023-01-24 07:54:09.915669: step: 484/530, loss: 0.0064259907230734825 2023-01-24 07:54:10.967488: step: 488/530, loss: 0.010905269533395767 2023-01-24 07:54:12.012071: step: 492/530, loss: 0.002635349752381444 2023-01-24 07:54:13.046804: step: 496/530, loss: 0.0010565104894340038 2023-01-24 07:54:14.100898: step: 500/530, loss: 0.0025665778666734695 2023-01-24 07:54:15.154516: step: 504/530, loss: 0.0015071381349116564 2023-01-24 07:54:16.194807: step: 508/530, loss: 0.004104041960090399 2023-01-24 07:54:17.262203: step: 512/530, loss: 0.0004766838683281094 2023-01-24 07:54:18.300259: step: 516/530, loss: 0.01006765104830265 2023-01-24 07:54:19.345905: step: 520/530, loss: 0.01131446287035942 2023-01-24 07:54:20.420256: step: 524/530, loss: 0.002806006232276559 2023-01-24 07:54:21.462998: step: 528/530, loss: 0.004344320390373468 2023-01-24 07:54:22.506436: step: 532/530, loss: 0.004885183647274971 2023-01-24 07:54:23.552500: step: 536/530, loss: 0.0044850255362689495 2023-01-24 07:54:24.605845: step: 540/530, loss: 0.0004967250279150903 2023-01-24 07:54:25.658569: step: 544/530, loss: 0.003474026918411255 2023-01-24 07:54:26.703136: step: 548/530, loss: 0.008976250886917114 2023-01-24 07:54:27.746704: step: 552/530, loss: 0.00419862475246191 2023-01-24 07:54:28.792507: step: 556/530, loss: 0.002195636974647641 2023-01-24 07:54:29.834566: step: 560/530, loss: 0.0006492839311249554 2023-01-24 07:54:30.870314: step: 564/530, loss: 0.0010503239464014769 2023-01-24 07:54:31.898144: step: 568/530, loss: 0.0020240566227585077 2023-01-24 07:54:32.975380: step: 572/530, loss: 0.0011131631908938289 2023-01-24 07:54:34.013323: step: 576/530, loss: 0.0005042792181484401 2023-01-24 07:54:35.042605: step: 580/530, loss: 0.0003557713935151696 2023-01-24 07:54:36.094121: step: 584/530, loss: 0.002478155307471752 2023-01-24 07:54:37.131864: step: 588/530, loss: 0.0017400953220203519 2023-01-24 07:54:38.174294: step: 592/530, loss: 0.004249389749020338 2023-01-24 07:54:39.222995: step: 596/530, loss: 0.000572758901398629 2023-01-24 07:54:40.268951: step: 600/530, loss: 0.0101140346378088 2023-01-24 07:54:41.336117: step: 604/530, loss: 0.01079687848687172 2023-01-24 07:54:42.372418: step: 608/530, loss: 7.842260674806312e-05 2023-01-24 07:54:43.411188: step: 612/530, loss: 0.006186159327626228 2023-01-24 07:54:44.450144: step: 616/530, loss: 0.0027700604405254126 2023-01-24 07:54:45.494686: step: 620/530, loss: 0.003830282250419259 2023-01-24 07:54:46.570582: step: 624/530, loss: 0.00231066788546741 2023-01-24 07:54:47.610480: step: 628/530, loss: 0.001095293671824038 2023-01-24 07:54:48.644528: step: 632/530, loss: 0.0016686319140717387 2023-01-24 07:54:49.692385: step: 636/530, loss: 0.004468643572181463 2023-01-24 07:54:50.735547: step: 640/530, loss: 0.00012007312761852518 2023-01-24 07:54:51.779775: step: 644/530, loss: 0.0038229916244745255 2023-01-24 07:54:52.844796: step: 648/530, loss: 0.004569799639284611 2023-01-24 07:54:53.880567: step: 652/530, loss: 0.02937786653637886 2023-01-24 07:54:54.919365: step: 656/530, loss: 0.0012135922443121672 2023-01-24 07:54:55.970970: step: 660/530, loss: 0.01783234067261219 2023-01-24 07:54:57.019972: step: 664/530, loss: 0.001534773618914187 2023-01-24 07:54:58.062135: step: 668/530, loss: 4.680583151639439e-05 2023-01-24 07:54:59.100118: step: 672/530, loss: 0.0006945506320334971 2023-01-24 07:55:00.136722: step: 676/530, loss: 0.001785916625522077 2023-01-24 07:55:01.192845: step: 680/530, loss: 0.0009097285801544785 2023-01-24 07:55:02.243317: step: 684/530, loss: 0.013617118820548058 2023-01-24 07:55:03.282030: step: 688/530, loss: 0.0075601497665047646 2023-01-24 07:55:04.331523: step: 692/530, loss: 0.0013596635544672608 2023-01-24 07:55:05.358500: step: 696/530, loss: 0.00110805022995919 2023-01-24 07:55:06.406239: step: 700/530, loss: 0.00022816112323198467 2023-01-24 07:55:07.444435: step: 704/530, loss: 0.00010371807729825377 2023-01-24 07:55:08.480070: step: 708/530, loss: 0.0001237311662407592 2023-01-24 07:55:09.521000: step: 712/530, loss: 0.00999809056520462 2023-01-24 07:55:10.557271: step: 716/530, loss: 0.0037813351955264807 2023-01-24 07:55:11.600108: step: 720/530, loss: 0.0007650508196093142 2023-01-24 07:55:12.676146: step: 724/530, loss: 0.0012556056026369333 2023-01-24 07:55:13.711684: step: 728/530, loss: 0.0018612620187923312 2023-01-24 07:55:14.756597: step: 732/530, loss: 0.0004626192676369101 2023-01-24 07:55:15.784096: step: 736/530, loss: 0.004837325308471918 2023-01-24 07:55:16.827026: step: 740/530, loss: 0.0045120855793356895 2023-01-24 07:55:17.867379: step: 744/530, loss: 0.0004809291276615113 2023-01-24 07:55:18.896575: step: 748/530, loss: 5.323910227161832e-05 2023-01-24 07:55:19.952569: step: 752/530, loss: 0.0017554813530296087 2023-01-24 07:55:21.001582: step: 756/530, loss: 0.0012749754823744297 2023-01-24 07:55:22.041564: step: 760/530, loss: 0.0012977682054042816 2023-01-24 07:55:23.098340: step: 764/530, loss: 3.463034227024764e-05 2023-01-24 07:55:24.146226: step: 768/530, loss: 0.0042152502574026585 2023-01-24 07:55:25.175112: step: 772/530, loss: 0.0019875760190188885 2023-01-24 07:55:26.203875: step: 776/530, loss: 0.002290158299729228 2023-01-24 07:55:27.235320: step: 780/530, loss: 0.00346802338026464 2023-01-24 07:55:28.273472: step: 784/530, loss: 0.0013296926626935601 2023-01-24 07:55:29.323631: step: 788/530, loss: 0.0002059193648165092 2023-01-24 07:55:30.361962: step: 792/530, loss: 0.0 2023-01-24 07:55:31.401361: step: 796/530, loss: 0.0033771954476833344 2023-01-24 07:55:32.454601: step: 800/530, loss: 0.002392198657616973 2023-01-24 07:55:33.499704: step: 804/530, loss: 0.0033652542624622583 2023-01-24 07:55:34.570024: step: 808/530, loss: 0.005677748937159777 2023-01-24 07:55:35.620297: step: 812/530, loss: 0.0010957029880955815 2023-01-24 07:55:36.648890: step: 816/530, loss: 0.001103114802390337 2023-01-24 07:55:37.701582: step: 820/530, loss: 0.00021666464454028755 2023-01-24 07:55:38.739577: step: 824/530, loss: 0.009038028307259083 2023-01-24 07:55:39.782688: step: 828/530, loss: 0.0003519484307616949 2023-01-24 07:55:40.848251: step: 832/530, loss: 0.001531408284790814 2023-01-24 07:55:41.901229: step: 836/530, loss: 0.002708738436922431 2023-01-24 07:55:42.953378: step: 840/530, loss: 0.0017759923357516527 2023-01-24 07:55:43.999595: step: 844/530, loss: 0.0012091611279174685 2023-01-24 07:55:45.033481: step: 848/530, loss: 0.00458544073626399 2023-01-24 07:55:46.065106: step: 852/530, loss: 0.0015374617651104927 2023-01-24 07:55:47.123475: step: 856/530, loss: 0.0013794736005365849 2023-01-24 07:55:48.162608: step: 860/530, loss: 0.009434523992240429 2023-01-24 07:55:49.207238: step: 864/530, loss: 0.002033942611888051 2023-01-24 07:55:50.242672: step: 868/530, loss: 0.0017239798326045275 2023-01-24 07:55:51.282096: step: 872/530, loss: 0.0002994116803165525 2023-01-24 07:55:52.321109: step: 876/530, loss: 0.0005237242439761758 2023-01-24 07:55:53.371868: step: 880/530, loss: 0.00527963088825345 2023-01-24 07:55:54.428301: step: 884/530, loss: 0.006941282190382481 2023-01-24 07:55:55.485301: step: 888/530, loss: 0.0008123686420731246 2023-01-24 07:55:56.533147: step: 892/530, loss: 7.46598161640577e-05 2023-01-24 07:55:57.573280: step: 896/530, loss: 0.0006259792717173696 2023-01-24 07:55:58.605655: step: 900/530, loss: 6.782382115488872e-05 2023-01-24 07:55:59.656370: step: 904/530, loss: 0.0014336572494357824 2023-01-24 07:56:00.685575: step: 908/530, loss: 0.006972672417759895 2023-01-24 07:56:01.725762: step: 912/530, loss: 0.004512323532253504 2023-01-24 07:56:02.778896: step: 916/530, loss: 1.4524814105243422e-05 2023-01-24 07:56:03.825724: step: 920/530, loss: 0.0013026637025177479 2023-01-24 07:56:04.872118: step: 924/530, loss: 0.0010842892806977034 2023-01-24 07:56:05.907610: step: 928/530, loss: 0.0010095477337017655 2023-01-24 07:56:06.973318: step: 932/530, loss: 0.006881438195705414 2023-01-24 07:56:08.030211: step: 936/530, loss: 0.0007780453306622803 2023-01-24 07:56:09.081952: step: 940/530, loss: 0.002386632142588496 2023-01-24 07:56:10.116996: step: 944/530, loss: 0.004146643448621035 2023-01-24 07:56:11.150173: step: 948/530, loss: 0.020527713000774384 2023-01-24 07:56:12.214746: step: 952/530, loss: 0.004596620332449675 2023-01-24 07:56:13.268657: step: 956/530, loss: 0.0013360029552131891 2023-01-24 07:56:14.335441: step: 960/530, loss: 0.003200882114470005 2023-01-24 07:56:15.386949: step: 964/530, loss: 0.004382890649139881 2023-01-24 07:56:16.433255: step: 968/530, loss: 0.004832218401134014 2023-01-24 07:56:17.462961: step: 972/530, loss: 9.911083907354623e-06 2023-01-24 07:56:18.498261: step: 976/530, loss: 0.0022042514756321907 2023-01-24 07:56:19.527563: step: 980/530, loss: 0.0018994336714968085 2023-01-24 07:56:20.562096: step: 984/530, loss: 0.004117816686630249 2023-01-24 07:56:21.607025: step: 988/530, loss: 0.011310254223644733 2023-01-24 07:56:22.662848: step: 992/530, loss: 0.006619452033191919 2023-01-24 07:56:23.720983: step: 996/530, loss: 0.0003443750028964132 2023-01-24 07:56:24.766605: step: 1000/530, loss: 0.003024142701178789 2023-01-24 07:56:25.823430: step: 1004/530, loss: 0.0006079613231122494 2023-01-24 07:56:26.859509: step: 1008/530, loss: 0.004931787960231304 2023-01-24 07:56:27.903787: step: 1012/530, loss: 0.00228464649990201 2023-01-24 07:56:28.935666: step: 1016/530, loss: 1.127155246649636e-05 2023-01-24 07:56:29.991218: step: 1020/530, loss: 0.007504436653107405 2023-01-24 07:56:31.030072: step: 1024/530, loss: 0.002850524615496397 2023-01-24 07:56:32.070716: step: 1028/530, loss: 0.003923813346773386 2023-01-24 07:56:33.149253: step: 1032/530, loss: 0.0017447317950427532 2023-01-24 07:56:34.195938: step: 1036/530, loss: 0.008256851695477962 2023-01-24 07:56:35.238894: step: 1040/530, loss: 0.00262592569924891 2023-01-24 07:56:36.292583: step: 1044/530, loss: 0.006396498531103134 2023-01-24 07:56:37.322733: step: 1048/530, loss: 7.4719591793837026e-06 2023-01-24 07:56:38.368317: step: 1052/530, loss: 0.007519092410802841 2023-01-24 07:56:39.406259: step: 1056/530, loss: 0.0030573117546737194 2023-01-24 07:56:40.469649: step: 1060/530, loss: 0.008097074925899506 2023-01-24 07:56:41.509326: step: 1064/530, loss: 0.006410520989447832 2023-01-24 07:56:42.558407: step: 1068/530, loss: 0.001324211130850017 2023-01-24 07:56:43.608564: step: 1072/530, loss: 0.0017862874083220959 2023-01-24 07:56:44.644343: step: 1076/530, loss: 0.00012042235175613314 2023-01-24 07:56:45.684327: step: 1080/530, loss: 0.004782073199748993 2023-01-24 07:56:46.733313: step: 1084/530, loss: 0.006423020735383034 2023-01-24 07:56:47.787761: step: 1088/530, loss: 0.006951035000383854 2023-01-24 07:56:48.856844: step: 1092/530, loss: 0.005228972993791103 2023-01-24 07:56:49.912722: step: 1096/530, loss: 0.002004253910854459 2023-01-24 07:56:50.950175: step: 1100/530, loss: 0.0004658708057831973 2023-01-24 07:56:51.983493: step: 1104/530, loss: 0.0015666185645386577 2023-01-24 07:56:53.023591: step: 1108/530, loss: 0.000201524788280949 2023-01-24 07:56:54.057575: step: 1112/530, loss: 0.004110785201191902 2023-01-24 07:56:55.100451: step: 1116/530, loss: 0.000454398657893762 2023-01-24 07:56:56.149940: step: 1120/530, loss: 1.807861917768605e-05 2023-01-24 07:56:57.187116: step: 1124/530, loss: 0.0013572170864790678 2023-01-24 07:56:58.239313: step: 1128/530, loss: 0.015525279566645622 2023-01-24 07:56:59.280216: step: 1132/530, loss: 0.0018248233245685697 2023-01-24 07:57:00.312607: step: 1136/530, loss: 0.0031671100296080112 2023-01-24 07:57:01.358125: step: 1140/530, loss: 0.0015235089231282473 2023-01-24 07:57:02.397079: step: 1144/530, loss: 0.0015720115043222904 2023-01-24 07:57:03.467115: step: 1148/530, loss: 0.003198369173333049 2023-01-24 07:57:04.502509: step: 1152/530, loss: 0.0075254314579069614 2023-01-24 07:57:05.538407: step: 1156/530, loss: 0.0025483807548880577 2023-01-24 07:57:06.574145: step: 1160/530, loss: 0.0008820623625069857 2023-01-24 07:57:07.617801: step: 1164/530, loss: 0.003434132318943739 2023-01-24 07:57:08.648243: step: 1168/530, loss: 0.001195478136651218 2023-01-24 07:57:09.698292: step: 1172/530, loss: 0.0008998954435810447 2023-01-24 07:57:10.748325: step: 1176/530, loss: 0.015672490000724792 2023-01-24 07:57:11.783962: step: 1180/530, loss: 1.0297398148395587e-05 2023-01-24 07:57:12.827877: step: 1184/530, loss: 8.247247933468316e-07 2023-01-24 07:57:13.884464: step: 1188/530, loss: 0.005459130275994539 2023-01-24 07:57:14.924530: step: 1192/530, loss: 0.0014366828836500645 2023-01-24 07:57:15.976826: step: 1196/530, loss: 0.009928080253303051 2023-01-24 07:57:17.032051: step: 1200/530, loss: 0.007221674080938101 2023-01-24 07:57:18.082604: step: 1204/530, loss: 0.0009354190551675856 2023-01-24 07:57:19.133955: step: 1208/530, loss: 0.00037409987999126315 2023-01-24 07:57:20.184884: step: 1212/530, loss: 0.0004136855131946504 2023-01-24 07:57:21.233399: step: 1216/530, loss: 0.006305725779384375 2023-01-24 07:57:22.279825: step: 1220/530, loss: 0.01098248828202486 2023-01-24 07:57:23.317364: step: 1224/530, loss: 0.006228860933333635 2023-01-24 07:57:24.358097: step: 1228/530, loss: 0.0011418212670832872 2023-01-24 07:57:25.410164: step: 1232/530, loss: 0.009525150060653687 2023-01-24 07:57:26.453660: step: 1236/530, loss: 0.001546103972941637 2023-01-24 07:57:27.473347: step: 1240/530, loss: 0.0011437057983130217 2023-01-24 07:57:28.521926: step: 1244/530, loss: 0.00028179859509691596 2023-01-24 07:57:29.573213: step: 1248/530, loss: 0.008376537822186947 2023-01-24 07:57:30.605399: step: 1252/530, loss: 0.003715341677889228 2023-01-24 07:57:31.628119: step: 1256/530, loss: 0.0007436055457219481 2023-01-24 07:57:32.664908: step: 1260/530, loss: 0.0003102657210547477 2023-01-24 07:57:33.729940: step: 1264/530, loss: 0.004909284878522158 2023-01-24 07:57:34.761831: step: 1268/530, loss: 0.0020371167920529842 2023-01-24 07:57:35.801462: step: 1272/530, loss: 0.0004898647894151509 2023-01-24 07:57:36.845834: step: 1276/530, loss: 0.0015563125489279628 2023-01-24 07:57:37.885999: step: 1280/530, loss: 0.00689957058057189 2023-01-24 07:57:38.946108: step: 1284/530, loss: 0.01408822275698185 2023-01-24 07:57:39.986417: step: 1288/530, loss: 0.0013574474724009633 2023-01-24 07:57:41.035968: step: 1292/530, loss: 0.0009641749784350395 2023-01-24 07:57:42.069185: step: 1296/530, loss: 0.0003385709715075791 2023-01-24 07:57:43.108295: step: 1300/530, loss: 0.0004961580852977931 2023-01-24 07:57:44.133917: step: 1304/530, loss: 0.00020141866116318852 2023-01-24 07:57:45.195909: step: 1308/530, loss: 5.165263428352773e-05 2023-01-24 07:57:46.227367: step: 1312/530, loss: 0.006631826050579548 2023-01-24 07:57:47.264248: step: 1316/530, loss: 0.0006990053225308657 2023-01-24 07:57:48.300459: step: 1320/530, loss: 0.007975384593009949 2023-01-24 07:57:49.340703: step: 1324/530, loss: 0.0028748069889843464 2023-01-24 07:57:50.385990: step: 1328/530, loss: 0.006206345744431019 2023-01-24 07:57:51.428603: step: 1332/530, loss: 0.0004804233321920037 2023-01-24 07:57:52.474131: step: 1336/530, loss: 6.444739847211167e-05 2023-01-24 07:57:53.529111: step: 1340/530, loss: 0.0003802002756856382 2023-01-24 07:57:54.546805: step: 1344/530, loss: 0.0006370485061779618 2023-01-24 07:57:55.596977: step: 1348/530, loss: 0.00022640205861534923 2023-01-24 07:57:56.628589: step: 1352/530, loss: 0.0003381062124390155 2023-01-24 07:57:57.668002: step: 1356/530, loss: 0.004661472514271736 2023-01-24 07:57:58.713574: step: 1360/530, loss: 0.00735260546207428 2023-01-24 07:57:59.755977: step: 1364/530, loss: 0.0018966750940307975 2023-01-24 07:58:00.800725: step: 1368/530, loss: 0.006832683924585581 2023-01-24 07:58:01.844017: step: 1372/530, loss: 0.0013224206632003188 2023-01-24 07:58:02.883246: step: 1376/530, loss: 0.00016277357644867152 2023-01-24 07:58:03.926078: step: 1380/530, loss: 0.0006611610297113657 2023-01-24 07:58:04.979768: step: 1384/530, loss: 0.012600972317159176 2023-01-24 07:58:06.023423: step: 1388/530, loss: 0.0026991211343556643 2023-01-24 07:58:07.061904: step: 1392/530, loss: 0.022808486595749855 2023-01-24 07:58:08.114750: step: 1396/530, loss: 0.004014855716377497 2023-01-24 07:58:09.165694: step: 1400/530, loss: 0.005654542241245508 2023-01-24 07:58:10.202272: step: 1404/530, loss: 0.0016142316162586212 2023-01-24 07:58:11.254496: step: 1408/530, loss: 0.00030001590494066477 2023-01-24 07:58:12.289555: step: 1412/530, loss: 9.525947098154575e-05 2023-01-24 07:58:13.333975: step: 1416/530, loss: 0.0052554854191839695 2023-01-24 07:58:14.378317: step: 1420/530, loss: 0.0031585076358169317 2023-01-24 07:58:15.443392: step: 1424/530, loss: 0.00024226700770668685 2023-01-24 07:58:16.485411: step: 1428/530, loss: 0.0002838248328771442 2023-01-24 07:58:17.551509: step: 1432/530, loss: 0.0018992993282154202 2023-01-24 07:58:18.590454: step: 1436/530, loss: 0.00041687930934131145 2023-01-24 07:58:19.627179: step: 1440/530, loss: 0.0003345505683682859 2023-01-24 07:58:20.664870: step: 1444/530, loss: 0.0004599524545483291 2023-01-24 07:58:21.700445: step: 1448/530, loss: 0.00152059574611485 2023-01-24 07:58:22.747597: step: 1452/530, loss: 0.0010197223164141178 2023-01-24 07:58:23.772335: step: 1456/530, loss: 3.068601927225245e-06 2023-01-24 07:58:24.813864: step: 1460/530, loss: 0.00119457533583045 2023-01-24 07:58:25.848697: step: 1464/530, loss: 0.004676337353885174 2023-01-24 07:58:26.878234: step: 1468/530, loss: 0.0012967294314876199 2023-01-24 07:58:27.919174: step: 1472/530, loss: 0.00697213364765048 2023-01-24 07:58:28.945029: step: 1476/530, loss: 5.374971806304529e-05 2023-01-24 07:58:29.984979: step: 1480/530, loss: 0.0007884575170464814 2023-01-24 07:58:31.033025: step: 1484/530, loss: 0.0026752299163490534 2023-01-24 07:58:32.085594: step: 1488/530, loss: 0.007478209678083658 2023-01-24 07:58:33.140445: step: 1492/530, loss: 0.008206604979932308 2023-01-24 07:58:34.174182: step: 1496/530, loss: 7.746687333565205e-05 2023-01-24 07:58:35.219620: step: 1500/530, loss: 0.0017835705075412989 2023-01-24 07:58:36.259305: step: 1504/530, loss: 0.0011131709907203913 2023-01-24 07:58:37.307929: step: 1508/530, loss: 0.00066353939473629 2023-01-24 07:58:38.353481: step: 1512/530, loss: 0.0008853027247823775 2023-01-24 07:58:39.397709: step: 1516/530, loss: 0.015615081414580345 2023-01-24 07:58:40.443965: step: 1520/530, loss: 0.001807558466680348 2023-01-24 07:58:41.479066: step: 1524/530, loss: 0.0009274403564631939 2023-01-24 07:58:42.538581: step: 1528/530, loss: 0.011650248430669308 2023-01-24 07:58:43.568539: step: 1532/530, loss: 0.0053371889516711235 2023-01-24 07:58:44.614230: step: 1536/530, loss: 0.012244739569723606 2023-01-24 07:58:45.660616: step: 1540/530, loss: 0.022946396842598915 2023-01-24 07:58:46.689579: step: 1544/530, loss: 0.003774950047954917 2023-01-24 07:58:47.747833: step: 1548/530, loss: 0.008275489322841167 2023-01-24 07:58:48.784033: step: 1552/530, loss: 0.006017662584781647 2023-01-24 07:58:49.850415: step: 1556/530, loss: 0.004965306259691715 2023-01-24 07:58:50.885749: step: 1560/530, loss: 0.01910923235118389 2023-01-24 07:58:51.931426: step: 1564/530, loss: 0.0017008964205160737 2023-01-24 07:58:52.980835: step: 1568/530, loss: 0.002094108145684004 2023-01-24 07:58:54.016456: step: 1572/530, loss: 0.013499675318598747 2023-01-24 07:58:55.063581: step: 1576/530, loss: 0.0012263128301128745 2023-01-24 07:58:56.116865: step: 1580/530, loss: 0.004750311840325594 2023-01-24 07:58:57.171483: step: 1584/530, loss: 0.0055891671217978 2023-01-24 07:58:58.212977: step: 1588/530, loss: 0.0003754783538170159 2023-01-24 07:58:59.259451: step: 1592/530, loss: 0.0022290972992777824 2023-01-24 07:59:00.310081: step: 1596/530, loss: 0.004460914526134729 2023-01-24 07:59:01.343955: step: 1600/530, loss: 0.0022637643851339817 2023-01-24 07:59:02.400006: step: 1604/530, loss: 0.004388181492686272 2023-01-24 07:59:03.471899: step: 1608/530, loss: 0.0027250046841800213 2023-01-24 07:59:04.512766: step: 1612/530, loss: 0.00166132056619972 2023-01-24 07:59:05.553682: step: 1616/530, loss: 0.0002281893539475277 2023-01-24 07:59:06.597622: step: 1620/530, loss: 0.0041305809281766415 2023-01-24 07:59:07.629965: step: 1624/530, loss: 0.003262830898165703 2023-01-24 07:59:08.659840: step: 1628/530, loss: 0.0064003304578363895 2023-01-24 07:59:09.704544: step: 1632/530, loss: 0.0025947396643459797 2023-01-24 07:59:10.746659: step: 1636/530, loss: 0.0004289246862754226 2023-01-24 07:59:11.796587: step: 1640/530, loss: 0.0015038494020700455 2023-01-24 07:59:12.839252: step: 1644/530, loss: 0.0022568402346223593 2023-01-24 07:59:13.871469: step: 1648/530, loss: 0.00014186625776346773 2023-01-24 07:59:14.902450: step: 1652/530, loss: 0.0025793511886149645 2023-01-24 07:59:15.940658: step: 1656/530, loss: 0.001760231563821435 2023-01-24 07:59:16.980102: step: 1660/530, loss: 0.005591913126409054 2023-01-24 07:59:18.017513: step: 1664/530, loss: 0.001139389001764357 2023-01-24 07:59:19.060319: step: 1668/530, loss: 0.001222749357111752 2023-01-24 07:59:20.109331: step: 1672/530, loss: 0.003349478356540203 2023-01-24 07:59:21.160824: step: 1676/530, loss: 0.008537529967725277 2023-01-24 07:59:22.201112: step: 1680/530, loss: 0.0171780027449131 2023-01-24 07:59:23.232496: step: 1684/530, loss: 0.0007790369563736022 2023-01-24 07:59:24.263601: step: 1688/530, loss: 0.0025134822353720665 2023-01-24 07:59:25.307833: step: 1692/530, loss: 0.00345806498080492 2023-01-24 07:59:26.337567: step: 1696/530, loss: 0.0006331720505841076 2023-01-24 07:59:27.389307: step: 1700/530, loss: 0.007373058702796698 2023-01-24 07:59:28.434607: step: 1704/530, loss: 0.002492961473762989 2023-01-24 07:59:29.473659: step: 1708/530, loss: 0.0017996786627918482 2023-01-24 07:59:30.501346: step: 1712/530, loss: 0.006417486350983381 2023-01-24 07:59:31.525405: step: 1716/530, loss: 0.006842451170086861 2023-01-24 07:59:32.559392: step: 1720/530, loss: 0.004541672766208649 2023-01-24 07:59:33.621464: step: 1724/530, loss: 9.892897651297972e-05 2023-01-24 07:59:34.656843: step: 1728/530, loss: 0.004635293036699295 2023-01-24 07:59:35.705446: step: 1732/530, loss: 0.00627547362819314 2023-01-24 07:59:36.736762: step: 1736/530, loss: 0.0007424906943924725 2023-01-24 07:59:37.773956: step: 1740/530, loss: 0.0013969799038022757 2023-01-24 07:59:38.822015: step: 1744/530, loss: 0.0008021194371394813 2023-01-24 07:59:39.856711: step: 1748/530, loss: 5.0191716582048684e-05 2023-01-24 07:59:40.896181: step: 1752/530, loss: 0.00019830631208606064 2023-01-24 07:59:41.937337: step: 1756/530, loss: 0.0036961957812309265 2023-01-24 07:59:42.979165: step: 1760/530, loss: 0.0029901741072535515 2023-01-24 07:59:43.996448: step: 1764/530, loss: 0.0009864509338513017 2023-01-24 07:59:45.034423: step: 1768/530, loss: 0.014718879945576191 2023-01-24 07:59:46.093678: step: 1772/530, loss: 0.0014967393362894654 2023-01-24 07:59:47.129494: step: 1776/530, loss: 4.8162855819100514e-05 2023-01-24 07:59:48.161440: step: 1780/530, loss: 0.0028091403655707836 2023-01-24 07:59:49.221768: step: 1784/530, loss: 0.0034796022810041904 2023-01-24 07:59:50.284505: step: 1788/530, loss: 0.0015455796383321285 2023-01-24 07:59:51.318418: step: 1792/530, loss: 0.0013961036456748843 2023-01-24 07:59:52.360383: step: 1796/530, loss: 2.421425620013906e-07 2023-01-24 07:59:53.411507: step: 1800/530, loss: 0.004253959283232689 2023-01-24 07:59:54.462167: step: 1804/530, loss: 0.030879884958267212 2023-01-24 07:59:55.502693: step: 1808/530, loss: 0.0007402389892376959 2023-01-24 07:59:56.548460: step: 1812/530, loss: 0.005029305815696716 2023-01-24 07:59:57.606372: step: 1816/530, loss: 0.003805961227044463 2023-01-24 07:59:58.641184: step: 1820/530, loss: 0.0009683383977971971 2023-01-24 07:59:59.682298: step: 1824/530, loss: 0.00042147599742747843 2023-01-24 08:00:00.733586: step: 1828/530, loss: 0.005095311440527439 2023-01-24 08:00:01.790175: step: 1832/530, loss: 0.0033117649145424366 2023-01-24 08:00:02.839164: step: 1836/530, loss: 0.0026411789003759623 2023-01-24 08:00:03.884007: step: 1840/530, loss: 0.0006687751156277955 2023-01-24 08:00:04.939055: step: 1844/530, loss: 0.004634995013475418 2023-01-24 08:00:05.983372: step: 1848/530, loss: 0.005392204038798809 2023-01-24 08:00:07.035895: step: 1852/530, loss: 0.0026288365479558706 2023-01-24 08:00:08.082134: step: 1856/530, loss: 0.00632264232262969 2023-01-24 08:00:09.130730: step: 1860/530, loss: 0.0009048838983289897 2023-01-24 08:00:10.176344: step: 1864/530, loss: 0.0012034325627610087 2023-01-24 08:00:11.219157: step: 1868/530, loss: 0.003303315956145525 2023-01-24 08:00:12.251701: step: 1872/530, loss: 0.00016991447773762047 2023-01-24 08:00:13.281867: step: 1876/530, loss: 0.0015578686725348234 2023-01-24 08:00:14.313691: step: 1880/530, loss: 0.0011157433036714792 2023-01-24 08:00:15.358234: step: 1884/530, loss: 0.00041672654333524406 2023-01-24 08:00:16.388537: step: 1888/530, loss: 0.0023167794570326805 2023-01-24 08:00:17.433851: step: 1892/530, loss: 0.002052611205726862 2023-01-24 08:00:18.478063: step: 1896/530, loss: 0.0033763970714062452 2023-01-24 08:00:19.513538: step: 1900/530, loss: 0.00025242497213184834 2023-01-24 08:00:20.569386: step: 1904/530, loss: 0.009918239898979664 2023-01-24 08:00:21.616575: step: 1908/530, loss: 0.0038157969247549772 2023-01-24 08:00:22.650220: step: 1912/530, loss: 7.49468085814442e-07 2023-01-24 08:00:23.722544: step: 1916/530, loss: 0.004472915083169937 2023-01-24 08:00:24.770407: step: 1920/530, loss: 0.0039259870536625385 2023-01-24 08:00:25.822280: step: 1924/530, loss: 0.001096860971301794 2023-01-24 08:00:26.870817: step: 1928/530, loss: 0.0014287614030763507 2023-01-24 08:00:27.908421: step: 1932/530, loss: 0.01082514226436615 2023-01-24 08:00:28.947858: step: 1936/530, loss: 0.0008983967709355056 2023-01-24 08:00:29.984401: step: 1940/530, loss: 0.0008533830987289548 2023-01-24 08:00:31.025001: step: 1944/530, loss: 0.006071763578802347 2023-01-24 08:00:32.084619: step: 1948/530, loss: 0.0013380680466070771 2023-01-24 08:00:33.159491: step: 1952/530, loss: 0.002897057216614485 2023-01-24 08:00:34.194864: step: 1956/530, loss: 7.528057903982699e-05 2023-01-24 08:00:35.230051: step: 1960/530, loss: 0.0166124626994133 2023-01-24 08:00:36.268366: step: 1964/530, loss: 0.00010313720122212544 2023-01-24 08:00:37.302329: step: 1968/530, loss: 0.005741137079894543 2023-01-24 08:00:38.337094: step: 1972/530, loss: 0.004160319920629263 2023-01-24 08:00:39.377806: step: 1976/530, loss: 0.0030549473594874144 2023-01-24 08:00:40.430910: step: 1980/530, loss: 0.009821810759603977 2023-01-24 08:00:41.491034: step: 1984/530, loss: 0.005508612375706434 2023-01-24 08:00:42.539981: step: 1988/530, loss: 0.0002229307865491137 2023-01-24 08:00:43.584775: step: 1992/530, loss: 0.0031040431931614876 2023-01-24 08:00:44.622328: step: 1996/530, loss: 0.007389459293335676 2023-01-24 08:00:45.669592: step: 2000/530, loss: 0.0053385659120976925 2023-01-24 08:00:46.729140: step: 2004/530, loss: 0.016554879024624825 2023-01-24 08:00:47.767757: step: 2008/530, loss: 0.0011714758584275842 2023-01-24 08:00:48.796849: step: 2012/530, loss: 0.0011744378134608269 2023-01-24 08:00:49.854224: step: 2016/530, loss: 0.00011427033314248547 2023-01-24 08:00:50.908577: step: 2020/530, loss: 0.0008475541253574193 2023-01-24 08:00:51.959246: step: 2024/530, loss: 2.2833064576843753e-05 2023-01-24 08:00:52.986135: step: 2028/530, loss: 5.888010127819143e-05 2023-01-24 08:00:54.029356: step: 2032/530, loss: 0.0005154501413926482 2023-01-24 08:00:55.077176: step: 2036/530, loss: 0.00427416292950511 2023-01-24 08:00:56.115325: step: 2040/530, loss: 6.227390986168757e-05 2023-01-24 08:00:57.160877: step: 2044/530, loss: 0.0053716301918029785 2023-01-24 08:00:58.197895: step: 2048/530, loss: 0.0017645315965637565 2023-01-24 08:00:59.227599: step: 2052/530, loss: 0.004234227351844311 2023-01-24 08:01:00.260727: step: 2056/530, loss: 0.00022972305305302143 2023-01-24 08:01:01.286368: step: 2060/530, loss: 0.0005670490209013224 2023-01-24 08:01:02.322137: step: 2064/530, loss: 4.39680752606364e-06 2023-01-24 08:01:03.395133: step: 2068/530, loss: 0.0014795800670981407 2023-01-24 08:01:04.438722: step: 2072/530, loss: 3.195781755493954e-05 2023-01-24 08:01:05.466505: step: 2076/530, loss: 0.00021024089073762298 2023-01-24 08:01:06.502154: step: 2080/530, loss: 0.0034581993240863085 2023-01-24 08:01:07.548508: step: 2084/530, loss: 0.0009797518141567707 2023-01-24 08:01:08.574689: step: 2088/530, loss: 0.00436271820217371 2023-01-24 08:01:09.619554: step: 2092/530, loss: 0.0048765395767986774 2023-01-24 08:01:10.662926: step: 2096/530, loss: 2.4802049665595405e-05 2023-01-24 08:01:11.701329: step: 2100/530, loss: 0.0007195995422080159 2023-01-24 08:01:12.744180: step: 2104/530, loss: 0.0010806828504428267 2023-01-24 08:01:13.792730: step: 2108/530, loss: 0.024447450414299965 2023-01-24 08:01:14.826573: step: 2112/530, loss: 0.005292092449963093 2023-01-24 08:01:15.889968: step: 2116/530, loss: 0.003660043003037572 2023-01-24 08:01:16.932592: step: 2120/530, loss: 0.0012359905522316694 ================================================== Loss: 0.004 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3781810538116592, 'r': 0.32005455407969635, 'f1': 0.34669835560123324}, 'combined': 0.25546194623248764, 'stategy': 1, 'epoch': 15} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.375326390093726, 'r': 0.3898150926524911, 'f1': 0.382433562494058}, 'combined': 0.2964317565743416, 'stategy': 1, 'epoch': 15} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3899899678972713, 'r': 0.32930841691515317, 'f1': 0.35708957965902416}, 'combined': 0.26311863764349147, 'stategy': 1, 'epoch': 15} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3731503814117339, 'r': 0.3686917831044246, 'f1': 0.3709076837888247}, 'combined': 0.2874978218841608, 'stategy': 1, 'epoch': 15} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3851604396498889, 'r': 0.33473146368054857, 'f1': 0.3581796575830439}, 'combined': 0.26392185295592707, 'stategy': 1, 'epoch': 15} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3640887768447368, 'r': 0.3620809343253724, 'f1': 0.3630820797659034}, 'combined': 0.28143204268936056, 'stategy': 1, 'epoch': 15} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 15} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5, 'r': 0.41304347826086957, 'f1': 0.45238095238095233}, 'combined': 0.22619047619047616, 'stategy': 1, 'epoch': 15} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 15} New best russian model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37786862527716186, 'r': 0.32337523719165084, 'f1': 0.3485046012269939}, 'combined': 0.2567928640619955, 'stategy': 1, 'epoch': 12} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37377987703702326, 'r': 0.38889597500543227, 'f1': 0.3811881268521715}, 'combined': 0.2954663949763244, 'stategy': 1, 'epoch': 12} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 12} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3851604396498889, 'r': 0.33473146368054857, 'f1': 0.3581796575830439}, 'combined': 0.26392185295592707, 'stategy': 1, 'epoch': 15} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3640887768447368, 'r': 0.3620809343253724, 'f1': 0.3630820797659034}, 'combined': 0.28143204268936056, 'stategy': 1, 'epoch': 15} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 15} ****************************** Epoch: 16 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 08:03:48.912055: step: 4/530, loss: 9.7860254754778e-05 2023-01-24 08:03:49.964465: step: 8/530, loss: 0.00016962077643256634 2023-01-24 08:03:51.010700: step: 12/530, loss: 0.00167995342053473 2023-01-24 08:03:52.041530: step: 16/530, loss: 0.0009895809926092625 2023-01-24 08:03:53.074076: step: 20/530, loss: 0.0008334103040397167 2023-01-24 08:03:54.120938: step: 24/530, loss: 0.0017199110006913543 2023-01-24 08:03:55.159042: step: 28/530, loss: 0.0062159881927073 2023-01-24 08:03:56.239103: step: 32/530, loss: 0.06644850969314575 2023-01-24 08:03:57.273012: step: 36/530, loss: 0.0005407019634731114 2023-01-24 08:03:58.293488: step: 40/530, loss: 0.0012492379173636436 2023-01-24 08:03:59.322730: step: 44/530, loss: 0.0001143816189141944 2023-01-24 08:04:00.366365: step: 48/530, loss: 0.002293126657605171 2023-01-24 08:04:01.400417: step: 52/530, loss: 0.001609840546734631 2023-01-24 08:04:02.436297: step: 56/530, loss: 0.002481231465935707 2023-01-24 08:04:03.480369: step: 60/530, loss: 0.004079022910445929 2023-01-24 08:04:04.508405: step: 64/530, loss: 0.0015545889036729932 2023-01-24 08:04:05.563856: step: 68/530, loss: 0.0013371296226978302 2023-01-24 08:04:06.599491: step: 72/530, loss: 0.0033272304572165012 2023-01-24 08:04:07.654057: step: 76/530, loss: 0.00012407192843966186 2023-01-24 08:04:08.708202: step: 80/530, loss: 0.001283716526813805 2023-01-24 08:04:09.747555: step: 84/530, loss: 0.00013375292473938316 2023-01-24 08:04:10.803513: step: 88/530, loss: 0.012221149168908596 2023-01-24 08:04:11.857757: step: 92/530, loss: 3.227633351343684e-05 2023-01-24 08:04:12.908798: step: 96/530, loss: 0.0001579405361553654 2023-01-24 08:04:13.955444: step: 100/530, loss: 0.00021769414888694882 2023-01-24 08:04:15.027153: step: 104/530, loss: 0.01837671548128128 2023-01-24 08:04:16.064928: step: 108/530, loss: 0.0011274643475189805 2023-01-24 08:04:17.116080: step: 112/530, loss: 0.005027633160352707 2023-01-24 08:04:18.156322: step: 116/530, loss: 0.008041074499487877 2023-01-24 08:04:19.206053: step: 120/530, loss: 0.0029558383394032717 2023-01-24 08:04:20.245022: step: 124/530, loss: 9.197644249070436e-05 2023-01-24 08:04:21.295313: step: 128/530, loss: 0.000355173455318436 2023-01-24 08:04:22.340525: step: 132/530, loss: 0.011277411133050919 2023-01-24 08:04:23.392684: step: 136/530, loss: 0.005733049940317869 2023-01-24 08:04:24.419787: step: 140/530, loss: 0.0035273684188723564 2023-01-24 08:04:25.458645: step: 144/530, loss: 2.521784699638374e-05 2023-01-24 08:04:26.489097: step: 148/530, loss: 0.0005182532477192581 2023-01-24 08:04:27.552482: step: 152/530, loss: 0.002032036427408457 2023-01-24 08:04:28.583515: step: 156/530, loss: 0.005944725591689348 2023-01-24 08:04:29.630259: step: 160/530, loss: 0.003832010319456458 2023-01-24 08:04:30.672069: step: 164/530, loss: 0.0005498633836396039 2023-01-24 08:04:31.711478: step: 168/530, loss: 0.0001618832175154239 2023-01-24 08:04:32.757598: step: 172/530, loss: 0.004295145161449909 2023-01-24 08:04:33.790092: step: 176/530, loss: 0.02098417654633522 2023-01-24 08:04:34.822476: step: 180/530, loss: 0.00642936397343874 2023-01-24 08:04:35.872658: step: 184/530, loss: 0.002964233048260212 2023-01-24 08:04:36.919704: step: 188/530, loss: 0.01809658482670784 2023-01-24 08:04:37.960027: step: 192/530, loss: 0.024744180962443352 2023-01-24 08:04:39.000762: step: 196/530, loss: 0.003283710451796651 2023-01-24 08:04:40.034421: step: 200/530, loss: 0.004359710030257702 2023-01-24 08:04:41.088657: step: 204/530, loss: 0.002236847300082445 2023-01-24 08:04:42.124562: step: 208/530, loss: 0.0014879833906888962 2023-01-24 08:04:43.183355: step: 212/530, loss: 0.018451759591698647 2023-01-24 08:04:44.241852: step: 216/530, loss: 0.00911922100931406 2023-01-24 08:04:45.278488: step: 220/530, loss: 0.001353578525595367 2023-01-24 08:04:46.320868: step: 224/530, loss: 0.003076187102124095 2023-01-24 08:04:47.356691: step: 228/530, loss: 0.0009704912081360817 2023-01-24 08:04:48.385929: step: 232/530, loss: 0.01017417386174202 2023-01-24 08:04:49.419781: step: 236/530, loss: 0.0063122049905359745 2023-01-24 08:04:50.473391: step: 240/530, loss: 0.011784515343606472 2023-01-24 08:04:51.513416: step: 244/530, loss: 0.0014640557346865535 2023-01-24 08:04:52.550618: step: 248/530, loss: 0.00040300979162566364 2023-01-24 08:04:53.609443: step: 252/530, loss: 0.001958419568836689 2023-01-24 08:04:54.668309: step: 256/530, loss: 0.005494561977684498 2023-01-24 08:04:55.728772: step: 260/530, loss: 0.006518794223666191 2023-01-24 08:04:56.782634: step: 264/530, loss: 0.005981508642435074 2023-01-24 08:04:57.819745: step: 268/530, loss: 0.03490021079778671 2023-01-24 08:04:58.852154: step: 272/530, loss: 0.00037004746263846755 2023-01-24 08:04:59.900352: step: 276/530, loss: 0.0023455112241208553 2023-01-24 08:05:00.930028: step: 280/530, loss: 8.950916708272416e-06 2023-01-24 08:05:01.973087: step: 284/530, loss: 7.448644464602694e-05 2023-01-24 08:05:03.026955: step: 288/530, loss: 0.0005203859182074666 2023-01-24 08:05:04.058078: step: 292/530, loss: 0.002128622494637966 2023-01-24 08:05:05.110932: step: 296/530, loss: 0.00027579310699366033 2023-01-24 08:05:06.156630: step: 300/530, loss: 1.741411142575089e-05 2023-01-24 08:05:07.212312: step: 304/530, loss: 0.002726037288084626 2023-01-24 08:05:08.258596: step: 308/530, loss: 0.00011106010060757399 2023-01-24 08:05:09.297099: step: 312/530, loss: 0.0 2023-01-24 08:05:10.348329: step: 316/530, loss: 0.00028838327853009105 2023-01-24 08:05:11.390317: step: 320/530, loss: 0.004911091644316912 2023-01-24 08:05:12.442925: step: 324/530, loss: 0.0007996641797944903 2023-01-24 08:05:13.476973: step: 328/530, loss: 0.0012720789527520537 2023-01-24 08:05:14.536416: step: 332/530, loss: 0.008266856893897057 2023-01-24 08:05:15.587123: step: 336/530, loss: 0.00314516993239522 2023-01-24 08:05:16.620966: step: 340/530, loss: 9.839962876867503e-05 2023-01-24 08:05:17.671274: step: 344/530, loss: 0.001324623473919928 2023-01-24 08:05:18.724013: step: 348/530, loss: 0.0008112098439596593 2023-01-24 08:05:19.756072: step: 352/530, loss: 0.00011970206833211705 2023-01-24 08:05:20.811559: step: 356/530, loss: 0.007163750473409891 2023-01-24 08:05:21.874885: step: 360/530, loss: 0.0012658820487558842 2023-01-24 08:05:22.896062: step: 364/530, loss: 0.0008192802779376507 2023-01-24 08:05:23.951618: step: 368/530, loss: 0.001917996327392757 2023-01-24 08:05:24.988088: step: 372/530, loss: 0.0002513567160349339 2023-01-24 08:05:26.034057: step: 376/530, loss: 0.004647490102797747 2023-01-24 08:05:27.072502: step: 380/530, loss: 0.00022904870274942368 2023-01-24 08:05:28.129623: step: 384/530, loss: 0.0024287542328238487 2023-01-24 08:05:29.181897: step: 388/530, loss: 0.005864972248673439 2023-01-24 08:05:30.232971: step: 392/530, loss: 0.002683364087715745 2023-01-24 08:05:31.274885: step: 396/530, loss: 0.0025851340033113956 2023-01-24 08:05:32.322661: step: 400/530, loss: 0.0019618652295321226 2023-01-24 08:05:33.371937: step: 404/530, loss: 0.00022624812845606357 2023-01-24 08:05:34.425032: step: 408/530, loss: 0.018268143758177757 2023-01-24 08:05:35.486196: step: 412/530, loss: 0.02802874520421028 2023-01-24 08:05:36.536712: step: 416/530, loss: 0.001407139003276825 2023-01-24 08:05:37.585231: step: 420/530, loss: 0.0010604221606627107 2023-01-24 08:05:38.639135: step: 424/530, loss: 0.02815191261470318 2023-01-24 08:05:39.678663: step: 428/530, loss: 0.004729295149445534 2023-01-24 08:05:40.708829: step: 432/530, loss: 1.0240033816444338e-06 2023-01-24 08:05:41.773211: step: 436/530, loss: 0.0020996921230107546 2023-01-24 08:05:42.820941: step: 440/530, loss: 0.005118421744555235 2023-01-24 08:05:43.859204: step: 444/530, loss: 0.008954851888120174 2023-01-24 08:05:44.901059: step: 448/530, loss: 0.0010439646430313587 2023-01-24 08:05:45.951827: step: 452/530, loss: 0.0184810608625412 2023-01-24 08:05:47.005621: step: 456/530, loss: 2.006214708671905e-05 2023-01-24 08:05:48.083324: step: 460/530, loss: 0.00010704037413233891 2023-01-24 08:05:49.121566: step: 464/530, loss: 0.005566218867897987 2023-01-24 08:05:50.181975: step: 468/530, loss: 0.004844698589295149 2023-01-24 08:05:51.217540: step: 472/530, loss: 2.3661985323997214e-05 2023-01-24 08:05:52.262566: step: 476/530, loss: 0.0012873137602582574 2023-01-24 08:05:53.304120: step: 480/530, loss: 0.008623218163847923 2023-01-24 08:05:54.332676: step: 484/530, loss: 0.0004824193601962179 2023-01-24 08:05:55.398688: step: 488/530, loss: 0.0022862600162625313 2023-01-24 08:05:56.432624: step: 492/530, loss: 0.0007822245243005455 2023-01-24 08:05:57.477424: step: 496/530, loss: 0.00011395986803108826 2023-01-24 08:05:58.519159: step: 500/530, loss: 0.00114940176717937 2023-01-24 08:05:59.563615: step: 504/530, loss: 0.0010633916826918721 2023-01-24 08:06:00.621610: step: 508/530, loss: 0.0013889521360397339 2023-01-24 08:06:01.672630: step: 512/530, loss: 0.0019547503907233477 2023-01-24 08:06:02.701561: step: 516/530, loss: 0.0003079283342231065 2023-01-24 08:06:03.745854: step: 520/530, loss: 0.002159843221306801 2023-01-24 08:06:04.791269: step: 524/530, loss: 0.0017030095914378762 2023-01-24 08:06:05.831122: step: 528/530, loss: 0.000291235774056986 2023-01-24 08:06:06.893325: step: 532/530, loss: 0.006097185425460339 2023-01-24 08:06:07.933023: step: 536/530, loss: 0.00015077170974109322 2023-01-24 08:06:08.978907: step: 540/530, loss: 0.0030064077582210302 2023-01-24 08:06:10.025427: step: 544/530, loss: 2.7563430194277316e-05 2023-01-24 08:06:11.066355: step: 548/530, loss: 6.067095000616973e-06 2023-01-24 08:06:12.110964: step: 552/530, loss: 0.007843291386961937 2023-01-24 08:06:13.148033: step: 556/530, loss: 0.00046633571037091315 2023-01-24 08:06:14.201878: step: 560/530, loss: 0.0091286301612854 2023-01-24 08:06:15.250909: step: 564/530, loss: 8.991173672256991e-05 2023-01-24 08:06:16.310815: step: 568/530, loss: 0.0002499464899301529 2023-01-24 08:06:17.353121: step: 572/530, loss: 0.00023953722848091274 2023-01-24 08:06:18.422357: step: 576/530, loss: 0.0010355343110859394 2023-01-24 08:06:19.453409: step: 580/530, loss: 0.013736139982938766 2023-01-24 08:06:20.494606: step: 584/530, loss: 0.006795480847358704 2023-01-24 08:06:21.521576: step: 588/530, loss: 0.0009801766136661172 2023-01-24 08:06:22.562347: step: 592/530, loss: 9.711627171782311e-06 2023-01-24 08:06:23.612265: step: 596/530, loss: 0.006025176029652357 2023-01-24 08:06:24.661283: step: 600/530, loss: 0.0006345068686641753 2023-01-24 08:06:25.690959: step: 604/530, loss: 0.00010796607239171863 2023-01-24 08:06:26.731550: step: 608/530, loss: 0.022064659744501114 2023-01-24 08:06:27.765882: step: 612/530, loss: 0.0009917536517605186 2023-01-24 08:06:28.811091: step: 616/530, loss: 0.0003969916724599898 2023-01-24 08:06:29.860938: step: 620/530, loss: 0.0009577947203069925 2023-01-24 08:06:30.892499: step: 624/530, loss: 0.004058992490172386 2023-01-24 08:06:31.927463: step: 628/530, loss: 0.009625842794775963 2023-01-24 08:06:32.988268: step: 632/530, loss: 0.014803934842348099 2023-01-24 08:06:34.027610: step: 636/530, loss: 0.00020036633941344917 2023-01-24 08:06:35.086957: step: 640/530, loss: 0.006165073253214359 2023-01-24 08:06:36.138309: step: 644/530, loss: 0.00221126526594162 2023-01-24 08:06:37.200953: step: 648/530, loss: 0.003091533202677965 2023-01-24 08:06:38.237144: step: 652/530, loss: 0.001056141685694456 2023-01-24 08:06:39.292468: step: 656/530, loss: 0.0006401028367690742 2023-01-24 08:06:40.346058: step: 660/530, loss: 0.005448830779641867 2023-01-24 08:06:41.402481: step: 664/530, loss: 0.0006278028595261276 2023-01-24 08:06:42.451055: step: 668/530, loss: 0.0010182765545323491 2023-01-24 08:06:43.497891: step: 672/530, loss: 0.011164749041199684 2023-01-24 08:06:44.553167: step: 676/530, loss: 0.0022408654913306236 2023-01-24 08:06:45.598501: step: 680/530, loss: 0.003817001124843955 2023-01-24 08:06:46.647413: step: 684/530, loss: 0.0014193993993103504 2023-01-24 08:06:47.681775: step: 688/530, loss: 0.00926503911614418 2023-01-24 08:06:48.724790: step: 692/530, loss: 0.003855099668726325 2023-01-24 08:06:49.769458: step: 696/530, loss: 9.615978342480958e-05 2023-01-24 08:06:50.808930: step: 700/530, loss: 0.00165564042981714 2023-01-24 08:06:51.840247: step: 704/530, loss: 0.00013659309479407966 2023-01-24 08:06:52.888850: step: 708/530, loss: 0.0037068959791213274 2023-01-24 08:06:53.931247: step: 712/530, loss: 0.000563675130251795 2023-01-24 08:06:54.964325: step: 716/530, loss: 0.0005859659286215901 2023-01-24 08:06:55.988907: step: 720/530, loss: 0.001557123614475131 2023-01-24 08:06:57.039592: step: 724/530, loss: 0.002455672947689891 2023-01-24 08:06:58.090951: step: 728/530, loss: 0.0017205079784616828 2023-01-24 08:06:59.142105: step: 732/530, loss: 0.0038072119932621717 2023-01-24 08:07:00.178726: step: 736/530, loss: 0.00026613465161062777 2023-01-24 08:07:01.209954: step: 740/530, loss: 1.336878995061852e-06 2023-01-24 08:07:02.247401: step: 744/530, loss: 0.0024368404410779476 2023-01-24 08:07:03.288830: step: 748/530, loss: 0.0022249529138207436 2023-01-24 08:07:04.339775: step: 752/530, loss: 0.002513074316084385 2023-01-24 08:07:05.361742: step: 756/530, loss: 0.002031650161370635 2023-01-24 08:07:06.407374: step: 760/530, loss: 0.026250595226883888 2023-01-24 08:07:07.442975: step: 764/530, loss: 0.0004051537252962589 2023-01-24 08:07:08.471167: step: 768/530, loss: 0.002396330703049898 2023-01-24 08:07:09.511195: step: 772/530, loss: 0.0019366589840501547 2023-01-24 08:07:10.552103: step: 776/530, loss: 6.119882982602576e-06 2023-01-24 08:07:11.585364: step: 780/530, loss: 6.379462865879759e-05 2023-01-24 08:07:12.632968: step: 784/530, loss: 0.002453408669680357 2023-01-24 08:07:13.663311: step: 788/530, loss: 0.0001453535951441154 2023-01-24 08:07:14.701249: step: 792/530, loss: 0.00013945973478257656 2023-01-24 08:07:15.734248: step: 796/530, loss: 0.0009795083897188306 2023-01-24 08:07:16.770381: step: 800/530, loss: 0.00011313698632875457 2023-01-24 08:07:17.818920: step: 804/530, loss: 0.00013916977331973612 2023-01-24 08:07:18.855206: step: 808/530, loss: 0.009145022369921207 2023-01-24 08:07:19.892299: step: 812/530, loss: 0.0067528486251831055 2023-01-24 08:07:20.945330: step: 816/530, loss: 3.819125777226873e-05 2023-01-24 08:07:21.975437: step: 820/530, loss: 0.0013857746962457895 2023-01-24 08:07:23.018610: step: 824/530, loss: 1.6716780010028742e-05 2023-01-24 08:07:24.058627: step: 828/530, loss: 7.969896250870079e-05 2023-01-24 08:07:25.103331: step: 832/530, loss: 0.00014966473099775612 2023-01-24 08:07:26.146226: step: 836/530, loss: 0.007192178629338741 2023-01-24 08:07:27.184395: step: 840/530, loss: 0.0028905433136969805 2023-01-24 08:07:28.232682: step: 844/530, loss: 0.0038011521100997925 2023-01-24 08:07:29.281312: step: 848/530, loss: 0.0009843989973887801 2023-01-24 08:07:30.328329: step: 852/530, loss: 0.0031939283944666386 2023-01-24 08:07:31.363514: step: 856/530, loss: 0.0076463669538497925 2023-01-24 08:07:32.416531: step: 860/530, loss: 0.023729044944047928 2023-01-24 08:07:33.473394: step: 864/530, loss: 0.0021684535313397646 2023-01-24 08:07:34.522655: step: 868/530, loss: 9.369548934046179e-05 2023-01-24 08:07:35.561384: step: 872/530, loss: 0.0015189633704721928 2023-01-24 08:07:36.610807: step: 876/530, loss: 0.008067240007221699 2023-01-24 08:07:37.672502: step: 880/530, loss: 0.0008739823824726045 2023-01-24 08:07:38.713610: step: 884/530, loss: 0.0015991192776709795 2023-01-24 08:07:39.759092: step: 888/530, loss: 0.0026988901663571596 2023-01-24 08:07:40.796233: step: 892/530, loss: 0.0003570735570974648 2023-01-24 08:07:41.832323: step: 896/530, loss: 0.0037768923211842775 2023-01-24 08:07:42.861925: step: 900/530, loss: 5.656315988744609e-05 2023-01-24 08:07:43.907882: step: 904/530, loss: 0.0004602005355991423 2023-01-24 08:07:44.948313: step: 908/530, loss: 0.012956167571246624 2023-01-24 08:07:45.979000: step: 912/530, loss: 0.00023429089924320579 2023-01-24 08:07:47.029424: step: 916/530, loss: 0.0005414508050307631 2023-01-24 08:07:48.067204: step: 920/530, loss: 0.003229925176128745 2023-01-24 08:07:49.110983: step: 924/530, loss: 0.00013546341506298631 2023-01-24 08:07:50.155757: step: 928/530, loss: 0.005035614129155874 2023-01-24 08:07:51.204224: step: 932/530, loss: 7.074460154399276e-05 2023-01-24 08:07:52.245026: step: 936/530, loss: 0.003970619756728411 2023-01-24 08:07:53.279453: step: 940/530, loss: 0.007547573186457157 2023-01-24 08:07:54.313016: step: 944/530, loss: 0.001952392398379743 2023-01-24 08:07:55.362582: step: 948/530, loss: 0.0017291156109422445 2023-01-24 08:07:56.407120: step: 952/530, loss: 1.3814047861160361e-06 2023-01-24 08:07:57.451982: step: 956/530, loss: 0.003911504987627268 2023-01-24 08:07:58.491379: step: 960/530, loss: 0.0007108685094863176 2023-01-24 08:07:59.530133: step: 964/530, loss: 0.002414074493572116 2023-01-24 08:08:00.564823: step: 968/530, loss: 0.005062845069915056 2023-01-24 08:08:01.629904: step: 972/530, loss: 0.00020350265549495816 2023-01-24 08:08:02.663764: step: 976/530, loss: 9.916456292557996e-06 2023-01-24 08:08:03.732400: step: 980/530, loss: 0.0009219230269081891 2023-01-24 08:08:04.781123: step: 984/530, loss: 0.0006482011522166431 2023-01-24 08:08:05.835317: step: 988/530, loss: 0.0004915453610010445 2023-01-24 08:08:06.884949: step: 992/530, loss: 0.00047927928972058 2023-01-24 08:08:07.925540: step: 996/530, loss: 0.001487908884882927 2023-01-24 08:08:08.972172: step: 1000/530, loss: 7.026194361969829e-05 2023-01-24 08:08:10.006543: step: 1004/530, loss: 3.7042158510303125e-05 2023-01-24 08:08:11.055165: step: 1008/530, loss: 0.0017732521519064903 2023-01-24 08:08:12.096281: step: 1012/530, loss: 0.0003932069812435657 2023-01-24 08:08:13.141106: step: 1016/530, loss: 0.00988938007503748 2023-01-24 08:08:14.185528: step: 1020/530, loss: 0.008849609643220901 2023-01-24 08:08:15.209563: step: 1024/530, loss: 9.164132279693149e-06 2023-01-24 08:08:16.246157: step: 1028/530, loss: 0.0019211875041946769 2023-01-24 08:08:17.296641: step: 1032/530, loss: 0.0007777855498716235 2023-01-24 08:08:18.325721: step: 1036/530, loss: 0.0002675313444342464 2023-01-24 08:08:19.394418: step: 1040/530, loss: 0.0037446871865540743 2023-01-24 08:08:20.444483: step: 1044/530, loss: 0.0003587371320463717 2023-01-24 08:08:21.470888: step: 1048/530, loss: 0.00118012516759336 2023-01-24 08:08:22.500407: step: 1052/530, loss: 0.0009117811569012702 2023-01-24 08:08:23.540158: step: 1056/530, loss: 0.010774577967822552 2023-01-24 08:08:24.582431: step: 1060/530, loss: 0.0003953362465836108 2023-01-24 08:08:25.615580: step: 1064/530, loss: 0.003877539886161685 2023-01-24 08:08:26.654505: step: 1068/530, loss: 2.943889921880327e-05 2023-01-24 08:08:27.702738: step: 1072/530, loss: 4.294289828976616e-05 2023-01-24 08:08:28.747174: step: 1076/530, loss: 0.00620786240324378 2023-01-24 08:08:29.780189: step: 1080/530, loss: 0.001447570277377963 2023-01-24 08:08:30.816409: step: 1084/530, loss: 0.0009011015063151717 2023-01-24 08:08:31.872311: step: 1088/530, loss: 1.031836859510804e-06 2023-01-24 08:08:32.937307: step: 1092/530, loss: 0.0024762984830886126 2023-01-24 08:08:33.969686: step: 1096/530, loss: 0.0009796727681532502 2023-01-24 08:08:35.020696: step: 1100/530, loss: 0.005562683567404747 2023-01-24 08:08:36.057328: step: 1104/530, loss: 9.833775402512401e-05 2023-01-24 08:08:37.088173: step: 1108/530, loss: 0.0005841218517161906 2023-01-24 08:08:38.131773: step: 1112/530, loss: 0.00743784848600626 2023-01-24 08:08:39.195917: step: 1116/530, loss: 0.026636315509676933 2023-01-24 08:08:40.230089: step: 1120/530, loss: 0.0007572905742563307 2023-01-24 08:08:41.286111: step: 1124/530, loss: 0.0006607124814763665 2023-01-24 08:08:42.322919: step: 1128/530, loss: 0.004514450207352638 2023-01-24 08:08:43.365205: step: 1132/530, loss: 0.0021646092645823956 2023-01-24 08:08:44.396044: step: 1136/530, loss: 0.0009013505768962204 2023-01-24 08:08:45.440241: step: 1140/530, loss: 0.002261790679767728 2023-01-24 08:08:46.476637: step: 1144/530, loss: 0.009272295981645584 2023-01-24 08:08:47.507069: step: 1148/530, loss: 0.001525578205473721 2023-01-24 08:08:48.542826: step: 1152/530, loss: 0.0025265717413276434 2023-01-24 08:08:49.598177: step: 1156/530, loss: 0.00033221999183297157 2023-01-24 08:08:50.631145: step: 1160/530, loss: 3.576509334379807e-05 2023-01-24 08:08:51.677514: step: 1164/530, loss: 0.0006343633285723627 2023-01-24 08:08:52.720600: step: 1168/530, loss: 0.010584630072116852 2023-01-24 08:08:53.758369: step: 1172/530, loss: 0.00030360708478838205 2023-01-24 08:08:54.809874: step: 1176/530, loss: 1.3866609833712573e-06 2023-01-24 08:08:55.838088: step: 1180/530, loss: 0.0016013794811442494 2023-01-24 08:08:56.872538: step: 1184/530, loss: 0.0001446597307221964 2023-01-24 08:08:57.920937: step: 1188/530, loss: 0.0014444533735513687 2023-01-24 08:08:58.952485: step: 1192/530, loss: 0.0006003277376294136 2023-01-24 08:08:59.993378: step: 1196/530, loss: 0.0015239645726978779 2023-01-24 08:09:01.037475: step: 1200/530, loss: 0.006915600039064884 2023-01-24 08:09:02.089616: step: 1204/530, loss: 0.0016340535366907716 2023-01-24 08:09:03.152979: step: 1208/530, loss: 0.005759651307016611 2023-01-24 08:09:04.200087: step: 1212/530, loss: 0.00025268254103139043 2023-01-24 08:09:05.252625: step: 1216/530, loss: 0.004989036358892918 2023-01-24 08:09:06.316544: step: 1220/530, loss: 0.004300558008253574 2023-01-24 08:09:07.361019: step: 1224/530, loss: 0.0009450926445424557 2023-01-24 08:09:08.436424: step: 1228/530, loss: 0.0010944271925836802 2023-01-24 08:09:09.489216: step: 1232/530, loss: 0.002427093219012022 2023-01-24 08:09:10.528504: step: 1236/530, loss: 0.000895948673132807 2023-01-24 08:09:11.567538: step: 1240/530, loss: 0.0011638362193480134 2023-01-24 08:09:12.605781: step: 1244/530, loss: 0.0026391472201794386 2023-01-24 08:09:13.662981: step: 1248/530, loss: 0.004858668893575668 2023-01-24 08:09:14.689399: step: 1252/530, loss: 0.0027947798371315002 2023-01-24 08:09:15.743772: step: 1256/530, loss: 0.0004653006326407194 2023-01-24 08:09:16.794125: step: 1260/530, loss: 0.0011524201836436987 2023-01-24 08:09:17.829452: step: 1264/530, loss: 0.002620370825752616 2023-01-24 08:09:18.879348: step: 1268/530, loss: 0.0065241591073572636 2023-01-24 08:09:19.915600: step: 1272/530, loss: 0.0035955074708908796 2023-01-24 08:09:20.962054: step: 1276/530, loss: 0.0005749856354668736 2023-01-24 08:09:22.025808: step: 1280/530, loss: 0.002244073897600174 2023-01-24 08:09:23.063608: step: 1284/530, loss: 0.0029421034269034863 2023-01-24 08:09:24.101295: step: 1288/530, loss: 0.002565886825323105 2023-01-24 08:09:25.138574: step: 1292/530, loss: 0.005780614446848631 2023-01-24 08:09:26.179233: step: 1296/530, loss: 0.0002358978526899591 2023-01-24 08:09:27.230208: step: 1300/530, loss: 0.003610714105889201 2023-01-24 08:09:28.275465: step: 1304/530, loss: 0.0023282982874661684 2023-01-24 08:09:29.326028: step: 1308/530, loss: 0.0001790036476450041 2023-01-24 08:09:30.370888: step: 1312/530, loss: 0.0048813773319125175 2023-01-24 08:09:31.444251: step: 1316/530, loss: 4.700659337686375e-05 2023-01-24 08:09:32.500586: step: 1320/530, loss: 0.0014433374162763357 2023-01-24 08:09:33.527389: step: 1324/530, loss: 0.00014284891949500889 2023-01-24 08:09:34.580485: step: 1328/530, loss: 0.0016807086067274213 2023-01-24 08:09:35.638592: step: 1332/530, loss: 0.004982365760952234 2023-01-24 08:09:36.696554: step: 1336/530, loss: 0.0050092837773263454 2023-01-24 08:09:37.731974: step: 1340/530, loss: 0.004040142055600882 2023-01-24 08:09:38.766702: step: 1344/530, loss: 0.0052107577212154865 2023-01-24 08:09:39.803269: step: 1348/530, loss: 0.0041431281715631485 2023-01-24 08:09:40.858526: step: 1352/530, loss: 0.0024121892638504505 2023-01-24 08:09:41.890094: step: 1356/530, loss: 0.008282479830086231 2023-01-24 08:09:42.950065: step: 1360/530, loss: 0.0006505693309009075 2023-01-24 08:09:44.001197: step: 1364/530, loss: 0.0016670534387230873 2023-01-24 08:09:45.031585: step: 1368/530, loss: 0.0010452264687046409 2023-01-24 08:09:46.072050: step: 1372/530, loss: 0.0008869652519933879 2023-01-24 08:09:47.120969: step: 1376/530, loss: 0.0010890167905017734 2023-01-24 08:09:48.158247: step: 1380/530, loss: 0.002823673654347658 2023-01-24 08:09:49.217640: step: 1384/530, loss: 0.006408573593944311 2023-01-24 08:09:50.287541: step: 1388/530, loss: 0.002019304782152176 2023-01-24 08:09:51.331934: step: 1392/530, loss: 0.001684128656052053 2023-01-24 08:09:52.379791: step: 1396/530, loss: 0.14118409156799316 2023-01-24 08:09:53.432287: step: 1400/530, loss: 0.006086037028580904 2023-01-24 08:09:54.470771: step: 1404/530, loss: 0.0029782152269035578 2023-01-24 08:09:55.495208: step: 1408/530, loss: 1.072677241609199e-05 2023-01-24 08:09:56.528214: step: 1412/530, loss: 0.0018608147511258721 2023-01-24 08:09:57.591105: step: 1416/530, loss: 0.0002685075451154262 2023-01-24 08:09:58.634650: step: 1420/530, loss: 0.017026811838150024 2023-01-24 08:09:59.679562: step: 1424/530, loss: 0.008269661106169224 2023-01-24 08:10:00.732618: step: 1428/530, loss: 4.369254384073429e-05 2023-01-24 08:10:01.760536: step: 1432/530, loss: 0.0007951008738018572 2023-01-24 08:10:02.794365: step: 1436/530, loss: 0.0016839754534885287 2023-01-24 08:10:03.855471: step: 1440/530, loss: 0.000541744870133698 2023-01-24 08:10:04.905051: step: 1444/530, loss: 3.0239729312597774e-05 2023-01-24 08:10:05.945641: step: 1448/530, loss: 0.00753433583304286 2023-01-24 08:10:06.980079: step: 1452/530, loss: 0.0019085907842963934 2023-01-24 08:10:08.018116: step: 1456/530, loss: 0.00901994202286005 2023-01-24 08:10:09.084444: step: 1460/530, loss: 0.007146323565393686 2023-01-24 08:10:10.130463: step: 1464/530, loss: 0.00172905414365232 2023-01-24 08:10:11.175022: step: 1468/530, loss: 0.005956052336841822 2023-01-24 08:10:12.211097: step: 1472/530, loss: 0.014158985577523708 2023-01-24 08:10:13.250261: step: 1476/530, loss: 0.0020066110882908106 2023-01-24 08:10:14.281618: step: 1480/530, loss: 4.1939885704778135e-05 2023-01-24 08:10:15.325951: step: 1484/530, loss: 7.217737584142014e-05 2023-01-24 08:10:16.379345: step: 1488/530, loss: 0.0016097412444651127 2023-01-24 08:10:17.410183: step: 1492/530, loss: 0.0010121164377778769 2023-01-24 08:10:18.444418: step: 1496/530, loss: 4.968651046510786e-05 2023-01-24 08:10:19.487422: step: 1500/530, loss: 0.00623213080689311 2023-01-24 08:10:20.526471: step: 1504/530, loss: 0.0002086248859995976 2023-01-24 08:10:21.563423: step: 1508/530, loss: 0.001149590709246695 2023-01-24 08:10:22.619007: step: 1512/530, loss: 0.006035902071744204 2023-01-24 08:10:23.648238: step: 1516/530, loss: 0.0028512482531368732 2023-01-24 08:10:24.712234: step: 1520/530, loss: 0.005742454435676336 2023-01-24 08:10:25.732802: step: 1524/530, loss: 0.0010509680723771453 2023-01-24 08:10:26.780417: step: 1528/530, loss: 0.00010907711111940444 2023-01-24 08:10:27.810311: step: 1532/530, loss: 0.004124751314520836 2023-01-24 08:10:28.841351: step: 1536/530, loss: 0.0012129239039495587 2023-01-24 08:10:29.871867: step: 1540/530, loss: 0.0009087308426387608 2023-01-24 08:10:30.905197: step: 1544/530, loss: 0.004887440241873264 2023-01-24 08:10:31.937476: step: 1548/530, loss: 0.0 2023-01-24 08:10:32.994786: step: 1552/530, loss: 0.003754856064915657 2023-01-24 08:10:34.036881: step: 1556/530, loss: 0.0009373383945785463 2023-01-24 08:10:35.100646: step: 1560/530, loss: 0.001886929851025343 2023-01-24 08:10:36.139182: step: 1564/530, loss: 0.005456239450722933 2023-01-24 08:10:37.198994: step: 1568/530, loss: 0.004966110922396183 2023-01-24 08:10:38.243385: step: 1572/530, loss: 0.0017675001872703433 2023-01-24 08:10:39.298767: step: 1576/530, loss: 0.0038811187259852886 2023-01-24 08:10:40.340522: step: 1580/530, loss: 0.006399739999324083 2023-01-24 08:10:41.376749: step: 1584/530, loss: 0.0018490948714315891 2023-01-24 08:10:42.403796: step: 1588/530, loss: 0.0029616185929626226 2023-01-24 08:10:43.440442: step: 1592/530, loss: 0.007141935173422098 2023-01-24 08:10:44.469917: step: 1596/530, loss: 0.00014484429266303778 2023-01-24 08:10:45.533413: step: 1600/530, loss: 0.01417284831404686 2023-01-24 08:10:46.562813: step: 1604/530, loss: 0.002109603490680456 2023-01-24 08:10:47.612937: step: 1608/530, loss: 0.005846297834068537 2023-01-24 08:10:48.650616: step: 1612/530, loss: 0.00015911986702121794 2023-01-24 08:10:49.692534: step: 1616/530, loss: 0.007112887222319841 2023-01-24 08:10:50.740283: step: 1620/530, loss: 0.018406052142381668 2023-01-24 08:10:51.821725: step: 1624/530, loss: 0.00012296879140194505 2023-01-24 08:10:52.853175: step: 1628/530, loss: 0.005481957923620939 2023-01-24 08:10:53.897307: step: 1632/530, loss: 0.0037433719262480736 2023-01-24 08:10:54.919075: step: 1636/530, loss: 0.0011715436121448874 2023-01-24 08:10:55.951877: step: 1640/530, loss: 4.916386023978703e-05 2023-01-24 08:10:57.005616: step: 1644/530, loss: 0.0015766690485179424 2023-01-24 08:10:58.035119: step: 1648/530, loss: 0.0032344404608011246 2023-01-24 08:10:59.060437: step: 1652/530, loss: 0.0077257719822227955 2023-01-24 08:11:00.106980: step: 1656/530, loss: 0.00023749937827233225 2023-01-24 08:11:01.137879: step: 1660/530, loss: 0.005592431407421827 2023-01-24 08:11:02.168471: step: 1664/530, loss: 0.0031693640630692244 2023-01-24 08:11:03.229695: step: 1668/530, loss: 0.0035397526808083057 2023-01-24 08:11:04.256385: step: 1672/530, loss: 0.0005305302329361439 2023-01-24 08:11:05.303899: step: 1676/530, loss: 0.0034351455979049206 2023-01-24 08:11:06.340039: step: 1680/530, loss: 0.0028322439175099134 2023-01-24 08:11:07.395098: step: 1684/530, loss: 0.0005825162515975535 2023-01-24 08:11:08.426340: step: 1688/530, loss: 0.006902835797518492 2023-01-24 08:11:09.456172: step: 1692/530, loss: 0.0014823701931163669 2023-01-24 08:11:10.506072: step: 1696/530, loss: 0.001065253745764494 2023-01-24 08:11:11.556744: step: 1700/530, loss: 0.01789345033466816 2023-01-24 08:11:12.589684: step: 1704/530, loss: 0.002103856299072504 2023-01-24 08:11:13.617899: step: 1708/530, loss: 0.0009596335585229099 2023-01-24 08:11:14.657713: step: 1712/530, loss: 0.00040444484329782426 2023-01-24 08:11:15.710276: step: 1716/530, loss: 0.0002746698446571827 2023-01-24 08:11:16.742349: step: 1720/530, loss: 0.0010927320690825582 2023-01-24 08:11:17.788471: step: 1724/530, loss: 6.922454485902563e-05 2023-01-24 08:11:18.821221: step: 1728/530, loss: 0.002970654983073473 2023-01-24 08:11:19.871952: step: 1732/530, loss: 0.0026557997334748507 2023-01-24 08:11:20.909140: step: 1736/530, loss: 0.005885441321879625 2023-01-24 08:11:21.943054: step: 1740/530, loss: 0.0031337642576545477 2023-01-24 08:11:22.977221: step: 1744/530, loss: 0.004391557537019253 2023-01-24 08:11:24.059980: step: 1748/530, loss: 0.01008619088679552 2023-01-24 08:11:25.079579: step: 1752/530, loss: 0.0005449464661069214 2023-01-24 08:11:26.108329: step: 1756/530, loss: 0.0004244691808708012 2023-01-24 08:11:27.138022: step: 1760/530, loss: 3.0600263016822282e-06 2023-01-24 08:11:28.171248: step: 1764/530, loss: 0.0009252700838260353 2023-01-24 08:11:29.212866: step: 1768/530, loss: 0.002439627656713128 2023-01-24 08:11:30.262947: step: 1772/530, loss: 0.0002417669747956097 2023-01-24 08:11:31.309086: step: 1776/530, loss: 0.004936986602842808 2023-01-24 08:11:32.340034: step: 1780/530, loss: 0.004176536109298468 2023-01-24 08:11:33.397885: step: 1784/530, loss: 0.0015248837880790234 2023-01-24 08:11:34.440638: step: 1788/530, loss: 0.0009485507034696639 2023-01-24 08:11:35.482175: step: 1792/530, loss: 0.000917789526283741 2023-01-24 08:11:36.532948: step: 1796/530, loss: 0.003934743348509073 2023-01-24 08:11:37.592160: step: 1800/530, loss: 0.0017367423279210925 2023-01-24 08:11:38.631420: step: 1804/530, loss: 0.00031899186433292925 2023-01-24 08:11:39.674300: step: 1808/530, loss: 0.0009279457735829055 2023-01-24 08:11:40.706282: step: 1812/530, loss: 0.007400153670459986 2023-01-24 08:11:41.758336: step: 1816/530, loss: 4.4409425754565746e-05 2023-01-24 08:11:42.798277: step: 1820/530, loss: 0.004460947588086128 2023-01-24 08:11:43.837458: step: 1824/530, loss: 3.0821589461993426e-05 2023-01-24 08:11:44.882657: step: 1828/530, loss: 0.002043446758762002 2023-01-24 08:11:45.924592: step: 1832/530, loss: 0.00819195806980133 2023-01-24 08:11:46.961089: step: 1836/530, loss: 0.000686023267917335 2023-01-24 08:11:47.996921: step: 1840/530, loss: 0.00717303017154336 2023-01-24 08:11:49.034811: step: 1844/530, loss: 0.0001378904707962647 2023-01-24 08:11:50.078345: step: 1848/530, loss: 0.000975067843683064 2023-01-24 08:11:51.127905: step: 1852/530, loss: 0.0031472533009946346 2023-01-24 08:11:52.181509: step: 1856/530, loss: 0.0085146464407444 2023-01-24 08:11:53.223655: step: 1860/530, loss: 1.5978568626451306e-05 2023-01-24 08:11:54.271518: step: 1864/530, loss: 0.0018684043316170573 2023-01-24 08:11:55.326518: step: 1868/530, loss: 0.0014190655201673508 2023-01-24 08:11:56.371999: step: 1872/530, loss: 0.00028407294303178787 2023-01-24 08:11:57.405736: step: 1876/530, loss: 0.003862496931105852 2023-01-24 08:11:58.445440: step: 1880/530, loss: 0.0007444398943334818 2023-01-24 08:11:59.475503: step: 1884/530, loss: 0.0008316596504300833 2023-01-24 08:12:00.520542: step: 1888/530, loss: 0.0024567798245698214 2023-01-24 08:12:01.565382: step: 1892/530, loss: 3.7581445212708786e-05 2023-01-24 08:12:02.617331: step: 1896/530, loss: 0.0005281384219415486 2023-01-24 08:12:03.661503: step: 1900/530, loss: 0.0015169217949733138 2023-01-24 08:12:04.704925: step: 1904/530, loss: 2.5921190172084607e-05 2023-01-24 08:12:05.743581: step: 1908/530, loss: 0.0028863977640867233 2023-01-24 08:12:06.793135: step: 1912/530, loss: 0.014135162346065044 2023-01-24 08:12:07.843979: step: 1916/530, loss: 0.0031662173569202423 2023-01-24 08:12:08.881302: step: 1920/530, loss: 0.005211448762565851 2023-01-24 08:12:09.907622: step: 1924/530, loss: 0.008082851767539978 2023-01-24 08:12:10.948752: step: 1928/530, loss: 0.0007151024765335023 2023-01-24 08:12:11.988276: step: 1932/530, loss: 0.021478649228811264 2023-01-24 08:12:13.017729: step: 1936/530, loss: 0.0 2023-01-24 08:12:14.055537: step: 1940/530, loss: 0.0015179453184828162 2023-01-24 08:12:15.094734: step: 1944/530, loss: 0.004567896015942097 2023-01-24 08:12:16.145476: step: 1948/530, loss: 0.00677313469350338 2023-01-24 08:12:17.201009: step: 1952/530, loss: 0.0017850816948339343 2023-01-24 08:12:18.239317: step: 1956/530, loss: 0.024138212203979492 2023-01-24 08:12:19.272430: step: 1960/530, loss: 0.005984392017126083 2023-01-24 08:12:20.318843: step: 1964/530, loss: 0.000849053671117872 2023-01-24 08:12:21.363763: step: 1968/530, loss: 0.00010138084326172248 2023-01-24 08:12:22.410510: step: 1972/530, loss: 0.004166722763329744 2023-01-24 08:12:23.466182: step: 1976/530, loss: 0.0022677145898342133 2023-01-24 08:12:24.507936: step: 1980/530, loss: 5.0635961088119075e-05 2023-01-24 08:12:25.568473: step: 1984/530, loss: 0.004011231940239668 2023-01-24 08:12:26.602687: step: 1988/530, loss: 0.015933707356452942 2023-01-24 08:12:27.645283: step: 1992/530, loss: 0.003142152912914753 2023-01-24 08:12:28.691048: step: 1996/530, loss: 0.0011389505816623569 2023-01-24 08:12:29.725937: step: 2000/530, loss: 0.00748224463313818 2023-01-24 08:12:30.780292: step: 2004/530, loss: 0.008931251242756844 2023-01-24 08:12:31.817576: step: 2008/530, loss: 0.00011959778203163296 2023-01-24 08:12:32.860981: step: 2012/530, loss: 0.005308498162776232 2023-01-24 08:12:33.898024: step: 2016/530, loss: 0.00034672507899813354 2023-01-24 08:12:34.934227: step: 2020/530, loss: 0.01122039183974266 2023-01-24 08:12:35.958545: step: 2024/530, loss: 0.00044637013343162835 2023-01-24 08:12:37.000653: step: 2028/530, loss: 0.0007838958990760148 2023-01-24 08:12:38.026245: step: 2032/530, loss: 0.0021932253148406744 2023-01-24 08:12:39.084358: step: 2036/530, loss: 0.00010908945114351809 2023-01-24 08:12:40.133849: step: 2040/530, loss: 0.0003816072130575776 2023-01-24 08:12:41.189836: step: 2044/530, loss: 0.004653113428503275 2023-01-24 08:12:42.234437: step: 2048/530, loss: 0.0012212434085085988 2023-01-24 08:12:43.288848: step: 2052/530, loss: 0.0019578351639211178 2023-01-24 08:12:44.325549: step: 2056/530, loss: 0.0010203371057286859 2023-01-24 08:12:45.376204: step: 2060/530, loss: 0.003280231961980462 2023-01-24 08:12:46.424995: step: 2064/530, loss: 0.004118583630770445 2023-01-24 08:12:47.457121: step: 2068/530, loss: 0.0024739992804825306 2023-01-24 08:12:48.509236: step: 2072/530, loss: 0.006869019940495491 2023-01-24 08:12:49.555038: step: 2076/530, loss: 0.006774529814720154 2023-01-24 08:12:50.597893: step: 2080/530, loss: 0.0034330282360315323 2023-01-24 08:12:51.650182: step: 2084/530, loss: 0.004724840633571148 2023-01-24 08:12:52.694763: step: 2088/530, loss: 0.0016951600555330515 2023-01-24 08:12:53.734234: step: 2092/530, loss: 0.0011921994155272841 2023-01-24 08:12:54.775232: step: 2096/530, loss: 0.00022403204638976604 2023-01-24 08:12:55.825105: step: 2100/530, loss: 0.0036077210679650307 2023-01-24 08:12:56.868785: step: 2104/530, loss: 0.0007157736108638346 2023-01-24 08:12:57.924254: step: 2108/530, loss: 0.001830795779824257 2023-01-24 08:12:58.972465: step: 2112/530, loss: 0.004905502311885357 2023-01-24 08:13:00.009287: step: 2116/530, loss: 2.134965507138986e-05 2023-01-24 08:13:01.039666: step: 2120/530, loss: 0.0008202884346246719 ================================================== Loss: 0.004 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37360033259423503, 'r': 0.319722485768501, 'f1': 0.34456799591002046}, 'combined': 0.25389220751264663, 'stategy': 1, 'epoch': 16} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3766596987619097, 'r': 0.3898150926524911, 'f1': 0.38312449937299936}, 'combined': 0.2969673153034732, 'stategy': 1, 'epoch': 16} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3915268055997455, 'r': 0.3335778666305232, 'f1': 0.36023675351288054}, 'combined': 0.26543760785159615, 'stategy': 1, 'epoch': 16} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3717670621108563, 'r': 0.3686917831044246, 'f1': 0.37022303647218635}, 'combined': 0.286967138318154, 'stategy': 1, 'epoch': 16} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38297703353635176, 'r': 0.33283393047371745, 'f1': 0.35614920073025197}, 'combined': 0.26242572685386983, 'stategy': 1, 'epoch': 16} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3618026351900417, 'r': 0.3604724784430195, 'f1': 0.3611363319944799}, 'combined': 0.2799238554215586, 'stategy': 1, 'epoch': 16} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 16} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5, 'r': 0.41304347826086957, 'f1': 0.45238095238095233}, 'combined': 0.22619047619047616, 'stategy': 1, 'epoch': 16} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 16} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37786862527716186, 'r': 0.32337523719165084, 'f1': 0.3485046012269939}, 'combined': 0.2567928640619955, 'stategy': 1, 'epoch': 12} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37377987703702326, 'r': 0.38889597500543227, 'f1': 0.3811881268521715}, 'combined': 0.2954663949763244, 'stategy': 1, 'epoch': 12} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 12} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3851604396498889, 'r': 0.33473146368054857, 'f1': 0.3581796575830439}, 'combined': 0.26392185295592707, 'stategy': 1, 'epoch': 15} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3640887768447368, 'r': 0.3620809343253724, 'f1': 0.3630820797659034}, 'combined': 0.28143204268936056, 'stategy': 1, 'epoch': 15} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 15} ****************************** Epoch: 17 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 08:15:24.857374: step: 4/530, loss: 0.0014743524370715022 2023-01-24 08:15:25.896490: step: 8/530, loss: 0.00660325912758708 2023-01-24 08:15:26.919174: step: 12/530, loss: 0.002118706936016679 2023-01-24 08:15:27.967122: step: 16/530, loss: 0.01160414982587099 2023-01-24 08:15:29.003318: step: 20/530, loss: 0.000995034002698958 2023-01-24 08:15:30.033094: step: 24/530, loss: 0.0025456808507442474 2023-01-24 08:15:31.077396: step: 28/530, loss: 0.0007189153111539781 2023-01-24 08:15:32.114786: step: 32/530, loss: 0.0004857582098338753 2023-01-24 08:15:33.154363: step: 36/530, loss: 0.0017247971845790744 2023-01-24 08:15:34.190962: step: 40/530, loss: 0.00021397563978098333 2023-01-24 08:15:35.225127: step: 44/530, loss: 0.004515861626714468 2023-01-24 08:15:36.251102: step: 48/530, loss: 0.0005723762442357838 2023-01-24 08:15:37.289486: step: 52/530, loss: 0.0005342873046174645 2023-01-24 08:15:38.317511: step: 56/530, loss: 0.0199979767203331 2023-01-24 08:15:39.350621: step: 60/530, loss: 0.004544694907963276 2023-01-24 08:15:40.402771: step: 64/530, loss: 0.0007314592367038131 2023-01-24 08:15:41.437101: step: 68/530, loss: 0.0029184159357100725 2023-01-24 08:15:42.482926: step: 72/530, loss: 0.0004968098364770412 2023-01-24 08:15:43.523547: step: 76/530, loss: 0.0031347903423011303 2023-01-24 08:15:44.573301: step: 80/530, loss: 0.0010143619729205966 2023-01-24 08:15:45.608438: step: 84/530, loss: 0.00048273411812260747 2023-01-24 08:15:46.647151: step: 88/530, loss: 2.379666329943575e-05 2023-01-24 08:15:47.677059: step: 92/530, loss: 0.0016256897943094373 2023-01-24 08:15:48.715319: step: 96/530, loss: 0.0015957856085151434 2023-01-24 08:15:49.760788: step: 100/530, loss: 0.007323454134166241 2023-01-24 08:15:50.797027: step: 104/530, loss: 0.002840333618223667 2023-01-24 08:15:51.829284: step: 108/530, loss: 0.008337774313986301 2023-01-24 08:15:52.872077: step: 112/530, loss: 0.0181791540235281 2023-01-24 08:15:53.912458: step: 116/530, loss: 5.583392703556456e-05 2023-01-24 08:15:54.941986: step: 120/530, loss: 6.064720309950644e-06 2023-01-24 08:15:56.000740: step: 124/530, loss: 0.005723145324736834 2023-01-24 08:15:57.050217: step: 128/530, loss: 0.017118489369750023 2023-01-24 08:15:58.108004: step: 132/530, loss: 0.021794024854898453 2023-01-24 08:15:59.166593: step: 136/530, loss: 0.010343911126255989 2023-01-24 08:16:00.217516: step: 140/530, loss: 5.1592636737041175e-05 2023-01-24 08:16:01.260821: step: 144/530, loss: 0.023200225085020065 2023-01-24 08:16:02.293564: step: 148/530, loss: 0.00417774822562933 2023-01-24 08:16:03.343628: step: 152/530, loss: 0.00023547696764580905 2023-01-24 08:16:04.381790: step: 156/530, loss: 0.003617009148001671 2023-01-24 08:16:05.418138: step: 160/530, loss: 0.0003376854583621025 2023-01-24 08:16:06.458245: step: 164/530, loss: 0.0007484745001420379 2023-01-24 08:16:07.501549: step: 168/530, loss: 0.00010161162936128676 2023-01-24 08:16:08.539267: step: 172/530, loss: 0.009199620224535465 2023-01-24 08:16:09.574420: step: 176/530, loss: 0.003756369696930051 2023-01-24 08:16:10.625016: step: 180/530, loss: 0.0032707166392356157 2023-01-24 08:16:11.685571: step: 184/530, loss: 0.0004229229816701263 2023-01-24 08:16:12.722420: step: 188/530, loss: 0.0023302605841308832 2023-01-24 08:16:13.764262: step: 192/530, loss: 0.0002956682874355465 2023-01-24 08:16:14.809424: step: 196/530, loss: 0.0005876939394511282 2023-01-24 08:16:15.849056: step: 200/530, loss: 0.004324890673160553 2023-01-24 08:16:16.899650: step: 204/530, loss: 0.0010831811232492328 2023-01-24 08:16:17.935959: step: 208/530, loss: 0.0015409933403134346 2023-01-24 08:16:18.995141: step: 212/530, loss: 0.015628740191459656 2023-01-24 08:16:20.035962: step: 216/530, loss: 4.612496923073195e-05 2023-01-24 08:16:21.078059: step: 220/530, loss: 0.0011591032380238175 2023-01-24 08:16:22.132056: step: 224/530, loss: 0.003789310809224844 2023-01-24 08:16:23.185112: step: 228/530, loss: 0.05970427766442299 2023-01-24 08:16:24.236885: step: 232/530, loss: 0.00018468995403964072 2023-01-24 08:16:25.289681: step: 236/530, loss: 0.0008769754786044359 2023-01-24 08:16:26.337223: step: 240/530, loss: 0.007567410357296467 2023-01-24 08:16:27.377132: step: 244/530, loss: 1.0661425221769605e-05 2023-01-24 08:16:28.419415: step: 248/530, loss: 0.00039061999996192753 2023-01-24 08:16:29.454237: step: 252/530, loss: 0.008116090670228004 2023-01-24 08:16:30.506215: step: 256/530, loss: 0.006383896805346012 2023-01-24 08:16:31.577444: step: 260/530, loss: 0.0008009921293705702 2023-01-24 08:16:32.642345: step: 264/530, loss: 0.006543674506247044 2023-01-24 08:16:33.708905: step: 268/530, loss: 0.0027854307554662228 2023-01-24 08:16:34.748233: step: 272/530, loss: 0.0022404994815587997 2023-01-24 08:16:35.788001: step: 276/530, loss: 8.202244498534128e-05 2023-01-24 08:16:36.829957: step: 280/530, loss: 0.00045637405128218234 2023-01-24 08:16:37.885769: step: 284/530, loss: 0.001067394157871604 2023-01-24 08:16:38.928531: step: 288/530, loss: 0.0037804178427904844 2023-01-24 08:16:39.966132: step: 292/530, loss: 0.002081147860735655 2023-01-24 08:16:41.038302: step: 296/530, loss: 0.005376341287046671 2023-01-24 08:16:42.098423: step: 300/530, loss: 0.0017974644433706999 2023-01-24 08:16:43.150172: step: 304/530, loss: 0.0035429177805781364 2023-01-24 08:16:44.181065: step: 308/530, loss: 0.0031821520533412695 2023-01-24 08:16:45.232354: step: 312/530, loss: 0.003984443377703428 2023-01-24 08:16:46.284973: step: 316/530, loss: 0.002903739921748638 2023-01-24 08:16:47.322641: step: 320/530, loss: 3.6114051908953115e-05 2023-01-24 08:16:48.370226: step: 324/530, loss: 0.001399812987074256 2023-01-24 08:16:49.423140: step: 328/530, loss: 0.0012534570414572954 2023-01-24 08:16:50.466308: step: 332/530, loss: 2.926984234363772e-05 2023-01-24 08:16:51.512707: step: 336/530, loss: 7.785757588862907e-06 2023-01-24 08:16:52.550885: step: 340/530, loss: 0.002381031634286046 2023-01-24 08:16:53.605099: step: 344/530, loss: 0.0032594960648566484 2023-01-24 08:16:54.646038: step: 348/530, loss: 0.00030655748560093343 2023-01-24 08:16:55.700623: step: 352/530, loss: 0.0011889704037457705 2023-01-24 08:16:56.745724: step: 356/530, loss: 0.001804513274691999 2023-01-24 08:16:57.787638: step: 360/530, loss: 0.0006564568029716611 2023-01-24 08:16:58.843264: step: 364/530, loss: 0.0011546405730769038 2023-01-24 08:16:59.902575: step: 368/530, loss: 0.0066480194218456745 2023-01-24 08:17:00.950501: step: 372/530, loss: 0.001040980452671647 2023-01-24 08:17:02.008050: step: 376/530, loss: 0.0015139712486416101 2023-01-24 08:17:03.052074: step: 380/530, loss: 0.004264846444129944 2023-01-24 08:17:04.101721: step: 384/530, loss: 0.002495660213753581 2023-01-24 08:17:05.147998: step: 388/530, loss: 0.001489577116444707 2023-01-24 08:17:06.184367: step: 392/530, loss: 0.0006889705546200275 2023-01-24 08:17:07.228561: step: 396/530, loss: 1.6155940102180466e-05 2023-01-24 08:17:08.263040: step: 400/530, loss: 0.0027616501320153475 2023-01-24 08:17:09.339888: step: 404/530, loss: 0.0005016099312342703 2023-01-24 08:17:10.374628: step: 408/530, loss: 5.982349466648884e-05 2023-01-24 08:17:11.412640: step: 412/530, loss: 0.0021680383943021297 2023-01-24 08:17:12.459203: step: 416/530, loss: 0.0008663540938869119 2023-01-24 08:17:13.494299: step: 420/530, loss: 0.004597248509526253 2023-01-24 08:17:14.537126: step: 424/530, loss: 0.02016008272767067 2023-01-24 08:17:15.592252: step: 428/530, loss: 0.0061422428116202354 2023-01-24 08:17:16.643763: step: 432/530, loss: 0.0020309591200202703 2023-01-24 08:17:17.683884: step: 436/530, loss: 0.0007287589833140373 2023-01-24 08:17:18.729684: step: 440/530, loss: 0.00010903603833867237 2023-01-24 08:17:19.773616: step: 444/530, loss: 0.0007346912170760334 2023-01-24 08:17:20.805116: step: 448/530, loss: 8.541832357877865e-05 2023-01-24 08:17:21.840636: step: 452/530, loss: 0.0005568701890297234 2023-01-24 08:17:22.886416: step: 456/530, loss: 0.002599509200081229 2023-01-24 08:17:23.918223: step: 460/530, loss: 0.006765200290828943 2023-01-24 08:17:24.968025: step: 464/530, loss: 0.004038615617901087 2023-01-24 08:17:26.026267: step: 468/530, loss: 0.0026833934243768454 2023-01-24 08:17:27.065235: step: 472/530, loss: 8.310659904964268e-05 2023-01-24 08:17:28.105693: step: 476/530, loss: 0.0036551819648593664 2023-01-24 08:17:29.160728: step: 480/530, loss: 0.0007989761070348322 2023-01-24 08:17:30.199753: step: 484/530, loss: 0.0016497164033353329 2023-01-24 08:17:31.249534: step: 488/530, loss: 0.009886185638606548 2023-01-24 08:17:32.292330: step: 492/530, loss: 0.0048872074112296104 2023-01-24 08:17:33.332941: step: 496/530, loss: 0.005567581858485937 2023-01-24 08:17:34.390982: step: 500/530, loss: 0.005139694083482027 2023-01-24 08:17:35.435093: step: 504/530, loss: 2.5667219233582728e-05 2023-01-24 08:17:36.472751: step: 508/530, loss: 0.00192461593542248 2023-01-24 08:17:37.520501: step: 512/530, loss: 0.00033468438778072596 2023-01-24 08:17:38.547519: step: 516/530, loss: 0.00022340647410601377 2023-01-24 08:17:39.579447: step: 520/530, loss: 0.0 2023-01-24 08:17:40.607483: step: 524/530, loss: 0.00043057568836957216 2023-01-24 08:17:41.667612: step: 528/530, loss: 0.008411814458668232 2023-01-24 08:17:42.711324: step: 532/530, loss: 0.001558232237584889 2023-01-24 08:17:43.760878: step: 536/530, loss: 0.00020881154341623187 2023-01-24 08:17:44.820692: step: 540/530, loss: 0.0002815257175825536 2023-01-24 08:17:45.865603: step: 544/530, loss: 0.004458381794393063 2023-01-24 08:17:46.916476: step: 548/530, loss: 0.0006919911247678101 2023-01-24 08:17:47.963072: step: 552/530, loss: 0.0032196755055338144 2023-01-24 08:17:49.028469: step: 556/530, loss: 0.014050937257707119 2023-01-24 08:17:50.058003: step: 560/530, loss: 0.00042544055031612515 2023-01-24 08:17:51.099314: step: 564/530, loss: 0.0019391147652640939 2023-01-24 08:17:52.128260: step: 568/530, loss: 0.006159898359328508 2023-01-24 08:17:53.157616: step: 572/530, loss: 4.290868673706427e-05 2023-01-24 08:17:54.202069: step: 576/530, loss: 0.02716648392379284 2023-01-24 08:17:55.243053: step: 580/530, loss: 0.004047059919685125 2023-01-24 08:17:56.282933: step: 584/530, loss: 0.030086390674114227 2023-01-24 08:17:57.384798: step: 588/530, loss: 0.006701093167066574 2023-01-24 08:17:58.420649: step: 592/530, loss: 0.010631301440298557 2023-01-24 08:17:59.472387: step: 596/530, loss: 0.0011468518059700727 2023-01-24 08:18:00.533208: step: 600/530, loss: 0.00012781946861650795 2023-01-24 08:18:01.577290: step: 604/530, loss: 0.0058357068337500095 2023-01-24 08:18:02.634233: step: 608/530, loss: 0.005029411055147648 2023-01-24 08:18:03.679904: step: 612/530, loss: 0.0014399680076166987 2023-01-24 08:18:04.729397: step: 616/530, loss: 0.022985175251960754 2023-01-24 08:18:05.764081: step: 620/530, loss: 0.0028079496696591377 2023-01-24 08:18:06.802291: step: 624/530, loss: 0.00388165982440114 2023-01-24 08:18:07.856498: step: 628/530, loss: 0.004202249925583601 2023-01-24 08:18:08.888097: step: 632/530, loss: 9.889141074381769e-05 2023-01-24 08:18:09.945561: step: 636/530, loss: 0.0028493842110037804 2023-01-24 08:18:10.981753: step: 640/530, loss: 0.013812733814120293 2023-01-24 08:18:12.034221: step: 644/530, loss: 0.0009513215045444667 2023-01-24 08:18:13.081248: step: 648/530, loss: 0.006368516478687525 2023-01-24 08:18:14.112484: step: 652/530, loss: 0.0006524188793264329 2023-01-24 08:18:15.159105: step: 656/530, loss: 0.0005199095467105508 2023-01-24 08:18:16.186836: step: 660/530, loss: 0.0009050218504853547 2023-01-24 08:18:17.216238: step: 664/530, loss: 0.0006994634750299156 2023-01-24 08:18:18.248929: step: 668/530, loss: 0.03267935663461685 2023-01-24 08:18:19.288948: step: 672/530, loss: 0.004737501032650471 2023-01-24 08:18:20.336156: step: 676/530, loss: 0.009582619182765484 2023-01-24 08:18:21.376009: step: 680/530, loss: 0.0015747654251754284 2023-01-24 08:18:22.420357: step: 684/530, loss: 0.00012585647345986217 2023-01-24 08:18:23.463888: step: 688/530, loss: 5.6749038776615635e-05 2023-01-24 08:18:24.505851: step: 692/530, loss: 0.002744994591921568 2023-01-24 08:18:25.553549: step: 696/530, loss: 0.00013972545275464654 2023-01-24 08:18:26.596969: step: 700/530, loss: 0.002954637398943305 2023-01-24 08:18:27.647949: step: 704/530, loss: 0.0026447754353284836 2023-01-24 08:18:28.698355: step: 708/530, loss: 0.0026327811647206545 2023-01-24 08:18:29.745939: step: 712/530, loss: 0.0020958720706403255 2023-01-24 08:18:30.782397: step: 716/530, loss: 0.0012459418503567576 2023-01-24 08:18:31.810984: step: 720/530, loss: 0.004910951945930719 2023-01-24 08:18:32.856269: step: 724/530, loss: 0.0011317277094349265 2023-01-24 08:18:33.898315: step: 728/530, loss: 0.0038981973193585873 2023-01-24 08:18:34.937637: step: 732/530, loss: 0.0024162873160094023 2023-01-24 08:18:35.963727: step: 736/530, loss: 0.002626921283081174 2023-01-24 08:18:37.002999: step: 740/530, loss: 5.8769681345438585e-05 2023-01-24 08:18:38.046061: step: 744/530, loss: 3.639415126599488e-06 2023-01-24 08:18:39.083824: step: 748/530, loss: 0.003267729887738824 2023-01-24 08:18:40.123770: step: 752/530, loss: 0.0011516103986650705 2023-01-24 08:18:41.179464: step: 756/530, loss: 0.008302648551762104 2023-01-24 08:18:42.226085: step: 760/530, loss: 0.002034844597801566 2023-01-24 08:18:43.271219: step: 764/530, loss: 0.0019169322913512588 2023-01-24 08:18:44.299764: step: 768/530, loss: 0.0002494501241017133 2023-01-24 08:18:45.371761: step: 772/530, loss: 0.0040806373581290245 2023-01-24 08:18:46.425259: step: 776/530, loss: 0.002027878537774086 2023-01-24 08:18:47.477034: step: 780/530, loss: 0.00392110412940383 2023-01-24 08:18:48.530712: step: 784/530, loss: 0.0017771513666957617 2023-01-24 08:18:49.593400: step: 788/530, loss: 0.0020230517257004976 2023-01-24 08:18:50.659760: step: 792/530, loss: 0.0038418262265622616 2023-01-24 08:18:51.729845: step: 796/530, loss: 0.0003984452341683209 2023-01-24 08:18:52.776396: step: 800/530, loss: 0.0006332120974548161 2023-01-24 08:18:53.813099: step: 804/530, loss: 0.0005243832711130381 2023-01-24 08:18:54.857917: step: 808/530, loss: 0.0011281610932201147 2023-01-24 08:18:55.887112: step: 812/530, loss: 0.00019324151799082756 2023-01-24 08:18:56.938903: step: 816/530, loss: 0.003829157678410411 2023-01-24 08:18:57.989685: step: 820/530, loss: 0.0007295019458979368 2023-01-24 08:18:59.026129: step: 824/530, loss: 0.000566175440326333 2023-01-24 08:19:00.075295: step: 828/530, loss: 2.1496136923815357e-06 2023-01-24 08:19:01.133099: step: 832/530, loss: 0.004715491086244583 2023-01-24 08:19:02.207008: step: 836/530, loss: 0.0002592035452835262 2023-01-24 08:19:03.262656: step: 840/530, loss: 0.005107673816382885 2023-01-24 08:19:04.305539: step: 844/530, loss: 1.848885767685715e-05 2023-01-24 08:19:05.346029: step: 848/530, loss: 0.018713941797614098 2023-01-24 08:19:06.396505: step: 852/530, loss: 0.00025651376927271485 2023-01-24 08:19:07.430923: step: 856/530, loss: 0.005111071281135082 2023-01-24 08:19:08.472729: step: 860/530, loss: 0.0030666294042021036 2023-01-24 08:19:09.512995: step: 864/530, loss: 7.297576303244568e-06 2023-01-24 08:19:10.551465: step: 868/530, loss: 6.415243842639029e-05 2023-01-24 08:19:11.594856: step: 872/530, loss: 2.8920791010023095e-05 2023-01-24 08:19:12.671409: step: 876/530, loss: 0.0132964001968503 2023-01-24 08:19:13.706251: step: 880/530, loss: 7.976187043823302e-05 2023-01-24 08:19:14.750568: step: 884/530, loss: 0.0013392781838774681 2023-01-24 08:19:15.790248: step: 888/530, loss: 0.00027853852952830493 2023-01-24 08:19:16.835089: step: 892/530, loss: 0.00486866245046258 2023-01-24 08:19:17.858978: step: 896/530, loss: 0.00013463993673212826 2023-01-24 08:19:18.895058: step: 900/530, loss: 0.00016759242862462997 2023-01-24 08:19:19.920512: step: 904/530, loss: 0.0003341655246913433 2023-01-24 08:19:20.963824: step: 908/530, loss: 0.013280771672725677 2023-01-24 08:19:22.022602: step: 912/530, loss: 0.0018408300820738077 2023-01-24 08:19:23.043758: step: 916/530, loss: 0.0037589133717119694 2023-01-24 08:19:24.094277: step: 920/530, loss: 0.00534787168726325 2023-01-24 08:19:25.127923: step: 924/530, loss: 0.005053365603089333 2023-01-24 08:19:26.153212: step: 928/530, loss: 0.006376977544277906 2023-01-24 08:19:27.200681: step: 932/530, loss: 0.0014519501710310578 2023-01-24 08:19:28.249161: step: 936/530, loss: 0.010115046985447407 2023-01-24 08:19:29.293202: step: 940/530, loss: 0.0023108532186597586 2023-01-24 08:19:30.339149: step: 944/530, loss: 0.002152229892089963 2023-01-24 08:19:31.375370: step: 948/530, loss: 0.0024788787122815847 2023-01-24 08:19:32.419298: step: 952/530, loss: 0.0013619255041703582 2023-01-24 08:19:33.471651: step: 956/530, loss: 0.000624710984993726 2023-01-24 08:19:34.518106: step: 960/530, loss: 0.00013595822383649647 2023-01-24 08:19:35.551623: step: 964/530, loss: 0.00014411963638849556 2023-01-24 08:19:36.617008: step: 968/530, loss: 0.0028496801387518644 2023-01-24 08:19:37.670302: step: 972/530, loss: 0.0010090307332575321 2023-01-24 08:19:38.706099: step: 976/530, loss: 3.6769513371837093e-06 2023-01-24 08:19:39.749298: step: 980/530, loss: 0.0012742517283186316 2023-01-24 08:19:40.784609: step: 984/530, loss: 2.5884797651087865e-05 2023-01-24 08:19:41.821866: step: 988/530, loss: 0.002917702542617917 2023-01-24 08:19:42.850473: step: 992/530, loss: 0.0004270431527402252 2023-01-24 08:19:43.912567: step: 996/530, loss: 0.007105897180736065 2023-01-24 08:19:44.959231: step: 1000/530, loss: 0.012625468894839287 2023-01-24 08:19:45.998012: step: 1004/530, loss: 0.0006448804051615298 2023-01-24 08:19:47.030727: step: 1008/530, loss: 8.455122952000238e-06 2023-01-24 08:19:48.076780: step: 1012/530, loss: 0.010775727219879627 2023-01-24 08:19:49.125086: step: 1016/530, loss: 0.015372917987406254 2023-01-24 08:19:50.186022: step: 1020/530, loss: 3.2752694096416235e-05 2023-01-24 08:19:51.222738: step: 1024/530, loss: 0.0005106040043756366 2023-01-24 08:19:52.269101: step: 1028/530, loss: 0.004319041967391968 2023-01-24 08:19:53.317534: step: 1032/530, loss: 0.0005803979001939297 2023-01-24 08:19:54.372596: step: 1036/530, loss: 0.007393084466457367 2023-01-24 08:19:55.412667: step: 1040/530, loss: 0.002379234414547682 2023-01-24 08:19:56.459270: step: 1044/530, loss: 1.481946947023971e-05 2023-01-24 08:19:57.497969: step: 1048/530, loss: 0.002936218399554491 2023-01-24 08:19:58.542665: step: 1052/530, loss: 0.00012736863573081791 2023-01-24 08:19:59.564791: step: 1056/530, loss: 0.0031776016112416983 2023-01-24 08:20:00.604784: step: 1060/530, loss: 0.0005582341109402478 2023-01-24 08:20:01.642799: step: 1064/530, loss: 7.450579597723106e-10 2023-01-24 08:20:02.696847: step: 1068/530, loss: 0.00015753437764942646 2023-01-24 08:20:03.755249: step: 1072/530, loss: 0.0001855352020356804 2023-01-24 08:20:04.789640: step: 1076/530, loss: 0.0002511170459911227 2023-01-24 08:20:05.836271: step: 1080/530, loss: 0.0008574594976380467 2023-01-24 08:20:06.907153: step: 1084/530, loss: 0.002710574772208929 2023-01-24 08:20:07.949939: step: 1088/530, loss: 0.002738569863140583 2023-01-24 08:20:08.999854: step: 1092/530, loss: 0.0011903155827894807 2023-01-24 08:20:10.039044: step: 1096/530, loss: 0.0020000950898975134 2023-01-24 08:20:11.077641: step: 1100/530, loss: 0.0005451919860206544 2023-01-24 08:20:12.125209: step: 1104/530, loss: 0.0007610819302499294 2023-01-24 08:20:13.177373: step: 1108/530, loss: 0.0018874533707275987 2023-01-24 08:20:14.210688: step: 1112/530, loss: 0.0027790465392172337 2023-01-24 08:20:15.247912: step: 1116/530, loss: 0.0008909351308830082 2023-01-24 08:20:16.274895: step: 1120/530, loss: 0.00036288020783104 2023-01-24 08:20:17.304658: step: 1124/530, loss: 0.00010466423555044457 2023-01-24 08:20:18.352120: step: 1128/530, loss: 0.0023218560963869095 2023-01-24 08:20:19.391413: step: 1132/530, loss: 0.0005401301896199584 2023-01-24 08:20:20.426446: step: 1136/530, loss: 0.012105298228561878 2023-01-24 08:20:21.474755: step: 1140/530, loss: 0.001272443332709372 2023-01-24 08:20:22.504159: step: 1144/530, loss: 9.497204700892325e-06 2023-01-24 08:20:23.551606: step: 1148/530, loss: 0.005656037945300341 2023-01-24 08:20:24.606061: step: 1152/530, loss: 2.7103656975668855e-05 2023-01-24 08:20:25.680051: step: 1156/530, loss: 0.0023644412867724895 2023-01-24 08:20:26.737038: step: 1160/530, loss: 0.0036779786460101604 2023-01-24 08:20:27.785327: step: 1164/530, loss: 3.727248986251652e-05 2023-01-24 08:20:28.846964: step: 1168/530, loss: 0.0007619143580086529 2023-01-24 08:20:29.888649: step: 1172/530, loss: 0.0024293025489896536 2023-01-24 08:20:30.919342: step: 1176/530, loss: 0.0017884676344692707 2023-01-24 08:20:31.953189: step: 1180/530, loss: 3.6654913060374383e-07 2023-01-24 08:20:33.014641: step: 1184/530, loss: 0.004959250334650278 2023-01-24 08:20:34.049867: step: 1188/530, loss: 6.564982322743163e-05 2023-01-24 08:20:35.118926: step: 1192/530, loss: 0.0008088112226687372 2023-01-24 08:20:36.169301: step: 1196/530, loss: 0.00635934341698885 2023-01-24 08:20:37.222309: step: 1200/530, loss: 0.0006574150756932795 2023-01-24 08:20:38.267742: step: 1204/530, loss: 0.004455378279089928 2023-01-24 08:20:39.315634: step: 1208/530, loss: 0.007044309284538031 2023-01-24 08:20:40.360262: step: 1212/530, loss: 0.0062496899627149105 2023-01-24 08:20:41.401064: step: 1216/530, loss: 0.0003697865759022534 2023-01-24 08:20:42.437081: step: 1220/530, loss: 0.003998305648565292 2023-01-24 08:20:43.487312: step: 1224/530, loss: 1.3274652701511513e-05 2023-01-24 08:20:44.532461: step: 1228/530, loss: 2.0823786144319456e-06 2023-01-24 08:20:45.571235: step: 1232/530, loss: 0.0029414610471576452 2023-01-24 08:20:46.620843: step: 1236/530, loss: 0.0066087194718420506 2023-01-24 08:20:47.663701: step: 1240/530, loss: 0.0093551529571414 2023-01-24 08:20:48.699516: step: 1244/530, loss: 4.7026074753375724e-05 2023-01-24 08:20:49.738290: step: 1248/530, loss: 0.0009934622794389725 2023-01-24 08:20:50.763042: step: 1252/530, loss: 0.0014768776018172503 2023-01-24 08:20:51.799790: step: 1256/530, loss: 0.005098074674606323 2023-01-24 08:20:52.852236: step: 1260/530, loss: 0.0029661257285624743 2023-01-24 08:20:53.908847: step: 1264/530, loss: 0.008504141122102737 2023-01-24 08:20:54.942348: step: 1268/530, loss: 0.007768355775624514 2023-01-24 08:20:55.971478: step: 1272/530, loss: 0.009733738377690315 2023-01-24 08:20:57.007658: step: 1276/530, loss: 0.006573773920536041 2023-01-24 08:20:58.056830: step: 1280/530, loss: 0.0030824884306639433 2023-01-24 08:20:59.094792: step: 1284/530, loss: 0.00023663269530516118 2023-01-24 08:21:00.151852: step: 1288/530, loss: 0.00348040834069252 2023-01-24 08:21:01.184796: step: 1292/530, loss: 0.0002557382686063647 2023-01-24 08:21:02.234340: step: 1296/530, loss: 0.0077478475868701935 2023-01-24 08:21:03.266034: step: 1300/530, loss: 3.6717724469781388e-06 2023-01-24 08:21:04.309508: step: 1304/530, loss: 0.01011281181126833 2023-01-24 08:21:05.347128: step: 1308/530, loss: 0.00012698242790065706 2023-01-24 08:21:06.394538: step: 1312/530, loss: 0.0010995978955179453 2023-01-24 08:21:07.446452: step: 1316/530, loss: 0.006591064855456352 2023-01-24 08:21:08.486449: step: 1320/530, loss: 0.0014081959379836917 2023-01-24 08:21:09.524416: step: 1324/530, loss: 0.00040577526669949293 2023-01-24 08:21:10.565465: step: 1328/530, loss: 0.00079535529948771 2023-01-24 08:21:11.602193: step: 1332/530, loss: 0.017213430255651474 2023-01-24 08:21:12.651677: step: 1336/530, loss: 0.003896152600646019 2023-01-24 08:21:13.689787: step: 1340/530, loss: 0.0015305011766031384 2023-01-24 08:21:14.738884: step: 1344/530, loss: 0.0011044359998777509 2023-01-24 08:21:15.794441: step: 1348/530, loss: 0.0010472419671714306 2023-01-24 08:21:16.828477: step: 1352/530, loss: 1.4220464436220936e-05 2023-01-24 08:21:17.874897: step: 1356/530, loss: 0.0015217718901112676 2023-01-24 08:21:18.921565: step: 1360/530, loss: 0.004007177427411079 2023-01-24 08:21:19.971474: step: 1364/530, loss: 0.0004316438571549952 2023-01-24 08:21:21.016981: step: 1368/530, loss: 2.871344804589171e-05 2023-01-24 08:21:22.046349: step: 1372/530, loss: 0.004065626300871372 2023-01-24 08:21:23.084305: step: 1376/530, loss: 0.0023687719367444515 2023-01-24 08:21:24.160714: step: 1380/530, loss: 0.020276281982660294 2023-01-24 08:21:25.221411: step: 1384/530, loss: 0.00659647723659873 2023-01-24 08:21:26.252093: step: 1388/530, loss: 0.0038783797062933445 2023-01-24 08:21:27.287212: step: 1392/530, loss: 0.00040550841367803514 2023-01-24 08:21:28.343560: step: 1396/530, loss: 0.0013393174158409238 2023-01-24 08:21:29.376897: step: 1400/530, loss: 0.0014298626920208335 2023-01-24 08:21:30.416699: step: 1404/530, loss: 0.0005542111466638744 2023-01-24 08:21:31.458615: step: 1408/530, loss: 0.000135309252073057 2023-01-24 08:21:32.517130: step: 1412/530, loss: 0.0005626199417747557 2023-01-24 08:21:33.566269: step: 1416/530, loss: 2.960778510896489e-05 2023-01-24 08:21:34.616208: step: 1420/530, loss: 0.0037976473104208708 2023-01-24 08:21:35.682981: step: 1424/530, loss: 0.001377007574774325 2023-01-24 08:21:36.731480: step: 1428/530, loss: 0.0018332034815102816 2023-01-24 08:21:37.797661: step: 1432/530, loss: 0.007953077554702759 2023-01-24 08:21:38.833170: step: 1436/530, loss: 0.0052063949406147 2023-01-24 08:21:39.884969: step: 1440/530, loss: 0.0015658732736483216 2023-01-24 08:21:40.926039: step: 1444/530, loss: 0.002678680932149291 2023-01-24 08:21:41.974992: step: 1448/530, loss: 0.00779002346098423 2023-01-24 08:21:43.000554: step: 1452/530, loss: 0.00023047183640301228 2023-01-24 08:21:44.039927: step: 1456/530, loss: 0.001487205969169736 2023-01-24 08:21:45.083206: step: 1460/530, loss: 0.0004775534034706652 2023-01-24 08:21:46.111014: step: 1464/530, loss: 0.0004770010127685964 2023-01-24 08:21:47.174275: step: 1468/530, loss: 0.006879845168441534 2023-01-24 08:21:48.224483: step: 1472/530, loss: 0.00727675249800086 2023-01-24 08:21:49.264781: step: 1476/530, loss: 0.0021079510916024446 2023-01-24 08:21:50.322961: step: 1480/530, loss: 0.00044240037095732987 2023-01-24 08:21:51.376824: step: 1484/530, loss: 0.024879442527890205 2023-01-24 08:21:52.410236: step: 1488/530, loss: 0.0005003334954380989 2023-01-24 08:21:53.438456: step: 1492/530, loss: 0.0004626781155820936 2023-01-24 08:21:54.480731: step: 1496/530, loss: 0.0029468259308487177 2023-01-24 08:21:55.509363: step: 1500/530, loss: 0.00016428811068180948 2023-01-24 08:21:56.545734: step: 1504/530, loss: 0.002816026797518134 2023-01-24 08:21:57.589725: step: 1508/530, loss: 0.002994521288201213 2023-01-24 08:21:58.651951: step: 1512/530, loss: 0.0026726245414465666 2023-01-24 08:21:59.700715: step: 1516/530, loss: 0.0006311832694336772 2023-01-24 08:22:00.751584: step: 1520/530, loss: 0.003284927923232317 2023-01-24 08:22:01.790504: step: 1524/530, loss: 0.00898159109055996 2023-01-24 08:22:02.842697: step: 1528/530, loss: 2.0823752322485234e-07 2023-01-24 08:22:03.905392: step: 1532/530, loss: 3.719169399118982e-05 2023-01-24 08:22:04.943960: step: 1536/530, loss: 0.0058005014434456825 2023-01-24 08:22:05.984287: step: 1540/530, loss: 0.0009148807148449123 2023-01-24 08:22:07.015972: step: 1544/530, loss: 0.0020848149433732033 2023-01-24 08:22:08.056993: step: 1548/530, loss: 0.0022066296078264713 2023-01-24 08:22:09.102041: step: 1552/530, loss: 0.0039602844044566154 2023-01-24 08:22:10.126157: step: 1556/530, loss: 0.0038585748989135027 2023-01-24 08:22:11.168159: step: 1560/530, loss: 7.122480747057125e-05 2023-01-24 08:22:12.234040: step: 1564/530, loss: 0.004375799093395472 2023-01-24 08:22:13.267093: step: 1568/530, loss: 0.00020374795712996274 2023-01-24 08:22:14.291502: step: 1572/530, loss: 0.0003176661266479641 2023-01-24 08:22:15.327621: step: 1576/530, loss: 0.0013383544282987714 2023-01-24 08:22:16.360907: step: 1580/530, loss: 0.001447192276827991 2023-01-24 08:22:17.402273: step: 1584/530, loss: 0.0007889055996201932 2023-01-24 08:22:18.456215: step: 1588/530, loss: 0.00020421612134668976 2023-01-24 08:22:19.493704: step: 1592/530, loss: 0.003952106926590204 2023-01-24 08:22:20.542821: step: 1596/530, loss: 0.006382076535373926 2023-01-24 08:22:21.582626: step: 1600/530, loss: 0.006570099852979183 2023-01-24 08:22:22.641684: step: 1604/530, loss: 0.015949079766869545 2023-01-24 08:22:23.686178: step: 1608/530, loss: 4.006120889243903e-06 2023-01-24 08:22:24.737248: step: 1612/530, loss: 0.00044259443529881537 2023-01-24 08:22:25.782862: step: 1616/530, loss: 0.005342657212167978 2023-01-24 08:22:26.820080: step: 1620/530, loss: 0.0004579670785460621 2023-01-24 08:22:27.853913: step: 1624/530, loss: 4.0859784348867834e-05 2023-01-24 08:22:28.895923: step: 1628/530, loss: 4.779320443049073e-05 2023-01-24 08:22:29.919392: step: 1632/530, loss: 0.005063971038907766 2023-01-24 08:22:30.958925: step: 1636/530, loss: 0.0002617494319565594 2023-01-24 08:22:31.998957: step: 1640/530, loss: 0.0023489685263484716 2023-01-24 08:22:33.065446: step: 1644/530, loss: 0.0011899148812517524 2023-01-24 08:22:34.099804: step: 1648/530, loss: 0.0027415677905082703 2023-01-24 08:22:35.137644: step: 1652/530, loss: 0.0017388095147907734 2023-01-24 08:22:36.204492: step: 1656/530, loss: 0.005948937032371759 2023-01-24 08:22:37.264962: step: 1660/530, loss: 0.00978368055075407 2023-01-24 08:22:38.303479: step: 1664/530, loss: 0.002595794154331088 2023-01-24 08:22:39.348509: step: 1668/530, loss: 0.002223603194579482 2023-01-24 08:22:40.404761: step: 1672/530, loss: 5.623222477879608e-06 2023-01-24 08:22:41.450648: step: 1676/530, loss: 8.900025568436831e-05 2023-01-24 08:22:42.512049: step: 1680/530, loss: 0.00045209366362541914 2023-01-24 08:22:43.544180: step: 1684/530, loss: 0.000723404111340642 2023-01-24 08:22:44.574865: step: 1688/530, loss: 0.00010239532275591046 2023-01-24 08:22:45.619339: step: 1692/530, loss: 0.0004662133869715035 2023-01-24 08:22:46.671379: step: 1696/530, loss: 0.0013345240149646997 2023-01-24 08:22:47.719139: step: 1700/530, loss: 0.0016835578717291355 2023-01-24 08:22:48.765202: step: 1704/530, loss: 0.004374376963824034 2023-01-24 08:22:49.790905: step: 1708/530, loss: 0.0007663400028832257 2023-01-24 08:22:50.857419: step: 1712/530, loss: 0.0030346272978931665 2023-01-24 08:22:51.894717: step: 1716/530, loss: 0.00024776384816505015 2023-01-24 08:22:52.931317: step: 1720/530, loss: 0.008117184974253178 2023-01-24 08:22:53.981433: step: 1724/530, loss: 0.0002365930558880791 2023-01-24 08:22:55.008293: step: 1728/530, loss: 0.00017739305621944368 2023-01-24 08:22:56.057109: step: 1732/530, loss: 0.0006980485050007701 2023-01-24 08:22:57.092375: step: 1736/530, loss: 0.00016968268027994782 2023-01-24 08:22:58.138543: step: 1740/530, loss: 1.7430177194910357e-06 2023-01-24 08:22:59.184293: step: 1744/530, loss: 0.00795839074999094 2023-01-24 08:23:00.225079: step: 1748/530, loss: 0.000318115227855742 2023-01-24 08:23:01.267679: step: 1752/530, loss: 2.864673547264829e-07 2023-01-24 08:23:02.305545: step: 1756/530, loss: 0.0045907762832939625 2023-01-24 08:23:03.332888: step: 1760/530, loss: 0.006999340374022722 2023-01-24 08:23:04.374245: step: 1764/530, loss: 0.003867608727887273 2023-01-24 08:23:05.417010: step: 1768/530, loss: 6.396664684871212e-05 2023-01-24 08:23:06.452241: step: 1772/530, loss: 6.110750837251544e-05 2023-01-24 08:23:07.483290: step: 1776/530, loss: 4.9452672101324424e-05 2023-01-24 08:23:08.524033: step: 1780/530, loss: 0.0018139004241675138 2023-01-24 08:23:09.558026: step: 1784/530, loss: 0.0018237457843497396 2023-01-24 08:23:10.617545: step: 1788/530, loss: 0.0001298043061979115 2023-01-24 08:23:11.658757: step: 1792/530, loss: 0.0010824294295161963 2023-01-24 08:23:12.695470: step: 1796/530, loss: 0.004212304949760437 2023-01-24 08:23:13.733867: step: 1800/530, loss: 0.0006548843230120838 2023-01-24 08:23:14.784067: step: 1804/530, loss: 0.001118526328355074 2023-01-24 08:23:15.816448: step: 1808/530, loss: 0.005350269842892885 2023-01-24 08:23:16.857671: step: 1812/530, loss: 0.000562014989554882 2023-01-24 08:23:17.883620: step: 1816/530, loss: 0.00014336747699417174 2023-01-24 08:23:18.922133: step: 1820/530, loss: 0.0007651003543287516 2023-01-24 08:23:19.966797: step: 1824/530, loss: 0.0036428223829716444 2023-01-24 08:23:21.020359: step: 1828/530, loss: 0.0010677709942683578 2023-01-24 08:23:22.060107: step: 1832/530, loss: 0.002514310646802187 2023-01-24 08:23:23.108115: step: 1836/530, loss: 0.007211413234472275 2023-01-24 08:23:24.156130: step: 1840/530, loss: 0.0011656152782961726 2023-01-24 08:23:25.200393: step: 1844/530, loss: 0.0015326207503676414 2023-01-24 08:23:26.243808: step: 1848/530, loss: 0.014549612067639828 2023-01-24 08:23:27.285097: step: 1852/530, loss: 0.004234924912452698 2023-01-24 08:23:28.308101: step: 1856/530, loss: 0.0012708451831713319 2023-01-24 08:23:29.345005: step: 1860/530, loss: 0.00010736639524111524 2023-01-24 08:23:30.379815: step: 1864/530, loss: 0.00038453502929769456 2023-01-24 08:23:31.417767: step: 1868/530, loss: 0.00033335923217236996 2023-01-24 08:23:32.470712: step: 1872/530, loss: 0.01160730142146349 2023-01-24 08:23:33.520141: step: 1876/530, loss: 0.0037386224139481783 2023-01-24 08:23:34.551643: step: 1880/530, loss: 0.0007540821679867804 2023-01-24 08:23:35.597757: step: 1884/530, loss: 0.0008770199492573738 2023-01-24 08:23:36.636640: step: 1888/530, loss: 0.00011683989578159526 2023-01-24 08:23:37.670528: step: 1892/530, loss: 0.0030918132979422808 2023-01-24 08:23:38.701099: step: 1896/530, loss: 0.0007490574498660862 2023-01-24 08:23:39.744200: step: 1900/530, loss: 0.010304059833288193 2023-01-24 08:23:40.765334: step: 1904/530, loss: 7.208468014141545e-05 2023-01-24 08:23:41.807878: step: 1908/530, loss: 0.001376252039335668 2023-01-24 08:23:42.857119: step: 1912/530, loss: 0.003604793455451727 2023-01-24 08:23:43.900730: step: 1916/530, loss: 0.00017001554078888148 2023-01-24 08:23:44.934046: step: 1920/530, loss: 0.002414959715679288 2023-01-24 08:23:45.956848: step: 1924/530, loss: 0.0002481439441908151 2023-01-24 08:23:46.976659: step: 1928/530, loss: 0.0007361792959272861 2023-01-24 08:23:48.012042: step: 1932/530, loss: 0.009654955007135868 2023-01-24 08:23:49.052106: step: 1936/530, loss: 0.010741261765360832 2023-01-24 08:23:50.104051: step: 1940/530, loss: 0.005340594798326492 2023-01-24 08:23:51.138865: step: 1944/530, loss: 0.00021494003885891289 2023-01-24 08:23:52.171359: step: 1948/530, loss: 7.968128193169832e-05 2023-01-24 08:23:53.201871: step: 1952/530, loss: 0.00030087080085650086 2023-01-24 08:23:54.246577: step: 1956/530, loss: 4.224270742270164e-05 2023-01-24 08:23:55.303788: step: 1960/530, loss: 0.0006958569283597171 2023-01-24 08:23:56.370266: step: 1964/530, loss: 0.006141295190900564 2023-01-24 08:23:57.402103: step: 1968/530, loss: 0.0004534491163212806 2023-01-24 08:23:58.448921: step: 1972/530, loss: 0.001550563727505505 2023-01-24 08:23:59.471312: step: 1976/530, loss: 0.0028260506223887205 2023-01-24 08:24:00.507111: step: 1980/530, loss: 0.000257304054684937 2023-01-24 08:24:01.546664: step: 1984/530, loss: 0.0008961333660408854 2023-01-24 08:24:02.591626: step: 1988/530, loss: 0.0019929525442421436 2023-01-24 08:24:03.642250: step: 1992/530, loss: 0.0027199238538742065 2023-01-24 08:24:04.693648: step: 1996/530, loss: 0.0005656854482367635 2023-01-24 08:24:05.712942: step: 2000/530, loss: 0.0019591753371059895 2023-01-24 08:24:06.749506: step: 2004/530, loss: 0.001346637844108045 2023-01-24 08:24:07.775151: step: 2008/530, loss: 0.0040557608008384705 2023-01-24 08:24:08.818328: step: 2012/530, loss: 0.0010384107008576393 2023-01-24 08:24:09.877951: step: 2016/530, loss: 0.000618373800534755 2023-01-24 08:24:10.902979: step: 2020/530, loss: 0.004166426602751017 2023-01-24 08:24:11.937654: step: 2024/530, loss: 3.0647854146081954e-05 2023-01-24 08:24:12.984302: step: 2028/530, loss: 0.0025109269190579653 2023-01-24 08:24:14.026402: step: 2032/530, loss: 0.009793415665626526 2023-01-24 08:24:15.057709: step: 2036/530, loss: 0.0012217836920171976 2023-01-24 08:24:16.093048: step: 2040/530, loss: 0.013063976541161537 2023-01-24 08:24:17.138784: step: 2044/530, loss: 0.011299300007522106 2023-01-24 08:24:18.164017: step: 2048/530, loss: 0.0023629171773791313 2023-01-24 08:24:19.211463: step: 2052/530, loss: 4.836311563849449e-05 2023-01-24 08:24:20.254573: step: 2056/530, loss: 0.0007346873753704131 2023-01-24 08:24:21.301072: step: 2060/530, loss: 0.0003823303268291056 2023-01-24 08:24:22.344783: step: 2064/530, loss: 0.009841508232057095 2023-01-24 08:24:23.392368: step: 2068/530, loss: 0.005745592061430216 2023-01-24 08:24:24.458619: step: 2072/530, loss: 0.0028223213739693165 2023-01-24 08:24:25.504361: step: 2076/530, loss: 0.001286366255953908 2023-01-24 08:24:26.549067: step: 2080/530, loss: 0.005680242087692022 2023-01-24 08:24:27.600832: step: 2084/530, loss: 0.007327405735850334 2023-01-24 08:24:28.631712: step: 2088/530, loss: 0.002581064123660326 2023-01-24 08:24:29.693808: step: 2092/530, loss: 0.0060972184874117374 2023-01-24 08:24:30.738210: step: 2096/530, loss: 0.010546141304075718 2023-01-24 08:24:31.776744: step: 2100/530, loss: 0.003040348645299673 2023-01-24 08:24:32.818265: step: 2104/530, loss: 0.00012009617785224691 2023-01-24 08:24:33.882084: step: 2108/530, loss: 0.0007949028513394296 2023-01-24 08:24:34.920676: step: 2112/530, loss: 0.005056140013039112 2023-01-24 08:24:35.958075: step: 2116/530, loss: 0.005843624472618103 2023-01-24 08:24:37.019288: step: 2120/530, loss: 0.030014971271157265 ================================================== Loss: 0.003 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3716527777777778, 'r': 0.3173505692599621, 'f1': 0.34236182190378706}, 'combined': 0.25226660561331676, 'stategy': 1, 'epoch': 17} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3712566585803961, 'r': 0.38797685735837345, 'f1': 0.379432647915425}, 'combined': 0.29410568881482707, 'stategy': 1, 'epoch': 17} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3843719903691814, 'r': 0.3245645838980754, 'f1': 0.3519455467372134}, 'combined': 0.2593282975958414, 'stategy': 1, 'epoch': 17} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3711842857306252, 'r': 0.36777266545736575, 'f1': 0.3694706002009362}, 'combined': 0.2863839102035965, 'stategy': 1, 'epoch': 17} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3802940118053945, 'r': 0.3276157141549319, 'f1': 0.3519948651572867}, 'combined': 0.2593646374843165, 'stategy': 1, 'epoch': 17} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.35948126172869405, 'r': 0.3604724784430195, 'f1': 0.35997618774300616}, 'combined': 0.2790246048534306, 'stategy': 1, 'epoch': 17} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 17} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.475, 'r': 0.41304347826086957, 'f1': 0.44186046511627913}, 'combined': 0.22093023255813957, 'stategy': 1, 'epoch': 17} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 17} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37786862527716186, 'r': 0.32337523719165084, 'f1': 0.3485046012269939}, 'combined': 0.2567928640619955, 'stategy': 1, 'epoch': 12} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37377987703702326, 'r': 0.38889597500543227, 'f1': 0.3811881268521715}, 'combined': 0.2954663949763244, 'stategy': 1, 'epoch': 12} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 12} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3851604396498889, 'r': 0.33473146368054857, 'f1': 0.3581796575830439}, 'combined': 0.26392185295592707, 'stategy': 1, 'epoch': 15} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3640887768447368, 'r': 0.3620809343253724, 'f1': 0.3630820797659034}, 'combined': 0.28143204268936056, 'stategy': 1, 'epoch': 15} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 15} ****************************** Epoch: 18 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 08:27:01.413732: step: 4/530, loss: 0.0011004514526575804 2023-01-24 08:27:02.454244: step: 8/530, loss: 0.0015485460171476007 2023-01-24 08:27:03.519450: step: 12/530, loss: 0.004476394969969988 2023-01-24 08:27:04.551348: step: 16/530, loss: 0.0007204785943031311 2023-01-24 08:27:05.578326: step: 20/530, loss: 0.0021424717269837856 2023-01-24 08:27:06.608468: step: 24/530, loss: 0.0010343339527025819 2023-01-24 08:27:07.646419: step: 28/530, loss: 0.00013786889030598104 2023-01-24 08:27:08.685276: step: 32/530, loss: 0.0020042869728058577 2023-01-24 08:27:09.720690: step: 36/530, loss: 9.873901581158862e-05 2023-01-24 08:27:10.769699: step: 40/530, loss: 0.0003586667007766664 2023-01-24 08:27:11.807037: step: 44/530, loss: 0.0003571257402654737 2023-01-24 08:27:12.843592: step: 48/530, loss: 0.005025750026106834 2023-01-24 08:27:13.872227: step: 52/530, loss: 0.0014080420369282365 2023-01-24 08:27:14.924936: step: 56/530, loss: 0.0006306511932052672 2023-01-24 08:27:15.981293: step: 60/530, loss: 0.0035294953268021345 2023-01-24 08:27:17.010350: step: 64/530, loss: 0.0007785228081047535 2023-01-24 08:27:18.052589: step: 68/530, loss: 0.0005311129498295486 2023-01-24 08:27:19.111207: step: 72/530, loss: 6.244205724215135e-05 2023-01-24 08:27:20.144377: step: 76/530, loss: 0.0004511222941800952 2023-01-24 08:27:21.192932: step: 80/530, loss: 0.003255607094615698 2023-01-24 08:27:22.223463: step: 84/530, loss: 0.0001986724091693759 2023-01-24 08:27:23.269178: step: 88/530, loss: 0.00021972335525788367 2023-01-24 08:27:24.308985: step: 92/530, loss: 0.003665995318442583 2023-01-24 08:27:25.345124: step: 96/530, loss: 0.006084507331252098 2023-01-24 08:27:26.387771: step: 100/530, loss: 0.003251165384426713 2023-01-24 08:27:27.428545: step: 104/530, loss: 0.0005306070088408887 2023-01-24 08:27:28.476120: step: 108/530, loss: 0.0014637029962614179 2023-01-24 08:27:29.542711: step: 112/530, loss: 0.00017656983982305974 2023-01-24 08:27:30.582866: step: 116/530, loss: 0.005251055583357811 2023-01-24 08:27:31.623860: step: 120/530, loss: 0.0030476185493171215 2023-01-24 08:27:32.672112: step: 124/530, loss: 0.0013223965652287006 2023-01-24 08:27:33.714601: step: 128/530, loss: 0.003072301624342799 2023-01-24 08:27:34.746142: step: 132/530, loss: 0.0011979241389781237 2023-01-24 08:27:35.773900: step: 136/530, loss: 0.0 2023-01-24 08:27:36.807970: step: 140/530, loss: 0.0008933464996516705 2023-01-24 08:27:37.854454: step: 144/530, loss: 0.003278773743659258 2023-01-24 08:27:38.916075: step: 148/530, loss: 0.02431190386414528 2023-01-24 08:27:39.957506: step: 152/530, loss: 0.003205099841579795 2023-01-24 08:27:41.005945: step: 156/530, loss: 0.006427126005291939 2023-01-24 08:27:42.049700: step: 160/530, loss: 0.0006028419593349099 2023-01-24 08:27:43.090995: step: 164/530, loss: 0.0026085705030709505 2023-01-24 08:27:44.133434: step: 168/530, loss: 0.007286405190825462 2023-01-24 08:27:45.155992: step: 172/530, loss: 0.003637277288362384 2023-01-24 08:27:46.204034: step: 176/530, loss: 0.015096787363290787 2023-01-24 08:27:47.254916: step: 180/530, loss: 0.002204600954428315 2023-01-24 08:27:48.296889: step: 184/530, loss: 0.0010545180412009358 2023-01-24 08:27:49.337104: step: 188/530, loss: 0.00032845730311237276 2023-01-24 08:27:50.374963: step: 192/530, loss: 0.007657136768102646 2023-01-24 08:27:51.412839: step: 196/530, loss: 0.0009592468850314617 2023-01-24 08:27:52.456722: step: 200/530, loss: 0.0003860020078718662 2023-01-24 08:27:53.506565: step: 204/530, loss: 0.00011319531040498987 2023-01-24 08:27:54.549591: step: 208/530, loss: 0.002827430609613657 2023-01-24 08:27:55.605660: step: 212/530, loss: 0.001291204709559679 2023-01-24 08:27:56.637066: step: 216/530, loss: 0.006179413292557001 2023-01-24 08:27:57.680167: step: 220/530, loss: 0.0010054472368210554 2023-01-24 08:27:58.718912: step: 224/530, loss: 0.002646689536049962 2023-01-24 08:27:59.770052: step: 228/530, loss: 0.0005621419404633343 2023-01-24 08:28:00.813465: step: 232/530, loss: 0.007815116085112095 2023-01-24 08:28:01.852007: step: 236/530, loss: 0.02903848886489868 2023-01-24 08:28:02.891168: step: 240/530, loss: 3.8449732528533787e-05 2023-01-24 08:28:03.973652: step: 244/530, loss: 0.002362427767366171 2023-01-24 08:28:05.020102: step: 248/530, loss: 0.00012775677896570414 2023-01-24 08:28:06.054688: step: 252/530, loss: 0.0031440667808055878 2023-01-24 08:28:07.089472: step: 256/530, loss: 0.0001841807534219697 2023-01-24 08:28:08.124671: step: 260/530, loss: 0.0024066418409347534 2023-01-24 08:28:09.171037: step: 264/530, loss: 1.691768193268217e-05 2023-01-24 08:28:10.203039: step: 268/530, loss: 0.0007133395993150771 2023-01-24 08:28:11.265335: step: 272/530, loss: 0.0034632175229489803 2023-01-24 08:28:12.314902: step: 276/530, loss: 0.001298890681937337 2023-01-24 08:28:13.358212: step: 280/530, loss: 0.0002496509987395257 2023-01-24 08:28:14.458144: step: 284/530, loss: 0.001698222360573709 2023-01-24 08:28:15.524114: step: 288/530, loss: 1.8486880435375497e-05 2023-01-24 08:28:16.560132: step: 292/530, loss: 0.004569863434880972 2023-01-24 08:28:17.617769: step: 296/530, loss: 0.0034067442175000906 2023-01-24 08:28:18.671278: step: 300/530, loss: 0.0033893371000885963 2023-01-24 08:28:19.723999: step: 304/530, loss: 0.0003980577166657895 2023-01-24 08:28:20.776620: step: 308/530, loss: 0.0017462796531617641 2023-01-24 08:28:21.803766: step: 312/530, loss: 0.0014805826358497143 2023-01-24 08:28:22.857228: step: 316/530, loss: 0.003357308218255639 2023-01-24 08:28:23.910689: step: 320/530, loss: 0.0020128062460571527 2023-01-24 08:28:24.964255: step: 324/530, loss: 0.0026554614305496216 2023-01-24 08:28:26.017711: step: 328/530, loss: 0.00028746630414389074 2023-01-24 08:28:27.055993: step: 332/530, loss: 0.0010810262756422162 2023-01-24 08:28:28.109349: step: 336/530, loss: 0.003787329187616706 2023-01-24 08:28:29.128833: step: 340/530, loss: 0.00011475924111437052 2023-01-24 08:28:30.175507: step: 344/530, loss: 0.002529539866372943 2023-01-24 08:28:31.217838: step: 348/530, loss: 0.0013885658700019121 2023-01-24 08:28:32.271638: step: 352/530, loss: 0.00025244380231015384 2023-01-24 08:28:33.319624: step: 356/530, loss: 4.8076704842969775e-05 2023-01-24 08:28:34.362501: step: 360/530, loss: 5.0577531510498375e-05 2023-01-24 08:28:35.404427: step: 364/530, loss: 0.003146706148982048 2023-01-24 08:28:36.459685: step: 368/530, loss: 0.002765948185697198 2023-01-24 08:28:37.525211: step: 372/530, loss: 0.019216468557715416 2023-01-24 08:28:38.576015: step: 376/530, loss: 0.0019286295864731073 2023-01-24 08:28:39.618889: step: 380/530, loss: 0.020308448001742363 2023-01-24 08:28:40.657802: step: 384/530, loss: 0.0008033043704926968 2023-01-24 08:28:41.723163: step: 388/530, loss: 0.0004372689872980118 2023-01-24 08:28:42.773516: step: 392/530, loss: 0.0022435521241277456 2023-01-24 08:28:43.811947: step: 396/530, loss: 0.0028211530297994614 2023-01-24 08:28:44.863944: step: 400/530, loss: 0.0020552356727421284 2023-01-24 08:28:45.911075: step: 404/530, loss: 0.020023638382554054 2023-01-24 08:28:46.941413: step: 408/530, loss: 0.003318340750411153 2023-01-24 08:28:47.987157: step: 412/530, loss: 9.33839510253165e-06 2023-01-24 08:28:49.031612: step: 416/530, loss: 0.0015107261715456843 2023-01-24 08:28:50.080151: step: 420/530, loss: 0.0017514704959467053 2023-01-24 08:28:51.126608: step: 424/530, loss: 0.004567578434944153 2023-01-24 08:28:52.168472: step: 428/530, loss: 0.0007843594648875296 2023-01-24 08:28:53.212860: step: 432/530, loss: 1.6937028703978285e-05 2023-01-24 08:28:54.269078: step: 436/530, loss: 0.007142952643334866 2023-01-24 08:28:55.296898: step: 440/530, loss: 0.006755193695425987 2023-01-24 08:28:56.349788: step: 444/530, loss: 0.0008685367647558451 2023-01-24 08:28:57.384658: step: 448/530, loss: 6.131079862825572e-05 2023-01-24 08:28:58.446015: step: 452/530, loss: 0.0010961712105199695 2023-01-24 08:28:59.481916: step: 456/530, loss: 0.0023356121964752674 2023-01-24 08:29:00.516115: step: 460/530, loss: 0.004038605373352766 2023-01-24 08:29:01.562300: step: 464/530, loss: 9.342426346847787e-05 2023-01-24 08:29:02.609868: step: 468/530, loss: 0.0017812468577176332 2023-01-24 08:29:03.642623: step: 472/530, loss: 0.002060752362012863 2023-01-24 08:29:04.713406: step: 476/530, loss: 0.016233494505286217 2023-01-24 08:29:05.750240: step: 480/530, loss: 0.002346508903428912 2023-01-24 08:29:06.797167: step: 484/530, loss: 0.003929595462977886 2023-01-24 08:29:07.854319: step: 488/530, loss: 4.709040240413742e-06 2023-01-24 08:29:08.911303: step: 492/530, loss: 0.0031084208749234676 2023-01-24 08:29:09.973541: step: 496/530, loss: 0.0015573048731312156 2023-01-24 08:29:11.021142: step: 500/530, loss: 0.0 2023-01-24 08:29:12.060519: step: 504/530, loss: 0.010353624820709229 2023-01-24 08:29:13.101546: step: 508/530, loss: 0.0030232262797653675 2023-01-24 08:29:14.134450: step: 512/530, loss: 3.566694795154035e-05 2023-01-24 08:29:15.168363: step: 516/530, loss: 0.00011833704047603533 2023-01-24 08:29:16.204204: step: 520/530, loss: 0.00042011140612885356 2023-01-24 08:29:17.251536: step: 524/530, loss: 0.004647030029445887 2023-01-24 08:29:18.301672: step: 528/530, loss: 0.003184481291100383 2023-01-24 08:29:19.346848: step: 532/530, loss: 0.006225524935871363 2023-01-24 08:29:20.377548: step: 536/530, loss: 1.5952678950270638e-05 2023-01-24 08:29:21.425443: step: 540/530, loss: 0.0018279047217220068 2023-01-24 08:29:22.489052: step: 544/530, loss: 0.0007364078774116933 2023-01-24 08:29:23.518271: step: 548/530, loss: 0.0005492193740792572 2023-01-24 08:29:24.567833: step: 552/530, loss: 0.00013014712021686137 2023-01-24 08:29:25.599027: step: 556/530, loss: 0.0002371767332078889 2023-01-24 08:29:26.649753: step: 560/530, loss: 0.004101587459445 2023-01-24 08:29:27.696973: step: 564/530, loss: 0.0008924608118832111 2023-01-24 08:29:28.749245: step: 568/530, loss: 0.005209341645240784 2023-01-24 08:29:29.801939: step: 572/530, loss: 0.0003104804491158575 2023-01-24 08:29:30.848747: step: 576/530, loss: 0.001576914801262319 2023-01-24 08:29:31.898905: step: 580/530, loss: 0.012157829478383064 2023-01-24 08:29:32.941152: step: 584/530, loss: 0.0005354807362891734 2023-01-24 08:29:33.988933: step: 588/530, loss: 0.001497014076448977 2023-01-24 08:29:35.034529: step: 592/530, loss: 0.00017277183360420167 2023-01-24 08:29:36.075892: step: 596/530, loss: 0.00026166453608311713 2023-01-24 08:29:37.107739: step: 600/530, loss: 8.671941759530455e-05 2023-01-24 08:29:38.160441: step: 604/530, loss: 0.0006945659406483173 2023-01-24 08:29:39.205745: step: 608/530, loss: 0.0021995774004608393 2023-01-24 08:29:40.250395: step: 612/530, loss: 0.0015054685063660145 2023-01-24 08:29:41.287442: step: 616/530, loss: 0.004471979103982449 2023-01-24 08:29:42.336733: step: 620/530, loss: 0.0004085471446160227 2023-01-24 08:29:43.397842: step: 624/530, loss: 0.027030890807509422 2023-01-24 08:29:44.449549: step: 628/530, loss: 0.0006588977412320673 2023-01-24 08:29:45.495809: step: 632/530, loss: 0.001884608413092792 2023-01-24 08:29:46.532298: step: 636/530, loss: 0.0035075899213552475 2023-01-24 08:29:47.576088: step: 640/530, loss: 0.0033492667134851217 2023-01-24 08:29:48.606595: step: 644/530, loss: 9.604650404071435e-05 2023-01-24 08:29:49.642866: step: 648/530, loss: 0.0001633965439395979 2023-01-24 08:29:50.690990: step: 652/530, loss: 0.015823418274521828 2023-01-24 08:29:51.719086: step: 656/530, loss: 0.0025312898214906454 2023-01-24 08:29:52.782429: step: 660/530, loss: 0.0014884265838190913 2023-01-24 08:29:53.823354: step: 664/530, loss: 0.011327198706567287 2023-01-24 08:29:54.864796: step: 668/530, loss: 0.00017987831961363554 2023-01-24 08:29:55.908140: step: 672/530, loss: 0.001282813143916428 2023-01-24 08:29:56.950889: step: 676/530, loss: 0.0002611135132610798 2023-01-24 08:29:58.003407: step: 680/530, loss: 0.00012419302947819233 2023-01-24 08:29:59.043592: step: 684/530, loss: 0.00012041210720781237 2023-01-24 08:30:00.088850: step: 688/530, loss: 0.010376348160207272 2023-01-24 08:30:01.126373: step: 692/530, loss: 0.000801779911853373 2023-01-24 08:30:02.172112: step: 696/530, loss: 0.0016834231792017817 2023-01-24 08:30:03.225000: step: 700/530, loss: 6.791386840632185e-05 2023-01-24 08:30:04.251582: step: 704/530, loss: 0.0006431415094994009 2023-01-24 08:30:05.292894: step: 708/530, loss: 0.0027060690335929394 2023-01-24 08:30:06.340619: step: 712/530, loss: 0.0005142366862855852 2023-01-24 08:30:07.393382: step: 716/530, loss: 3.365147495060228e-05 2023-01-24 08:30:08.446120: step: 720/530, loss: 4.157410148764029e-05 2023-01-24 08:30:09.494633: step: 724/530, loss: 0.0019096104661002755 2023-01-24 08:30:10.531041: step: 728/530, loss: 0.005891962442547083 2023-01-24 08:30:11.568684: step: 732/530, loss: 0.004786570090800524 2023-01-24 08:30:12.610034: step: 736/530, loss: 0.0018507546046748757 2023-01-24 08:30:13.647034: step: 740/530, loss: 0.002836151747033 2023-01-24 08:30:14.699340: step: 744/530, loss: 9.455605322727934e-05 2023-01-24 08:30:15.738463: step: 748/530, loss: 0.0007701213471591473 2023-01-24 08:30:16.780812: step: 752/530, loss: 0.0030247115064412355 2023-01-24 08:30:17.837560: step: 756/530, loss: 0.00036444346187636256 2023-01-24 08:30:18.871689: step: 760/530, loss: 0.005743666086345911 2023-01-24 08:30:19.934301: step: 764/530, loss: 0.0004152635810896754 2023-01-24 08:30:20.964359: step: 768/530, loss: 0.000717329268809408 2023-01-24 08:30:21.994962: step: 772/530, loss: 0.005131026729941368 2023-01-24 08:30:23.034502: step: 776/530, loss: 0.004881407134234905 2023-01-24 08:30:24.068544: step: 780/530, loss: 0.0005614030524156988 2023-01-24 08:30:25.116702: step: 784/530, loss: 8.126455213641748e-05 2023-01-24 08:30:26.150605: step: 788/530, loss: 5.395114840212045e-06 2023-01-24 08:30:27.177919: step: 792/530, loss: 0.0017774271545931697 2023-01-24 08:30:28.224002: step: 796/530, loss: 0.0032857637852430344 2023-01-24 08:30:29.264897: step: 800/530, loss: 0.0011514577781781554 2023-01-24 08:30:30.311023: step: 804/530, loss: 0.004085666965693235 2023-01-24 08:30:31.367990: step: 808/530, loss: 0.0011021267855539918 2023-01-24 08:30:32.416090: step: 812/530, loss: 0.005500006955116987 2023-01-24 08:30:33.464781: step: 816/530, loss: 0.003999566659331322 2023-01-24 08:30:34.505900: step: 820/530, loss: 0.00016524360398761928 2023-01-24 08:30:35.536291: step: 824/530, loss: 3.676371488836594e-05 2023-01-24 08:30:36.614892: step: 828/530, loss: 0.0012608644319698215 2023-01-24 08:30:37.658040: step: 832/530, loss: 7.187816663645208e-05 2023-01-24 08:30:38.691884: step: 836/530, loss: 0.0 2023-01-24 08:30:39.732378: step: 840/530, loss: 0.027074512094259262 2023-01-24 08:30:40.793253: step: 844/530, loss: 0.00029827214893884957 2023-01-24 08:30:41.838280: step: 848/530, loss: 0.002746318932622671 2023-01-24 08:30:42.876322: step: 852/530, loss: 1.5612386050634086e-05 2023-01-24 08:30:43.912413: step: 856/530, loss: 0.00023588014300912619 2023-01-24 08:30:44.947879: step: 860/530, loss: 0.0009852091316133738 2023-01-24 08:30:45.985471: step: 864/530, loss: 0.0002751785214059055 2023-01-24 08:30:47.031521: step: 868/530, loss: 0.0048138173297047615 2023-01-24 08:30:48.072434: step: 872/530, loss: 0.00011382075899746269 2023-01-24 08:30:49.143057: step: 876/530, loss: 0.017650412395596504 2023-01-24 08:30:50.182184: step: 880/530, loss: 0.002988304477185011 2023-01-24 08:30:51.241114: step: 884/530, loss: 0.004262375645339489 2023-01-24 08:30:52.290644: step: 888/530, loss: 0.00027263202355243266 2023-01-24 08:30:53.340075: step: 892/530, loss: 5.511665949597955e-05 2023-01-24 08:30:54.384979: step: 896/530, loss: 0.0027193748392164707 2023-01-24 08:30:55.430644: step: 900/530, loss: 0.0068252175115048885 2023-01-24 08:30:56.466955: step: 904/530, loss: 0.020413950085639954 2023-01-24 08:30:57.504388: step: 908/530, loss: 3.381617716513574e-05 2023-01-24 08:30:58.541192: step: 912/530, loss: 0.0034264703281223774 2023-01-24 08:30:59.571495: step: 916/530, loss: 0.0005429537850432098 2023-01-24 08:31:00.598999: step: 920/530, loss: 0.004208940081298351 2023-01-24 08:31:01.632389: step: 924/530, loss: 0.005512853618711233 2023-01-24 08:31:02.667324: step: 928/530, loss: 0.002475880552083254 2023-01-24 08:31:03.703447: step: 932/530, loss: 0.001978884916752577 2023-01-24 08:31:04.742283: step: 936/530, loss: 5.936039428888762e-07 2023-01-24 08:31:05.766585: step: 940/530, loss: 0.002239610766991973 2023-01-24 08:31:06.795548: step: 944/530, loss: 0.0002142765006283298 2023-01-24 08:31:07.839956: step: 948/530, loss: 4.619327143018381e-08 2023-01-24 08:31:08.891304: step: 952/530, loss: 0.022329814732074738 2023-01-24 08:31:09.923045: step: 956/530, loss: 0.00011196551349712536 2023-01-24 08:31:10.974164: step: 960/530, loss: 0.022696807980537415 2023-01-24 08:31:12.005921: step: 964/530, loss: 0.0002388124557910487 2023-01-24 08:31:13.048240: step: 968/530, loss: 0.0027538160793483257 2023-01-24 08:31:14.110733: step: 972/530, loss: 0.012065545655786991 2023-01-24 08:31:15.144354: step: 976/530, loss: 3.42013081535697e-05 2023-01-24 08:31:16.189223: step: 980/530, loss: 6.307618605205789e-05 2023-01-24 08:31:17.228485: step: 984/530, loss: 0.0020277961157262325 2023-01-24 08:31:18.267430: step: 988/530, loss: 0.000552874116692692 2023-01-24 08:31:19.303890: step: 992/530, loss: 0.0049505983479321 2023-01-24 08:31:20.333798: step: 996/530, loss: 0.001882542739622295 2023-01-24 08:31:21.369993: step: 1000/530, loss: 0.0011978696566075087 2023-01-24 08:31:22.423565: step: 1004/530, loss: 0.0012127527734264731 2023-01-24 08:31:23.455995: step: 1008/530, loss: 0.0007783604087308049 2023-01-24 08:31:24.503508: step: 1012/530, loss: 0.002449911553412676 2023-01-24 08:31:25.539655: step: 1016/530, loss: 0.0762534812092781 2023-01-24 08:31:26.597082: step: 1020/530, loss: 0.0033033364452421665 2023-01-24 08:31:27.638882: step: 1024/530, loss: 6.077212219679495e-06 2023-01-24 08:31:28.683321: step: 1028/530, loss: 0.0016020482871681452 2023-01-24 08:31:29.716275: step: 1032/530, loss: 2.6438903660164215e-05 2023-01-24 08:31:30.755818: step: 1036/530, loss: 0.0029201656579971313 2023-01-24 08:31:31.792832: step: 1040/530, loss: 0.0055586895905435085 2023-01-24 08:31:32.830084: step: 1044/530, loss: 0.000632832758128643 2023-01-24 08:31:33.875772: step: 1048/530, loss: 0.0015257126651704311 2023-01-24 08:31:34.921039: step: 1052/530, loss: 0.0008503880235366523 2023-01-24 08:31:35.965041: step: 1056/530, loss: 0.0015724987024441361 2023-01-24 08:31:36.989772: step: 1060/530, loss: 1.4856231246085372e-05 2023-01-24 08:31:38.051962: step: 1064/530, loss: 6.583302456419915e-05 2023-01-24 08:31:39.086679: step: 1068/530, loss: 0.002436942420899868 2023-01-24 08:31:40.121741: step: 1072/530, loss: 0.00032046635169535875 2023-01-24 08:31:41.170688: step: 1076/530, loss: 0.00012110287207178771 2023-01-24 08:31:42.217242: step: 1080/530, loss: 0.002372728195041418 2023-01-24 08:31:43.271837: step: 1084/530, loss: 0.00012288035941310227 2023-01-24 08:31:44.316416: step: 1088/530, loss: 0.007364585995674133 2023-01-24 08:31:45.397374: step: 1092/530, loss: 3.62734826921951e-05 2023-01-24 08:31:46.442117: step: 1096/530, loss: 0.00015792572230566293 2023-01-24 08:31:47.477996: step: 1100/530, loss: 0.003984449431300163 2023-01-24 08:31:48.509897: step: 1104/530, loss: 0.0005640694871544838 2023-01-24 08:31:49.547608: step: 1108/530, loss: 5.598976349574514e-05 2023-01-24 08:31:50.602911: step: 1112/530, loss: 0.00042962294537574053 2023-01-24 08:31:51.638720: step: 1116/530, loss: 0.00016251549823209643 2023-01-24 08:31:52.705583: step: 1120/530, loss: 0.001281069708056748 2023-01-24 08:31:53.753934: step: 1124/530, loss: 0.005847966764122248 2023-01-24 08:31:54.784730: step: 1128/530, loss: 0.0019878402817994356 2023-01-24 08:31:55.843393: step: 1132/530, loss: 0.0025314881931990385 2023-01-24 08:31:56.891801: step: 1136/530, loss: 0.002351641422137618 2023-01-24 08:31:57.954226: step: 1140/530, loss: 0.0010337227722629905 2023-01-24 08:31:59.001302: step: 1144/530, loss: 0.0038619504775851965 2023-01-24 08:32:00.063491: step: 1148/530, loss: 0.0032300916500389576 2023-01-24 08:32:01.102898: step: 1152/530, loss: 0.0011425962438806891 2023-01-24 08:32:02.122625: step: 1156/530, loss: 0.001927337609231472 2023-01-24 08:32:03.152790: step: 1160/530, loss: 0.0006717698997817934 2023-01-24 08:32:04.204576: step: 1164/530, loss: 0.004957296419888735 2023-01-24 08:32:05.274964: step: 1168/530, loss: 0.003051629988476634 2023-01-24 08:32:06.321823: step: 1172/530, loss: 0.004967954475432634 2023-01-24 08:32:07.371371: step: 1176/530, loss: 0.003258374985307455 2023-01-24 08:32:08.441565: step: 1180/530, loss: 0.0009223743691109121 2023-01-24 08:32:09.475824: step: 1184/530, loss: 0.0003745995636563748 2023-01-24 08:32:10.509183: step: 1188/530, loss: 1.7748557468166837e-07 2023-01-24 08:32:11.549082: step: 1192/530, loss: 0.007866685278713703 2023-01-24 08:32:12.610929: step: 1196/530, loss: 0.000192342879017815 2023-01-24 08:32:13.673691: step: 1200/530, loss: 0.006477084942162037 2023-01-24 08:32:14.718884: step: 1204/530, loss: 0.0021790049504488707 2023-01-24 08:32:15.764185: step: 1208/530, loss: 0.002990493318066001 2023-01-24 08:32:16.813808: step: 1212/530, loss: 0.00032539491076022387 2023-01-24 08:32:17.865384: step: 1216/530, loss: 0.00024139491142705083 2023-01-24 08:32:18.940104: step: 1220/530, loss: 0.00062701350543648 2023-01-24 08:32:19.974556: step: 1224/530, loss: 3.0145847631501965e-05 2023-01-24 08:32:21.003360: step: 1228/530, loss: 0.0022818471770733595 2023-01-24 08:32:22.035180: step: 1232/530, loss: 0.00014814484165981412 2023-01-24 08:32:23.086934: step: 1236/530, loss: 0.0012805273290723562 2023-01-24 08:32:24.118286: step: 1240/530, loss: 0.00665692426264286 2023-01-24 08:32:25.155471: step: 1244/530, loss: 0.004849271383136511 2023-01-24 08:32:26.193868: step: 1248/530, loss: 0.001766684465110302 2023-01-24 08:32:27.249947: step: 1252/530, loss: 0.0010257732355967164 2023-01-24 08:32:28.286287: step: 1256/530, loss: 0.0001357453438686207 2023-01-24 08:32:29.308587: step: 1260/530, loss: 9.690555452834815e-05 2023-01-24 08:32:30.351676: step: 1264/530, loss: 0.0018626991659402847 2023-01-24 08:32:31.401765: step: 1268/530, loss: 4.063325468450785e-05 2023-01-24 08:32:32.445985: step: 1272/530, loss: 0.006159180775284767 2023-01-24 08:32:33.490051: step: 1276/530, loss: 0.042420193552970886 2023-01-24 08:32:34.536599: step: 1280/530, loss: 0.004204066004604101 2023-01-24 08:32:35.572836: step: 1284/530, loss: 0.0021976048592478037 2023-01-24 08:32:36.637038: step: 1288/530, loss: 6.468210631283e-05 2023-01-24 08:32:37.676916: step: 1292/530, loss: 0.00013075563765596598 2023-01-24 08:32:38.726445: step: 1296/530, loss: 0.0013294767122715712 2023-01-24 08:32:39.767031: step: 1300/530, loss: 0.0012069130316376686 2023-01-24 08:32:40.805874: step: 1304/530, loss: 0.003489164402708411 2023-01-24 08:32:41.848212: step: 1308/530, loss: 0.0019300506683066487 2023-01-24 08:32:42.894136: step: 1312/530, loss: 0.0025566101539880037 2023-01-24 08:32:43.936469: step: 1316/530, loss: 0.0035837392788380384 2023-01-24 08:32:44.961851: step: 1320/530, loss: 0.0004616178630385548 2023-01-24 08:32:45.993035: step: 1324/530, loss: 0.0003901587915606797 2023-01-24 08:32:47.043496: step: 1328/530, loss: 0.0015194857260212302 2023-01-24 08:32:48.079863: step: 1332/530, loss: 0.004413897171616554 2023-01-24 08:32:49.121236: step: 1336/530, loss: 4.1017559851752594e-05 2023-01-24 08:32:50.158495: step: 1340/530, loss: 0.004024730995297432 2023-01-24 08:32:51.214070: step: 1344/530, loss: 0.0012902431190013885 2023-01-24 08:32:52.261746: step: 1348/530, loss: 0.0027972920797765255 2023-01-24 08:32:53.299878: step: 1352/530, loss: 0.0007918868213891983 2023-01-24 08:32:54.354140: step: 1356/530, loss: 0.0005870192544534802 2023-01-24 08:32:55.393446: step: 1360/530, loss: 0.010433397255837917 2023-01-24 08:32:56.433494: step: 1364/530, loss: 0.0018087269272655249 2023-01-24 08:32:57.477351: step: 1368/530, loss: 0.001361538888886571 2023-01-24 08:32:58.518127: step: 1372/530, loss: 0.001256853574886918 2023-01-24 08:32:59.560357: step: 1376/530, loss: 0.001649790327064693 2023-01-24 08:33:00.611454: step: 1380/530, loss: 0.0021032148506492376 2023-01-24 08:33:01.657583: step: 1384/530, loss: 0.0005936964298598468 2023-01-24 08:33:02.706743: step: 1388/530, loss: 0.0005221807514317334 2023-01-24 08:33:03.787786: step: 1392/530, loss: 0.002304880181327462 2023-01-24 08:33:04.841070: step: 1396/530, loss: 0.005782202817499638 2023-01-24 08:33:05.903316: step: 1400/530, loss: 8.772419823799282e-05 2023-01-24 08:33:06.967494: step: 1404/530, loss: 0.0023764390498399734 2023-01-24 08:33:08.015416: step: 1408/530, loss: 0.004591720644384623 2023-01-24 08:33:09.050981: step: 1412/530, loss: 0.011562719009816647 2023-01-24 08:33:10.092653: step: 1416/530, loss: 9.731941827340052e-05 2023-01-24 08:33:11.141071: step: 1420/530, loss: 0.0044642239809036255 2023-01-24 08:33:12.168120: step: 1424/530, loss: 0.0024879854172468185 2023-01-24 08:33:13.201080: step: 1428/530, loss: 0.003250701352953911 2023-01-24 08:33:14.251644: step: 1432/530, loss: 0.006288027390837669 2023-01-24 08:33:15.295578: step: 1436/530, loss: 0.008314261212944984 2023-01-24 08:33:16.326875: step: 1440/530, loss: 0.003559113945811987 2023-01-24 08:33:17.363583: step: 1444/530, loss: 0.00010053793084807694 2023-01-24 08:33:18.390793: step: 1448/530, loss: 0.0019314768724143505 2023-01-24 08:33:19.424142: step: 1452/530, loss: 0.0005177659913897514 2023-01-24 08:33:20.472817: step: 1456/530, loss: 0.002462890697643161 2023-01-24 08:33:21.525065: step: 1460/530, loss: 0.00042663421481847763 2023-01-24 08:33:22.571893: step: 1464/530, loss: 0.004815227817744017 2023-01-24 08:33:23.601156: step: 1468/530, loss: 0.0014055515639483929 2023-01-24 08:33:24.641250: step: 1472/530, loss: 0.003134963335469365 2023-01-24 08:33:25.683612: step: 1476/530, loss: 0.004921565297991037 2023-01-24 08:33:26.738509: step: 1480/530, loss: 0.056693241000175476 2023-01-24 08:33:27.786109: step: 1484/530, loss: 3.8686055631842464e-05 2023-01-24 08:33:28.823400: step: 1488/530, loss: 0.0009435339597985148 2023-01-24 08:33:29.881101: step: 1492/530, loss: 0.0005153658566996455 2023-01-24 08:33:30.922701: step: 1496/530, loss: 3.112934427917935e-05 2023-01-24 08:33:31.970009: step: 1500/530, loss: 0.00027460220735520124 2023-01-24 08:33:33.005198: step: 1504/530, loss: 0.007785177789628506 2023-01-24 08:33:34.036244: step: 1508/530, loss: 0.0012664251262322068 2023-01-24 08:33:35.094646: step: 1512/530, loss: 0.0008438891964033246 2023-01-24 08:33:36.144073: step: 1516/530, loss: 0.008209994062781334 2023-01-24 08:33:37.201262: step: 1520/530, loss: 0.003996571060270071 2023-01-24 08:33:38.255053: step: 1524/530, loss: 1.397158939653309e-05 2023-01-24 08:33:39.294830: step: 1528/530, loss: 0.017526045441627502 2023-01-24 08:33:40.357275: step: 1532/530, loss: 3.1790787033969536e-05 2023-01-24 08:33:41.413516: step: 1536/530, loss: 0.0020459555089473724 2023-01-24 08:33:42.431873: step: 1540/530, loss: 0.001474827527999878 2023-01-24 08:33:43.482094: step: 1544/530, loss: 0.0005123792798258364 2023-01-24 08:33:44.537784: step: 1548/530, loss: 0.0005639170994982123 2023-01-24 08:33:45.577872: step: 1552/530, loss: 0.00745109049603343 2023-01-24 08:33:46.632261: step: 1556/530, loss: 0.00184642372187227 2023-01-24 08:33:47.688565: step: 1560/530, loss: 0.00014419754734262824 2023-01-24 08:33:48.737314: step: 1564/530, loss: 0.005999063607305288 2023-01-24 08:33:49.808506: step: 1568/530, loss: 0.00016644630522932857 2023-01-24 08:33:50.851134: step: 1572/530, loss: 3.279771044617519e-05 2023-01-24 08:33:51.897578: step: 1576/530, loss: 0.0014099200488999486 2023-01-24 08:33:52.949846: step: 1580/530, loss: 0.0031581914518028498 2023-01-24 08:33:54.001372: step: 1584/530, loss: 0.004766381345689297 2023-01-24 08:33:55.068198: step: 1588/530, loss: 0.0009192170691676438 2023-01-24 08:33:56.097080: step: 1592/530, loss: 8.551339851692319e-05 2023-01-24 08:33:57.131428: step: 1596/530, loss: 0.0020264198537915945 2023-01-24 08:33:58.167909: step: 1600/530, loss: 0.0021216089371591806 2023-01-24 08:33:59.210135: step: 1604/530, loss: 8.622062887297943e-05 2023-01-24 08:34:00.266517: step: 1608/530, loss: 0.0016236110823228955 2023-01-24 08:34:01.312807: step: 1612/530, loss: 5.186088674236089e-05 2023-01-24 08:34:02.360293: step: 1616/530, loss: 0.00019308857736177742 2023-01-24 08:34:03.416010: step: 1620/530, loss: 0.0006649705464951694 2023-01-24 08:34:04.472565: step: 1624/530, loss: 0.0007954604225233197 2023-01-24 08:34:05.530116: step: 1628/530, loss: 0.002592288190498948 2023-01-24 08:34:06.585488: step: 1632/530, loss: 4.619293576979544e-06 2023-01-24 08:34:07.633286: step: 1636/530, loss: 4.082791565451771e-05 2023-01-24 08:34:08.680241: step: 1640/530, loss: 0.0015390218468382955 2023-01-24 08:34:09.723030: step: 1644/530, loss: 0.001659642904996872 2023-01-24 08:34:10.774878: step: 1648/530, loss: 0.002143438206985593 2023-01-24 08:34:11.805995: step: 1652/530, loss: 0.0008224029443226755 2023-01-24 08:34:12.844967: step: 1656/530, loss: 0.004564713686704636 2023-01-24 08:34:13.893003: step: 1660/530, loss: 0.00493394723162055 2023-01-24 08:34:14.956546: step: 1664/530, loss: 0.0021117799915373325 2023-01-24 08:34:16.001468: step: 1668/530, loss: 0.00011618063581408933 2023-01-24 08:34:17.052427: step: 1672/530, loss: 0.00149440485984087 2023-01-24 08:34:18.107538: step: 1676/530, loss: 0.0038263064343482256 2023-01-24 08:34:19.157417: step: 1680/530, loss: 0.00539175420999527 2023-01-24 08:34:20.190316: step: 1684/530, loss: 0.008887311443686485 2023-01-24 08:34:21.215944: step: 1688/530, loss: 2.9132600047887536e-06 2023-01-24 08:34:22.268841: step: 1692/530, loss: 0.003699810244143009 2023-01-24 08:34:23.320846: step: 1696/530, loss: 5.02561579196481e-06 2023-01-24 08:34:24.350077: step: 1700/530, loss: 0.010473739355802536 2023-01-24 08:34:25.416071: step: 1704/530, loss: 0.0027329218573868275 2023-01-24 08:34:26.460611: step: 1708/530, loss: 0.00011836125486297533 2023-01-24 08:34:27.519073: step: 1712/530, loss: 0.035101570188999176 2023-01-24 08:34:28.560990: step: 1716/530, loss: 0.00040708636515773833 2023-01-24 08:34:29.600897: step: 1720/530, loss: 0.004286528564989567 2023-01-24 08:34:30.642014: step: 1724/530, loss: 0.004051835276186466 2023-01-24 08:34:31.675296: step: 1728/530, loss: 0.0030248307157307863 2023-01-24 08:34:32.726371: step: 1732/530, loss: 3.635800749179907e-05 2023-01-24 08:34:33.754626: step: 1736/530, loss: 0.0011479301610961556 2023-01-24 08:34:34.809643: step: 1740/530, loss: 0.004842640366405249 2023-01-24 08:34:35.835764: step: 1744/530, loss: 0.00036109256325289607 2023-01-24 08:34:36.865198: step: 1748/530, loss: 0.00037143705412745476 2023-01-24 08:34:37.908175: step: 1752/530, loss: 6.472118548117578e-05 2023-01-24 08:34:38.957149: step: 1756/530, loss: 0.0007849947432987392 2023-01-24 08:34:39.986548: step: 1760/530, loss: 8.931572665460408e-05 2023-01-24 08:34:41.033539: step: 1764/530, loss: 0.0060320147313177586 2023-01-24 08:34:42.087033: step: 1768/530, loss: 0.0016902574570849538 2023-01-24 08:34:43.107472: step: 1772/530, loss: 0.0012195459567010403 2023-01-24 08:34:44.140032: step: 1776/530, loss: 0.005039629060775042 2023-01-24 08:34:45.187887: step: 1780/530, loss: 0.0013716467656195164 2023-01-24 08:34:46.229934: step: 1784/530, loss: 0.00011016071221092716 2023-01-24 08:34:47.271220: step: 1788/530, loss: 1.3999451766721904e-05 2023-01-24 08:34:48.319463: step: 1792/530, loss: 0.0007266805623658001 2023-01-24 08:34:49.368073: step: 1796/530, loss: 0.003449204843491316 2023-01-24 08:34:50.392765: step: 1800/530, loss: 0.000335844699293375 2023-01-24 08:34:51.417683: step: 1804/530, loss: 0.0018640717025846243 2023-01-24 08:34:52.467543: step: 1808/530, loss: 0.00794154778122902 2023-01-24 08:34:53.496869: step: 1812/530, loss: 0.00024242194194812328 2023-01-24 08:34:54.536435: step: 1816/530, loss: 0.001151465461589396 2023-01-24 08:34:55.567573: step: 1820/530, loss: 0.017692919820547104 2023-01-24 08:34:56.621145: step: 1824/530, loss: 0.0011846307897940278 2023-01-24 08:34:57.662362: step: 1828/530, loss: 2.58858926827088e-06 2023-01-24 08:34:58.707063: step: 1832/530, loss: 0.0022339913994073868 2023-01-24 08:34:59.743063: step: 1836/530, loss: 0.013790315017104149 2023-01-24 08:35:00.778091: step: 1840/530, loss: 0.0008367117843590677 2023-01-24 08:35:01.820158: step: 1844/530, loss: 0.0022090678103268147 2023-01-24 08:35:02.847358: step: 1848/530, loss: 0.0011798989726230502 2023-01-24 08:35:03.885965: step: 1852/530, loss: 5.579032949754037e-05 2023-01-24 08:35:04.918632: step: 1856/530, loss: 1.1214691767236218e-05 2023-01-24 08:35:05.945218: step: 1860/530, loss: 0.0021004825830459595 2023-01-24 08:35:06.991582: step: 1864/530, loss: 0.0024329901207238436 2023-01-24 08:35:08.026075: step: 1868/530, loss: 0.00197086320258677 2023-01-24 08:35:09.074924: step: 1872/530, loss: 0.0037525813095271587 2023-01-24 08:35:10.107195: step: 1876/530, loss: 0.0024905495811253786 2023-01-24 08:35:11.151197: step: 1880/530, loss: 0.00043110395199619234 2023-01-24 08:35:12.191820: step: 1884/530, loss: 0.004796598106622696 2023-01-24 08:35:13.235507: step: 1888/530, loss: 0.000504016992636025 2023-01-24 08:35:14.266917: step: 1892/530, loss: 0.0006832245853729546 2023-01-24 08:35:15.314597: step: 1896/530, loss: 0.0025829202495515347 2023-01-24 08:35:16.354930: step: 1900/530, loss: 0.0009293968323618174 2023-01-24 08:35:17.384840: step: 1904/530, loss: 1.6700187188689597e-05 2023-01-24 08:35:18.431109: step: 1908/530, loss: 0.0074868230149149895 2023-01-24 08:35:19.485941: step: 1912/530, loss: 0.017092956230044365 2023-01-24 08:35:20.519790: step: 1916/530, loss: 0.0016801649471744895 2023-01-24 08:35:21.555340: step: 1920/530, loss: 0.0006731111207045615 2023-01-24 08:35:22.618544: step: 1924/530, loss: 0.01573982462286949 2023-01-24 08:35:23.655470: step: 1928/530, loss: 0.005498635116964579 2023-01-24 08:35:24.704098: step: 1932/530, loss: 0.0031591299921274185 2023-01-24 08:35:25.747745: step: 1936/530, loss: 0.002266906201839447 2023-01-24 08:35:26.802300: step: 1940/530, loss: 0.00015798679669387639 2023-01-24 08:35:27.844390: step: 1944/530, loss: 0.00024810314062051475 2023-01-24 08:35:28.885995: step: 1948/530, loss: 0.0012339941458776593 2023-01-24 08:35:29.924958: step: 1952/530, loss: 0.0024772698525339365 2023-01-24 08:35:30.964313: step: 1956/530, loss: 0.006872924044728279 2023-01-24 08:35:31.992217: step: 1960/530, loss: 0.0005999120767228305 2023-01-24 08:35:33.031625: step: 1964/530, loss: 0.0002524539886508137 2023-01-24 08:35:34.062946: step: 1968/530, loss: 0.004628421273082495 2023-01-24 08:35:35.094466: step: 1972/530, loss: 0.00041213203803636134 2023-01-24 08:35:36.150333: step: 1976/530, loss: 2.120855953080536e-07 2023-01-24 08:35:37.196099: step: 1980/530, loss: 1.5685640391893685e-05 2023-01-24 08:35:38.227915: step: 1984/530, loss: 0.000372269656509161 2023-01-24 08:35:39.267537: step: 1988/530, loss: 0.0003649625869002193 2023-01-24 08:35:40.326331: step: 1992/530, loss: 0.007205056492239237 2023-01-24 08:35:41.352972: step: 1996/530, loss: 0.006570196710526943 2023-01-24 08:35:42.394560: step: 2000/530, loss: 0.013084542006254196 2023-01-24 08:35:43.442935: step: 2004/530, loss: 0.007469133008271456 2023-01-24 08:35:44.471969: step: 2008/530, loss: 0.0 2023-01-24 08:35:45.500345: step: 2012/530, loss: 0.00013008693349547684 2023-01-24 08:35:46.544155: step: 2016/530, loss: 0.00021896997350268066 2023-01-24 08:35:47.609265: step: 2020/530, loss: 0.0021309363655745983 2023-01-24 08:35:48.654609: step: 2024/530, loss: 0.0029911391902714968 2023-01-24 08:35:49.702720: step: 2028/530, loss: 0.005834572017192841 2023-01-24 08:35:50.752384: step: 2032/530, loss: 0.004073398187756538 2023-01-24 08:35:51.789172: step: 2036/530, loss: 0.00503756757825613 2023-01-24 08:35:52.848419: step: 2040/530, loss: 0.0012076168786734343 2023-01-24 08:35:53.879328: step: 2044/530, loss: 1.8324577695238986e-06 2023-01-24 08:35:54.927121: step: 2048/530, loss: 0.0027322161477059126 2023-01-24 08:35:55.966956: step: 2052/530, loss: 0.001722295070067048 2023-01-24 08:35:56.994988: step: 2056/530, loss: 0.00016037047316785902 2023-01-24 08:35:58.024294: step: 2060/530, loss: 0.000477560271974653 2023-01-24 08:35:59.061955: step: 2064/530, loss: 0.001003615790978074 2023-01-24 08:36:00.112793: step: 2068/530, loss: 0.008078647777438164 2023-01-24 08:36:01.173509: step: 2072/530, loss: 0.003271593013778329 2023-01-24 08:36:02.202102: step: 2076/530, loss: 0.004478019196540117 2023-01-24 08:36:03.255700: step: 2080/530, loss: 0.006007687654346228 2023-01-24 08:36:04.315743: step: 2084/530, loss: 0.0033141088206321 2023-01-24 08:36:05.360600: step: 2088/530, loss: 0.004116765223443508 2023-01-24 08:36:06.413955: step: 2092/530, loss: 0.010699407197535038 2023-01-24 08:36:07.449118: step: 2096/530, loss: 0.0010037511819973588 2023-01-24 08:36:08.492986: step: 2100/530, loss: 0.0009823129512369633 2023-01-24 08:36:09.530014: step: 2104/530, loss: 0.0011538874823600054 2023-01-24 08:36:10.569181: step: 2108/530, loss: 0.0014359421329572797 2023-01-24 08:36:11.621597: step: 2112/530, loss: 0.01336933858692646 2023-01-24 08:36:12.671533: step: 2116/530, loss: 0.001752842334099114 2023-01-24 08:36:13.707868: step: 2120/530, loss: 3.47580571542494e-05 ================================================== Loss: 0.003 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3699861111111111, 'r': 0.3159274193548387, 'f1': 0.3408265097236438}, 'combined': 0.25113532295426383, 'stategy': 1, 'epoch': 18} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.378100107192467, 'r': 0.3916533279466088, 'f1': 0.384757400276217}, 'combined': 0.29823300882654147, 'stategy': 1, 'epoch': 18} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3906499680409077, 'r': 0.33134826511249665, 'f1': 0.3585637283660898}, 'combined': 0.2642048524802767, 'stategy': 1, 'epoch': 18} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3706004271287038, 'r': 0.36685354781030693, 'f1': 0.3687174688384424}, 'combined': 0.2858001433101803, 'stategy': 1, 'epoch': 18} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3796028038504357, 'r': 0.3291811790505676, 'f1': 0.3525985393488803}, 'combined': 0.2598094500465434, 'stategy': 1, 'epoch': 18} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36262125027281583, 'r': 0.361621375501843, 'f1': 0.362120622683852}, 'combined': 0.2806867984439427, 'stategy': 1, 'epoch': 18} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 18} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.475, 'r': 0.41304347826086957, 'f1': 0.44186046511627913}, 'combined': 0.22093023255813957, 'stategy': 1, 'epoch': 18} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 18} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37786862527716186, 'r': 0.32337523719165084, 'f1': 0.3485046012269939}, 'combined': 0.2567928640619955, 'stategy': 1, 'epoch': 12} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37377987703702326, 'r': 0.38889597500543227, 'f1': 0.3811881268521715}, 'combined': 0.2954663949763244, 'stategy': 1, 'epoch': 12} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 12} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3851604396498889, 'r': 0.33473146368054857, 'f1': 0.3581796575830439}, 'combined': 0.26392185295592707, 'stategy': 1, 'epoch': 15} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3640887768447368, 'r': 0.3620809343253724, 'f1': 0.3630820797659034}, 'combined': 0.28143204268936056, 'stategy': 1, 'epoch': 15} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 15} ****************************** Epoch: 19 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-24 08:38:39.327920: step: 4/530, loss: 0.005626446567475796 2023-01-24 08:38:40.372289: step: 8/530, loss: 0.00014369042764883488 2023-01-24 08:38:41.416679: step: 12/530, loss: 0.010451801121234894 2023-01-24 08:38:42.456093: step: 16/530, loss: 3.443231435085181e-06 2023-01-24 08:38:43.517438: step: 20/530, loss: 0.00022170107695274055 2023-01-24 08:38:44.559449: step: 24/530, loss: 0.001158897764980793 2023-01-24 08:38:45.608692: step: 28/530, loss: 0.0005250044632703066 2023-01-24 08:38:46.652229: step: 32/530, loss: 0.0002517616958357394 2023-01-24 08:38:47.702123: step: 36/530, loss: 0.00015325793356169015 2023-01-24 08:38:48.748388: step: 40/530, loss: 0.0004214466898702085 2023-01-24 08:38:49.791652: step: 44/530, loss: 5.444366252049804e-05 2023-01-24 08:38:50.867226: step: 48/530, loss: 0.0020414115861058235 2023-01-24 08:38:51.910385: step: 52/530, loss: 0.0015358494129031897 2023-01-24 08:38:52.947678: step: 56/530, loss: 0.0013440109323710203 2023-01-24 08:38:53.993450: step: 60/530, loss: 0.00280355429276824 2023-01-24 08:38:55.026708: step: 64/530, loss: 0.0018657094333320856 2023-01-24 08:38:56.063989: step: 68/530, loss: 0.002636269200593233 2023-01-24 08:38:57.107422: step: 72/530, loss: 0.003890024730935693 2023-01-24 08:38:58.166139: step: 76/530, loss: 6.129233224783093e-05 2023-01-24 08:38:59.203318: step: 80/530, loss: 6.516681605717167e-05 2023-01-24 08:39:00.257582: step: 84/530, loss: 0.00024245383974630386 2023-01-24 08:39:01.302343: step: 88/530, loss: 0.0038589711766690016 2023-01-24 08:39:02.349303: step: 92/530, loss: 0.002299490850418806 2023-01-24 08:39:03.383847: step: 96/530, loss: 9.911660526995547e-06 2023-01-24 08:39:04.422785: step: 100/530, loss: 0.00015212695871014148 2023-01-24 08:39:05.459554: step: 104/530, loss: 0.0030536558479070663 2023-01-24 08:39:06.498775: step: 108/530, loss: 0.0023492123000323772 2023-01-24 08:39:07.549650: step: 112/530, loss: 0.003406766103580594 2023-01-24 08:39:08.596121: step: 116/530, loss: 0.0026423195376992226 2023-01-24 08:39:09.650741: step: 120/530, loss: 0.00137248111423105 2023-01-24 08:39:10.679357: step: 124/530, loss: 0.001738875056616962 2023-01-24 08:39:11.727665: step: 128/530, loss: 0.0015760643873363733 2023-01-24 08:39:12.771856: step: 132/530, loss: 0.0004440586781129241 2023-01-24 08:39:13.821883: step: 136/530, loss: 0.0036454659420996904 2023-01-24 08:39:14.863926: step: 140/530, loss: 0.0005197924911044538 2023-01-24 08:39:15.908846: step: 144/530, loss: 0.013064837083220482 2023-01-24 08:39:16.944841: step: 148/530, loss: 0.004167779814451933 2023-01-24 08:39:17.990218: step: 152/530, loss: 0.00935199111700058 2023-01-24 08:39:19.045166: step: 156/530, loss: 0.006484498269855976 2023-01-24 08:39:20.085792: step: 160/530, loss: 0.025635844096541405 2023-01-24 08:39:21.118162: step: 164/530, loss: 1.6109053149193642e-06 2023-01-24 08:39:22.153273: step: 168/530, loss: 1.649110345169902e-05 2023-01-24 08:39:23.197191: step: 172/530, loss: 0.004525516647845507 2023-01-24 08:39:24.240305: step: 176/530, loss: 0.007596456445753574 2023-01-24 08:39:25.282430: step: 180/530, loss: 0.0022685991134494543 2023-01-24 08:39:26.322919: step: 184/530, loss: 0.000429784064181149 2023-01-24 08:39:27.347575: step: 188/530, loss: 0.0015707494458183646 2023-01-24 08:39:28.388928: step: 192/530, loss: 0.003487711539492011 2023-01-24 08:39:29.419448: step: 196/530, loss: 0.00016858085291460156 2023-01-24 08:39:30.463277: step: 200/530, loss: 0.010343965142965317 2023-01-24 08:39:31.511897: step: 204/530, loss: 0.001973228296265006 2023-01-24 08:39:32.556278: step: 208/530, loss: 0.0 2023-01-24 08:39:33.616366: step: 212/530, loss: 0.006910588126629591 2023-01-24 08:39:34.661116: step: 216/530, loss: 1.8952407117467374e-05 2023-01-24 08:39:35.709412: step: 220/530, loss: 0.00035080115776509047 2023-01-24 08:39:36.761689: step: 224/530, loss: 0.001980482367798686 2023-01-24 08:39:37.797990: step: 228/530, loss: 5.317779505276121e-05 2023-01-24 08:39:38.838471: step: 232/530, loss: 0.004836398642510176 2023-01-24 08:39:39.885272: step: 236/530, loss: 0.0056937807239592075 2023-01-24 08:39:40.924260: step: 240/530, loss: 0.002523608971387148 2023-01-24 08:39:41.972348: step: 244/530, loss: 0.00043353429646231234 2023-01-24 08:39:43.021890: step: 248/530, loss: 6.026616716781064e-08 2023-01-24 08:39:44.048936: step: 252/530, loss: 0.0026329131796956062 2023-01-24 08:39:45.088881: step: 256/530, loss: 0.00041145726572722197 2023-01-24 08:39:46.138917: step: 260/530, loss: 0.0027066851034760475 2023-01-24 08:39:47.182895: step: 264/530, loss: 0.00023460002557840198 2023-01-24 08:39:48.233022: step: 268/530, loss: 0.002958378056064248 2023-01-24 08:39:49.265494: step: 272/530, loss: 2.5870322133414447e-05 2023-01-24 08:39:50.339532: step: 276/530, loss: 0.008892868645489216 2023-01-24 08:39:51.391571: step: 280/530, loss: 9.65287399594672e-05 2023-01-24 08:39:52.430943: step: 284/530, loss: 0.0010161735117435455 2023-01-24 08:39:53.473573: step: 288/530, loss: 0.0008460739045403898 2023-01-24 08:39:54.504095: step: 292/530, loss: 0.006211341358721256 2023-01-24 08:39:55.545295: step: 296/530, loss: 0.005600426346063614 2023-01-24 08:39:56.607919: step: 300/530, loss: 1.3914585679231095e-06 2023-01-24 08:39:57.659666: step: 304/530, loss: 0.0029889405705034733 2023-01-24 08:39:58.702257: step: 308/530, loss: 3.432559196880902e-07 2023-01-24 08:39:59.741332: step: 312/530, loss: 6.819624900344934e-07 2023-01-24 08:40:00.775200: step: 316/530, loss: 1.9061630155192688e-05 2023-01-24 08:40:01.848357: step: 320/530, loss: 0.002788847777992487 2023-01-24 08:40:02.890713: step: 324/530, loss: 0.00019209779566153884 2023-01-24 08:40:03.953660: step: 328/530, loss: 6.264240073505789e-05 2023-01-24 08:40:05.012417: step: 332/530, loss: 0.005913532339036465 2023-01-24 08:40:06.043040: step: 336/530, loss: 2.0686725292762276e-06 2023-01-24 08:40:07.087656: step: 340/530, loss: 0.0016512090805917978 2023-01-24 08:40:08.129611: step: 344/530, loss: 0.00014736366574652493 2023-01-24 08:40:09.177391: step: 348/530, loss: 0.0013936960604041815 2023-01-24 08:40:10.234918: step: 352/530, loss: 0.00015973685367498547 2023-01-24 08:40:11.274412: step: 356/530, loss: 0.0017561035929247737 2023-01-24 08:40:12.311188: step: 360/530, loss: 0.0007700967253185809 2023-01-24 08:40:13.364865: step: 364/530, loss: 0.005132708232849836 2023-01-24 08:40:14.408829: step: 368/530, loss: 0.0008344475063495338 2023-01-24 08:40:15.444639: step: 372/530, loss: 0.0010486284736543894 2023-01-24 08:40:16.495186: step: 376/530, loss: 2.4150840545189567e-05 2023-01-24 08:40:17.540602: step: 380/530, loss: 0.0018868526676669717 2023-01-24 08:40:18.588646: step: 384/530, loss: 0.0005680397152900696 2023-01-24 08:40:19.625406: step: 388/530, loss: 0.0001443260844098404 2023-01-24 08:40:20.667711: step: 392/530, loss: 0.00017575845413375646 2023-01-24 08:40:21.707792: step: 396/530, loss: 0.005213476717472076 2023-01-24 08:40:22.751380: step: 400/530, loss: 0.0011082661803811789 2023-01-24 08:40:23.785896: step: 404/530, loss: 0.003028241917490959 2023-01-24 08:40:24.826632: step: 408/530, loss: 0.0023756646551191807 2023-01-24 08:40:25.873987: step: 412/530, loss: 0.00290953298099339 2023-01-24 08:40:26.923606: step: 416/530, loss: 3.7953264836687595e-05 2023-01-24 08:40:27.971598: step: 420/530, loss: 0.013020087033510208 2023-01-24 08:40:29.021756: step: 424/530, loss: 0.00021397035743575543 2023-01-24 08:40:30.059511: step: 428/530, loss: 9.09421214601025e-06 2023-01-24 08:40:31.094651: step: 432/530, loss: 0.004044977482408285 2023-01-24 08:40:32.159959: step: 436/530, loss: 0.000284249079413712 2023-01-24 08:40:33.236824: step: 440/530, loss: 0.0008995109819807112 2023-01-24 08:40:34.291358: step: 444/530, loss: 0.0006774552166461945 2023-01-24 08:40:35.333132: step: 448/530, loss: 0.000935703341383487 2023-01-24 08:40:36.380524: step: 452/530, loss: 0.004483042284846306 2023-01-24 08:40:37.426966: step: 456/530, loss: 0.00899346824735403 2023-01-24 08:40:38.482717: step: 460/530, loss: 1.3523878806154244e-05 2023-01-24 08:40:39.524390: step: 464/530, loss: 0.0031942466739565134 2023-01-24 08:40:40.574604: step: 468/530, loss: 0.00030736022745259106 2023-01-24 08:40:41.597785: step: 472/530, loss: 0.00269091734662652 2023-01-24 08:40:42.641142: step: 476/530, loss: 0.0034265455324202776 2023-01-24 08:40:43.684512: step: 480/530, loss: 0.004724216181784868 2023-01-24 08:40:44.736465: step: 484/530, loss: 0.0055031911469995975 2023-01-24 08:40:45.792445: step: 488/530, loss: 0.004729169420897961 2023-01-24 08:40:46.844347: step: 492/530, loss: 0.005532048176974058 2023-01-24 08:40:47.892486: step: 496/530, loss: 1.925692595250439e-05 2023-01-24 08:40:48.941334: step: 500/530, loss: 0.0018275126349180937 2023-01-24 08:40:49.992780: step: 504/530, loss: 0.0008080166298896074 2023-01-24 08:40:51.044498: step: 508/530, loss: 0.0010295987594872713 2023-01-24 08:40:52.085013: step: 512/530, loss: 0.0007535787299275398 2023-01-24 08:40:53.140381: step: 516/530, loss: 0.00426517566666007 2023-01-24 08:40:54.180878: step: 520/530, loss: 0.0005689088138751686 2023-01-24 08:40:55.230468: step: 524/530, loss: 0.0015364977298304439 2023-01-24 08:40:56.263775: step: 528/530, loss: 0.0021460126154124737 2023-01-24 08:40:57.302357: step: 532/530, loss: 0.0008248817175626755 2023-01-24 08:40:58.361569: step: 536/530, loss: 0.0001414690923411399 2023-01-24 08:40:59.393556: step: 540/530, loss: 0.0011817824561148882 2023-01-24 08:41:00.444495: step: 544/530, loss: 0.0007488696137443185 2023-01-24 08:41:01.504350: step: 548/530, loss: 0.003530869958922267 2023-01-24 08:41:02.558536: step: 552/530, loss: 0.00010069393465528265 2023-01-24 08:41:03.616728: step: 556/530, loss: 3.1637435427001037e-07 2023-01-24 08:41:04.656471: step: 560/530, loss: 2.0649536963901483e-05 2023-01-24 08:41:05.691601: step: 564/530, loss: 0.000263277324847877 2023-01-24 08:41:06.742370: step: 568/530, loss: 0.0031225415877997875 2023-01-24 08:41:07.795997: step: 572/530, loss: 0.0017694475827738643 2023-01-24 08:41:08.844438: step: 576/530, loss: 8.599702414358035e-05 2023-01-24 08:41:09.897169: step: 580/530, loss: 0.0014183823950588703 2023-01-24 08:41:10.938849: step: 584/530, loss: 0.0019364558393135667 2023-01-24 08:41:11.988108: step: 588/530, loss: 0.002726313890889287 2023-01-24 08:41:13.036071: step: 592/530, loss: 0.008177314884960651 2023-01-24 08:41:14.071016: step: 596/530, loss: 0.0003128675161860883 2023-01-24 08:41:15.133993: step: 600/530, loss: 0.00030083622550591826 2023-01-24 08:41:16.199291: step: 604/530, loss: 0.00013375611160881817 2023-01-24 08:41:17.235564: step: 608/530, loss: 0.00041740009328350425 2023-01-24 08:41:18.279872: step: 612/530, loss: 0.0022147924173623323 2023-01-24 08:41:19.344702: step: 616/530, loss: 0.001118602929636836 2023-01-24 08:41:20.383056: step: 620/530, loss: 4.026249735034071e-05 2023-01-24 08:41:21.432847: step: 624/530, loss: 0.0009214036981575191 2023-01-24 08:41:22.498013: step: 628/530, loss: 0.0006902736495248973 2023-01-24 08:41:23.528672: step: 632/530, loss: 0.005331212654709816 2023-01-24 08:41:24.573347: step: 636/530, loss: 0.005170522257685661 2023-01-24 08:41:25.618282: step: 640/530, loss: 0.0009643434314057231 2023-01-24 08:41:26.659653: step: 644/530, loss: 1.0169541383220349e-05 2023-01-24 08:41:27.712201: step: 648/530, loss: 0.002622185042127967 2023-01-24 08:41:28.744762: step: 652/530, loss: 0.001706407405436039 2023-01-24 08:41:29.781380: step: 656/530, loss: 0.0002552588121034205 2023-01-24 08:41:30.837136: step: 660/530, loss: 0.0011450779857113957 2023-01-24 08:41:31.868129: step: 664/530, loss: 0.0007268712506629527 2023-01-24 08:41:32.927413: step: 668/530, loss: 8.73974640853703e-05 2023-01-24 08:41:33.976685: step: 672/530, loss: 0.0011688433587551117 2023-01-24 08:41:35.073283: step: 676/530, loss: 0.001862452831119299 2023-01-24 08:41:36.120937: step: 680/530, loss: 0.0006581024499610066 2023-01-24 08:41:37.158891: step: 684/530, loss: 0.008058595471084118 2023-01-24 08:41:38.196883: step: 688/530, loss: 0.0001351031387457624 2023-01-24 08:41:39.241066: step: 692/530, loss: 0.0024865635205060244 2023-01-24 08:41:40.306411: step: 696/530, loss: 1.6259475160040893e-05 2023-01-24 08:41:41.332918: step: 700/530, loss: 0.0016584255499765277 2023-01-24 08:41:42.377070: step: 704/530, loss: 1.6649722965667024e-05 2023-01-24 08:41:43.421778: step: 708/530, loss: 0.0019168462604284286 2023-01-24 08:41:44.470246: step: 712/530, loss: 4.232570790918544e-05 2023-01-24 08:41:45.508146: step: 716/530, loss: 0.0002777922782115638 2023-01-24 08:41:46.556068: step: 720/530, loss: 0.0002649379603099078 2023-01-24 08:41:47.593977: step: 724/530, loss: 0.0010126122506335378 2023-01-24 08:41:48.639349: step: 728/530, loss: 3.378981273272075e-05 2023-01-24 08:41:49.687402: step: 732/530, loss: 0.009026461280882359 2023-01-24 08:41:50.732346: step: 736/530, loss: 0.0019466986414045095 2023-01-24 08:41:51.781405: step: 740/530, loss: 0.0003420878201723099 2023-01-24 08:41:52.827044: step: 744/530, loss: 0.00219076219946146 2023-01-24 08:41:53.863157: step: 748/530, loss: 8.032878395169973e-05 2023-01-24 08:41:54.895183: step: 752/530, loss: 0.00026065041311085224 2023-01-24 08:41:55.951633: step: 756/530, loss: 0.0050124977715313435 2023-01-24 08:41:57.013955: step: 760/530, loss: 0.0017083699349313974 2023-01-24 08:41:58.058540: step: 764/530, loss: 0.0024439250119030476 2023-01-24 08:41:59.099700: step: 768/530, loss: 0.0020100956317037344 2023-01-24 08:42:00.136693: step: 772/530, loss: 2.3693635739618912e-05 2023-01-24 08:42:01.199662: step: 776/530, loss: 0.000990989850834012 2023-01-24 08:42:02.252102: step: 780/530, loss: 8.82792937773047e-06 2023-01-24 08:42:03.282471: step: 784/530, loss: 0.006131125148385763 2023-01-24 08:42:04.332999: step: 788/530, loss: 0.0003794836811721325 2023-01-24 08:42:05.388264: step: 792/530, loss: 0.0008318485924974084 2023-01-24 08:42:06.430669: step: 796/530, loss: 0.0004544957191683352 2023-01-24 08:42:07.464409: step: 800/530, loss: 0.00012144893844379112 2023-01-24 08:42:08.509292: step: 804/530, loss: 0.0013561670202761889 2023-01-24 08:42:09.551829: step: 808/530, loss: 0.0019005938665941358 2023-01-24 08:42:10.587666: step: 812/530, loss: 0.0024295980110764503 2023-01-24 08:42:11.631805: step: 816/530, loss: 0.0023929672315716743 2023-01-24 08:42:12.679183: step: 820/530, loss: 0.0005442625842988491 2023-01-24 08:42:13.717209: step: 824/530, loss: 0.005113847553730011 2023-01-24 08:42:14.759626: step: 828/530, loss: 0.00027917444822378457 2023-01-24 08:42:15.797609: step: 832/530, loss: 0.0007879415643401444 2023-01-24 08:42:16.845504: step: 836/530, loss: 0.0010107087437063456 2023-01-24 08:42:17.903616: step: 840/530, loss: 0.0006676812190562487 2023-01-24 08:42:18.955188: step: 844/530, loss: 0.0002876889775507152 2023-01-24 08:42:19.986768: step: 848/530, loss: 0.0011974034132435918 2023-01-24 08:42:21.042752: step: 852/530, loss: 0.0017826578114181757 2023-01-24 08:42:22.101154: step: 856/530, loss: 0.0002193367254221812 2023-01-24 08:42:23.146800: step: 860/530, loss: 0.002746338490396738 2023-01-24 08:42:24.188605: step: 864/530, loss: 0.003912175539880991 2023-01-24 08:42:25.236224: step: 868/530, loss: 2.355910328333266e-05 2023-01-24 08:42:26.275433: step: 872/530, loss: 0.005852560047060251 2023-01-24 08:42:27.307744: step: 876/530, loss: 2.7279505957267247e-05 2023-01-24 08:42:28.346709: step: 880/530, loss: 0.006939339451491833 2023-01-24 08:42:29.387767: step: 884/530, loss: 9.038711141329259e-06 2023-01-24 08:42:30.438736: step: 888/530, loss: 0.008145336993038654 2023-01-24 08:42:31.480413: step: 892/530, loss: 0.0004597233491949737 2023-01-24 08:42:32.528557: step: 896/530, loss: 0.00010788706276798621 2023-01-24 08:42:33.568104: step: 900/530, loss: 0.0011391089065000415 2023-01-24 08:42:34.609898: step: 904/530, loss: 0.006249002646654844 2023-01-24 08:42:35.642775: step: 908/530, loss: 0.00013312860392034054 2023-01-24 08:42:36.687000: step: 912/530, loss: 1.7742576119417208e-06 2023-01-24 08:42:37.730004: step: 916/530, loss: 3.2327850476576714e-06 2023-01-24 08:42:38.764841: step: 920/530, loss: 0.014845973812043667 2023-01-24 08:42:39.793404: step: 924/530, loss: 8.19013348518638e-06 2023-01-24 08:42:40.843121: step: 928/530, loss: 0.0017061250982806087 2023-01-24 08:42:41.888134: step: 932/530, loss: 0.0003770788316614926 2023-01-24 08:42:42.927949: step: 936/530, loss: 0.0002954646770376712 2023-01-24 08:42:43.986359: step: 940/530, loss: 0.0008622297318652272 2023-01-24 08:42:45.044381: step: 944/530, loss: 0.0012343886774033308 2023-01-24 08:42:46.091488: step: 948/530, loss: 0.0010636313818395138 2023-01-24 08:42:47.137135: step: 952/530, loss: 1.2405379493429791e-05 2023-01-24 08:42:48.181602: step: 956/530, loss: 0.0007470149430446327 2023-01-24 08:42:49.228877: step: 960/530, loss: 0.001472724019549787 2023-01-24 08:42:50.280894: step: 964/530, loss: 0.0018367304001003504 2023-01-24 08:42:51.326210: step: 968/530, loss: 0.003949539735913277 2023-01-24 08:42:52.383081: step: 972/530, loss: 0.003995168022811413 2023-01-24 08:42:53.422374: step: 976/530, loss: 0.00022083039220888168 2023-01-24 08:42:54.465811: step: 980/530, loss: 0.002190894214436412 2023-01-24 08:42:55.505821: step: 984/530, loss: 3.09558272419963e-05 2023-01-24 08:42:56.558946: step: 988/530, loss: 0.0006759811658412218 2023-01-24 08:42:57.592959: step: 992/530, loss: 0.003623665077611804 2023-01-24 08:42:58.639533: step: 996/530, loss: 0.0014246400678530335 2023-01-24 08:42:59.674269: step: 1000/530, loss: 0.0017691166140139103 2023-01-24 08:43:00.710786: step: 1004/530, loss: 0.0010221840348094702 2023-01-24 08:43:01.772634: step: 1008/530, loss: 0.0018256825860589743 2023-01-24 08:43:02.827158: step: 1012/530, loss: 0.00019149246509186924 2023-01-24 08:43:03.877205: step: 1016/530, loss: 0.00151846616063267 2023-01-24 08:43:04.917517: step: 1020/530, loss: 0.00743184145539999 2023-01-24 08:43:05.975445: step: 1024/530, loss: 0.010206153616309166 2023-01-24 08:43:07.020581: step: 1028/530, loss: 7.514876779168844e-05 2023-01-24 08:43:08.068033: step: 1032/530, loss: 0.002149930689483881 2023-01-24 08:43:09.114579: step: 1036/530, loss: 0.0023523711133748293 2023-01-24 08:43:10.144677: step: 1040/530, loss: 0.000745853059925139 2023-01-24 08:43:11.183303: step: 1044/530, loss: 0.0012126355431973934 2023-01-24 08:43:12.241085: step: 1048/530, loss: 0.0017065427964553237 2023-01-24 08:43:13.286241: step: 1052/530, loss: 5.352330481400713e-05 2023-01-24 08:43:14.339771: step: 1056/530, loss: 0.003741718828678131 2023-01-24 08:43:15.366899: step: 1060/530, loss: 0.00025653469492681324 2023-01-24 08:43:16.418314: step: 1064/530, loss: 0.003100144909694791 2023-01-24 08:43:17.453118: step: 1068/530, loss: 0.00930363405495882 2023-01-24 08:43:18.495288: step: 1072/530, loss: 0.0038777559529989958 2023-01-24 08:43:19.527995: step: 1076/530, loss: 0.004641006235033274 2023-01-24 08:43:20.572114: step: 1080/530, loss: 0.0009079177980311215 2023-01-24 08:43:21.617007: step: 1084/530, loss: 0.004109915345907211 2023-01-24 08:43:22.664419: step: 1088/530, loss: 0.00040428826468996704 2023-01-24 08:43:23.720863: step: 1092/530, loss: 1.1030459063476883e-05 2023-01-24 08:43:24.746491: step: 1096/530, loss: 0.007341318763792515 2023-01-24 08:43:25.791026: step: 1100/530, loss: 0.003847693093121052 2023-01-24 08:43:26.835678: step: 1104/530, loss: 0.0004101607482880354 2023-01-24 08:43:27.885801: step: 1108/530, loss: 0.01341897714883089 2023-01-24 08:43:28.956300: step: 1112/530, loss: 0.024929696694016457 2023-01-24 08:43:30.003049: step: 1116/530, loss: 0.008607692085206509 2023-01-24 08:43:31.073886: step: 1120/530, loss: 0.001027898513711989 2023-01-24 08:43:32.110317: step: 1124/530, loss: 0.0032819602638483047 2023-01-24 08:43:33.154384: step: 1128/530, loss: 0.002644893480464816 2023-01-24 08:43:34.202514: step: 1132/530, loss: 0.0008560423157177866 2023-01-24 08:43:35.261248: step: 1136/530, loss: 0.006139503791928291 2023-01-24 08:43:36.308817: step: 1140/530, loss: 0.0020366166718304157 2023-01-24 08:43:37.336200: step: 1144/530, loss: 0.002872372744604945 2023-01-24 08:43:38.371507: step: 1148/530, loss: 0.00046451052185148 2023-01-24 08:43:39.418999: step: 1152/530, loss: 0.0019574458710849285 2023-01-24 08:43:40.450923: step: 1156/530, loss: 0.0006437331321649253 2023-01-24 08:43:41.481651: step: 1160/530, loss: 2.329449671378825e-05 2023-01-24 08:43:42.539840: step: 1164/530, loss: 0.0019324080785736442 2023-01-24 08:43:43.577261: step: 1168/530, loss: 0.011647249571979046 2023-01-24 08:43:44.620814: step: 1172/530, loss: 0.000496596738230437 2023-01-24 08:43:45.663977: step: 1176/530, loss: 0.0005437369109131396 2023-01-24 08:43:46.704994: step: 1180/530, loss: 0.01833151839673519 2023-01-24 08:43:47.746660: step: 1184/530, loss: 0.010786481201648712 2023-01-24 08:43:48.785874: step: 1188/530, loss: 0.0006603167857974768 2023-01-24 08:43:49.823629: step: 1192/530, loss: 7.851884583942592e-05 2023-01-24 08:43:50.861662: step: 1196/530, loss: 0.0007735260878689587 2023-01-24 08:43:51.905464: step: 1200/530, loss: 2.752328555288841e-06 2023-01-24 08:43:52.933963: step: 1204/530, loss: 0.00020667779608629644 2023-01-24 08:43:53.960653: step: 1208/530, loss: 0.003709016367793083 2023-01-24 08:43:54.997098: step: 1212/530, loss: 0.013338254764676094 2023-01-24 08:43:56.041360: step: 1216/530, loss: 0.008043644949793816 2023-01-24 08:43:57.082609: step: 1220/530, loss: 0.0032047561835497618 2023-01-24 08:43:58.120440: step: 1224/530, loss: 3.533139897626825e-05 2023-01-24 08:43:59.176526: step: 1228/530, loss: 0.004353194963186979 2023-01-24 08:44:00.242184: step: 1232/530, loss: 0.0011323824292048812 2023-01-24 08:44:01.299982: step: 1236/530, loss: 0.00013187172589823604 2023-01-24 08:44:02.356170: step: 1240/530, loss: 0.000815546081867069 2023-01-24 08:44:03.411304: step: 1244/530, loss: 0.004494329448789358 2023-01-24 08:44:04.448201: step: 1248/530, loss: 0.00019237086235079914 2023-01-24 08:44:05.481332: step: 1252/530, loss: 0.0023239210713654757 2023-01-24 08:44:06.541133: step: 1256/530, loss: 0.001449662260711193 2023-01-24 08:44:07.570560: step: 1260/530, loss: 9.828144357015844e-06 2023-01-24 08:44:08.624856: step: 1264/530, loss: 0.006015796214342117 2023-01-24 08:44:09.682481: step: 1268/530, loss: 0.0027719291392713785 2023-01-24 08:44:10.722072: step: 1272/530, loss: 0.0003320998512208462 2023-01-24 08:44:11.769015: step: 1276/530, loss: 0.0001519552170066163 2023-01-24 08:44:12.799401: step: 1280/530, loss: 5.461227192427032e-05 2023-01-24 08:44:13.850500: step: 1284/530, loss: 0.002218343084678054 2023-01-24 08:44:14.896827: step: 1288/530, loss: 7.999590889085084e-05 2023-01-24 08:44:15.934606: step: 1292/530, loss: 0.002180244540795684 2023-01-24 08:44:16.970542: step: 1296/530, loss: 0.0031195455230772495 2023-01-24 08:44:18.014251: step: 1300/530, loss: 0.00729980506002903 2023-01-24 08:44:19.059587: step: 1304/530, loss: 0.0004911327268928289 2023-01-24 08:44:20.096497: step: 1308/530, loss: 0.004196009133011103 2023-01-24 08:44:21.134878: step: 1312/530, loss: 0.0036911985371261835 2023-01-24 08:44:22.172812: step: 1316/530, loss: 0.0025881011970341206 2023-01-24 08:44:23.223891: step: 1320/530, loss: 8.970306953415275e-05 2023-01-24 08:44:24.276948: step: 1324/530, loss: 0.0012659200001507998 2023-01-24 08:44:25.327926: step: 1328/530, loss: 0.00011973016808042303 2023-01-24 08:44:26.391361: step: 1332/530, loss: 1.3773040336673148e-05 2023-01-24 08:44:27.426857: step: 1336/530, loss: 0.0023343595676124096 2023-01-24 08:44:28.467852: step: 1340/530, loss: 0.005378260277211666 2023-01-24 08:44:29.493521: step: 1344/530, loss: 1.0857224879146088e-06 2023-01-24 08:44:30.522907: step: 1348/530, loss: 0.0007610554457642138 2023-01-24 08:44:31.562604: step: 1352/530, loss: 9.709344885777682e-05 2023-01-24 08:44:32.603606: step: 1356/530, loss: 0.0 2023-01-24 08:44:33.645673: step: 1360/530, loss: 1.2003538074623066e-07 2023-01-24 08:44:34.694449: step: 1364/530, loss: 0.0001666335592744872 2023-01-24 08:44:35.739038: step: 1368/530, loss: 0.005986809730529785 2023-01-24 08:44:36.782627: step: 1372/530, loss: 0.0008152473019436002 2023-01-24 08:44:37.826945: step: 1376/530, loss: 6.772181677661138e-07 2023-01-24 08:44:38.868690: step: 1380/530, loss: 0.016878999769687653 2023-01-24 08:44:39.910904: step: 1384/530, loss: 0.0006100684404373169 2023-01-24 08:44:40.963888: step: 1388/530, loss: 0.0013175173662602901 2023-01-24 08:44:41.999695: step: 1392/530, loss: 0.000431124703027308 2023-01-24 08:44:43.044893: step: 1396/530, loss: 1.8923074094345793e-06 2023-01-24 08:44:44.082249: step: 1400/530, loss: 0.0026847615372389555 2023-01-24 08:44:45.121740: step: 1404/530, loss: 0.0049303616397082806 2023-01-24 08:44:46.151830: step: 1408/530, loss: 0.0003786585293710232 2023-01-24 08:44:47.193026: step: 1412/530, loss: 0.0028419815935194492 2023-01-24 08:44:48.227277: step: 1416/530, loss: 0.0011984541779384017 2023-01-24 08:44:49.274449: step: 1420/530, loss: 7.219785038614646e-05 2023-01-24 08:44:50.312853: step: 1424/530, loss: 0.004033208824694157 2023-01-24 08:44:51.362195: step: 1428/530, loss: 0.02244948036968708 2023-01-24 08:44:52.402987: step: 1432/530, loss: 0.007330878637731075 2023-01-24 08:44:53.447471: step: 1436/530, loss: 0.004972193855792284 2023-01-24 08:44:54.490373: step: 1440/530, loss: 4.1494113247608766e-05 2023-01-24 08:44:55.558861: step: 1444/530, loss: 0.0028021596372127533 2023-01-24 08:44:56.610738: step: 1448/530, loss: 0.0029528236482292414 2023-01-24 08:44:57.638340: step: 1452/530, loss: 0.0008357432670891285 2023-01-24 08:44:58.679151: step: 1456/530, loss: 0.0011378773488104343 2023-01-24 08:44:59.714073: step: 1460/530, loss: 0.009751907549798489 2023-01-24 08:45:00.752276: step: 1464/530, loss: 0.0014992222422733903 2023-01-24 08:45:01.809001: step: 1468/530, loss: 0.002464254852384329 2023-01-24 08:45:02.854878: step: 1472/530, loss: 3.395184830878861e-05 2023-01-24 08:45:03.919135: step: 1476/530, loss: 0.004051372408866882 2023-01-24 08:45:04.952887: step: 1480/530, loss: 0.0015022637089714408 2023-01-24 08:45:05.987895: step: 1484/530, loss: 0.004045954905450344 2023-01-24 08:45:07.038953: step: 1488/530, loss: 0.004026063717901707 2023-01-24 08:45:08.082675: step: 1492/530, loss: 2.733970177359879e-05 2023-01-24 08:45:09.136839: step: 1496/530, loss: 0.005752569530159235 2023-01-24 08:45:10.198370: step: 1500/530, loss: 0.0016751571092754602 2023-01-24 08:45:11.253504: step: 1504/530, loss: 0.002858343068510294 2023-01-24 08:45:12.287557: step: 1508/530, loss: 0.0002025643625529483 2023-01-24 08:45:13.323733: step: 1512/530, loss: 0.004421581048518419 2023-01-24 08:45:14.381563: step: 1516/530, loss: 0.00011061177065130323 2023-01-24 08:45:15.411676: step: 1520/530, loss: 0.0016932482831180096 2023-01-24 08:45:16.445068: step: 1524/530, loss: 0.00027803966077044606 2023-01-24 08:45:17.470056: step: 1528/530, loss: 0.001186358043923974 2023-01-24 08:45:18.503947: step: 1532/530, loss: 0.0011938621755689383 2023-01-24 08:45:19.544027: step: 1536/530, loss: 0.0001307249185629189 2023-01-24 08:45:20.583452: step: 1540/530, loss: 0.000702088582329452 2023-01-24 08:45:21.622395: step: 1544/530, loss: 0.0026872078888118267 2023-01-24 08:45:22.660882: step: 1548/530, loss: 0.00996373686939478 2023-01-24 08:45:23.700979: step: 1552/530, loss: 0.0012249033898115158 2023-01-24 08:45:24.743081: step: 1556/530, loss: 0.0033129968214780092 2023-01-24 08:45:25.790406: step: 1560/530, loss: 0.0001788036315701902 2023-01-24 08:45:26.817171: step: 1564/530, loss: 0.0005180523148737848 2023-01-24 08:45:27.856449: step: 1568/530, loss: 0.008451927453279495 2023-01-24 08:45:28.896272: step: 1572/530, loss: 5.736790598120933e-08 2023-01-24 08:45:29.963178: step: 1576/530, loss: 0.00038226452306844294 2023-01-24 08:45:31.020862: step: 1580/530, loss: 0.0011892697075381875 2023-01-24 08:45:32.063334: step: 1584/530, loss: 1.6682479326846078e-05 2023-01-24 08:45:33.096382: step: 1588/530, loss: 0.0036256397143006325 2023-01-24 08:45:34.127352: step: 1592/530, loss: 5.045654688728973e-06 2023-01-24 08:45:35.156407: step: 1596/530, loss: 0.0005896550719626248 2023-01-24 08:45:36.188526: step: 1600/530, loss: 0.005167139694094658 2023-01-24 08:45:37.234263: step: 1604/530, loss: 0.009650243446230888 2023-01-24 08:45:38.294699: step: 1608/530, loss: 0.0011538421967998147 2023-01-24 08:45:39.349199: step: 1612/530, loss: 0.0001134164776885882 2023-01-24 08:45:40.399431: step: 1616/530, loss: 0.002002834342420101 2023-01-24 08:45:41.434236: step: 1620/530, loss: 0.0014718525344505906 2023-01-24 08:45:42.459690: step: 1624/530, loss: 0.00032226493931375444 2023-01-24 08:45:43.515480: step: 1628/530, loss: 0.006582689471542835 2023-01-24 08:45:44.550131: step: 1632/530, loss: 1.0673220458556898e-05 2023-01-24 08:45:45.605307: step: 1636/530, loss: 0.005204511806368828 2023-01-24 08:45:46.664630: step: 1640/530, loss: 0.0005761709180660546 2023-01-24 08:45:47.725623: step: 1644/530, loss: 0.00013568585563916713 2023-01-24 08:45:48.797887: step: 1648/530, loss: 0.002421013545244932 2023-01-24 08:45:49.834309: step: 1652/530, loss: 0.0002153374080080539 2023-01-24 08:45:50.873237: step: 1656/530, loss: 0.001389373210258782 2023-01-24 08:45:51.920377: step: 1660/530, loss: 0.001180328894406557 2023-01-24 08:45:52.981611: step: 1664/530, loss: 0.004765115678310394 2023-01-24 08:45:54.010339: step: 1668/530, loss: 0.011473272927105427 2023-01-24 08:45:55.079942: step: 1672/530, loss: 0.00356234866194427 2023-01-24 08:45:56.123497: step: 1676/530, loss: 0.007072188891470432 2023-01-24 08:45:57.170913: step: 1680/530, loss: 0.0021764098200947046 2023-01-24 08:45:58.228014: step: 1684/530, loss: 0.00010520782961975783 2023-01-24 08:45:59.265381: step: 1688/530, loss: 0.001124878996051848 2023-01-24 08:46:00.308270: step: 1692/530, loss: 0.0007139877998270094 2023-01-24 08:46:01.344135: step: 1696/530, loss: 0.0 2023-01-24 08:46:02.404556: step: 1700/530, loss: 0.0017955448711290956 2023-01-24 08:46:03.467133: step: 1704/530, loss: 9.446531294088345e-06 2023-01-24 08:46:04.519620: step: 1708/530, loss: 3.950011887354776e-05 2023-01-24 08:46:05.571821: step: 1712/530, loss: 0.00271967938169837 2023-01-24 08:46:06.599025: step: 1716/530, loss: 0.0005915315705351532 2023-01-24 08:46:07.662193: step: 1720/530, loss: 8.707438973942772e-05 2023-01-24 08:46:08.720749: step: 1724/530, loss: 0.001272302703000605 2023-01-24 08:46:09.767741: step: 1728/530, loss: 0.00048801334924064577 2023-01-24 08:46:10.808260: step: 1732/530, loss: 0.0005772834992967546 2023-01-24 08:46:11.867853: step: 1736/530, loss: 0.0004037150356452912 2023-01-24 08:46:12.911794: step: 1740/530, loss: 0.0006433365633711219 2023-01-24 08:46:13.940041: step: 1744/530, loss: 0.0009077931172214448 2023-01-24 08:46:14.990077: step: 1748/530, loss: 0.00032269800431095064 2023-01-24 08:46:16.026733: step: 1752/530, loss: 0.0003715303319040686 2023-01-24 08:46:17.075152: step: 1756/530, loss: 0.032732587307691574 2023-01-24 08:46:18.119418: step: 1760/530, loss: 0.0027986119966953993 2023-01-24 08:46:19.178210: step: 1764/530, loss: 0.00505076115950942 2023-01-24 08:46:20.221681: step: 1768/530, loss: 0.0034972019493579865 2023-01-24 08:46:21.283223: step: 1772/530, loss: 0.010578633286058903 2023-01-24 08:46:22.339569: step: 1776/530, loss: 0.003582973964512348 2023-01-24 08:46:23.429188: step: 1780/530, loss: 0.006506519857794046 2023-01-24 08:46:24.473716: step: 1784/530, loss: 0.0018352270126342773 2023-01-24 08:46:25.520665: step: 1788/530, loss: 0.0013394705019891262 2023-01-24 08:46:26.572152: step: 1792/530, loss: 0.0013189377496019006 2023-01-24 08:46:27.604662: step: 1796/530, loss: 0.00013744382886216044 2023-01-24 08:46:28.651997: step: 1800/530, loss: 0.005391889251768589 2023-01-24 08:46:29.696681: step: 1804/530, loss: 0.011479792185127735 2023-01-24 08:46:30.738090: step: 1808/530, loss: 5.284298458718695e-05 2023-01-24 08:46:31.778500: step: 1812/530, loss: 0.0025754254311323166 2023-01-24 08:46:32.804484: step: 1816/530, loss: 0.00801665149629116 2023-01-24 08:46:33.880839: step: 1820/530, loss: 0.0005745472153648734 2023-01-24 08:46:34.943909: step: 1824/530, loss: 0.006258128676563501 2023-01-24 08:46:35.996738: step: 1828/530, loss: 0.0145878279581666 2023-01-24 08:46:37.078647: step: 1832/530, loss: 0.004535536281764507 2023-01-24 08:46:38.117568: step: 1836/530, loss: 0.0010435067815706134 2023-01-24 08:46:39.158950: step: 1840/530, loss: 0.0018674947787076235 2023-01-24 08:46:40.205951: step: 1844/530, loss: 0.014176220633089542 2023-01-24 08:46:41.252584: step: 1848/530, loss: 0.0014461047248914838 2023-01-24 08:46:42.300370: step: 1852/530, loss: 0.004165360704064369 2023-01-24 08:46:43.332334: step: 1856/530, loss: 0.005053696688264608 2023-01-24 08:46:44.386939: step: 1860/530, loss: 1.737669481371995e-05 2023-01-24 08:46:45.418485: step: 1864/530, loss: 0.0047654276713728905 2023-01-24 08:46:46.451650: step: 1868/530, loss: 0.0006152056157588959 2023-01-24 08:46:47.486312: step: 1872/530, loss: 0.0002627117501106113 2023-01-24 08:46:48.542666: step: 1876/530, loss: 0.0010582341346889734 2023-01-24 08:46:49.593416: step: 1880/530, loss: 1.377479321718056e-07 2023-01-24 08:46:50.637517: step: 1884/530, loss: 6.542880328197498e-06 2023-01-24 08:46:51.658803: step: 1888/530, loss: 0.01235949993133545 2023-01-24 08:46:52.696484: step: 1892/530, loss: 0.00010742411541286856 2023-01-24 08:46:53.740644: step: 1896/530, loss: 0.00777466082945466 2023-01-24 08:46:54.767434: step: 1900/530, loss: 0.0027790055610239506 2023-01-24 08:46:55.812571: step: 1904/530, loss: 0.0025619480293244123 2023-01-24 08:46:56.852598: step: 1908/530, loss: 0.0007179515087045729 2023-01-24 08:46:57.891413: step: 1912/530, loss: 0.0018334188498556614 2023-01-24 08:46:58.926590: step: 1916/530, loss: 0.0034390143118798733 2023-01-24 08:46:59.976114: step: 1920/530, loss: 0.0011282347841188312 2023-01-24 08:47:01.021436: step: 1924/530, loss: 0.020094776526093483 2023-01-24 08:47:02.048507: step: 1928/530, loss: 0.00018194942094851285 2023-01-24 08:47:03.096042: step: 1932/530, loss: 1.9138960851705633e-05 2023-01-24 08:47:04.147629: step: 1936/530, loss: 0.0009774244390428066 2023-01-24 08:47:05.178590: step: 1940/530, loss: 0.0002496328379493207 2023-01-24 08:47:06.208590: step: 1944/530, loss: 0.017487987875938416 2023-01-24 08:47:07.258783: step: 1948/530, loss: 0.000737216672860086 2023-01-24 08:47:08.307070: step: 1952/530, loss: 0.016520904377102852 2023-01-24 08:47:09.371790: step: 1956/530, loss: 0.01425775233656168 2023-01-24 08:47:10.413526: step: 1960/530, loss: 1.270201028091833e-05 2023-01-24 08:47:11.474993: step: 1964/530, loss: 0.050946805626153946 2023-01-24 08:47:12.520185: step: 1968/530, loss: 0.007083595730364323 2023-01-24 08:47:13.584230: step: 1972/530, loss: 0.00011740416084649041 2023-01-24 08:47:14.631991: step: 1976/530, loss: 0.0014218618161976337 2023-01-24 08:47:15.668271: step: 1980/530, loss: 0.00011127001198474318 2023-01-24 08:47:16.711399: step: 1984/530, loss: 0.0009608388063497841 2023-01-24 08:47:17.747948: step: 1988/530, loss: 0.017436038702726364 2023-01-24 08:47:18.809387: step: 1992/530, loss: 0.0 2023-01-24 08:47:19.861251: step: 1996/530, loss: 0.005568573717027903 2023-01-24 08:47:20.895737: step: 2000/530, loss: 0.005121793132275343 2023-01-24 08:47:21.925457: step: 2004/530, loss: 0.001218840479850769 2023-01-24 08:47:22.967184: step: 2008/530, loss: 0.0003862846933770925 2023-01-24 08:47:23.993319: step: 2012/530, loss: 0.0006322905537672341 2023-01-24 08:47:25.032992: step: 2016/530, loss: 0.0014480248792096972 2023-01-24 08:47:26.093728: step: 2020/530, loss: 0.0038923274260014296 2023-01-24 08:47:27.140125: step: 2024/530, loss: 0.0040010022930800915 2023-01-24 08:47:28.174176: step: 2028/530, loss: 0.011293146759271622 2023-01-24 08:47:29.223416: step: 2032/530, loss: 0.0035857250913977623 2023-01-24 08:47:30.260248: step: 2036/530, loss: 0.0004058224440086633 2023-01-24 08:47:31.306683: step: 2040/530, loss: 0.0037106696981936693 2023-01-24 08:47:32.340355: step: 2044/530, loss: 0.00032576799276284873 2023-01-24 08:47:33.392526: step: 2048/530, loss: 1.199520482941807e-07 2023-01-24 08:47:34.435736: step: 2052/530, loss: 0.0009816251695156097 2023-01-24 08:47:35.479957: step: 2056/530, loss: 0.0001089588986360468 2023-01-24 08:47:36.527320: step: 2060/530, loss: 0.0029616826213896275 2023-01-24 08:47:37.563829: step: 2064/530, loss: 0.02165575884282589 2023-01-24 08:47:38.598791: step: 2068/530, loss: 0.0021646814420819283 2023-01-24 08:47:39.633476: step: 2072/530, loss: 0.0010730999056249857 2023-01-24 08:47:40.671221: step: 2076/530, loss: 0.0001871632266556844 2023-01-24 08:47:41.704031: step: 2080/530, loss: 0.0014424140099436045 2023-01-24 08:47:42.742968: step: 2084/530, loss: 0.0009144091163761914 2023-01-24 08:47:43.792188: step: 2088/530, loss: 0.002994795562699437 2023-01-24 08:47:44.837879: step: 2092/530, loss: 0.00024580780882388353 2023-01-24 08:47:45.873399: step: 2096/530, loss: 0.00043128005927428603 2023-01-24 08:47:46.903061: step: 2100/530, loss: 0.00038046660483814776 2023-01-24 08:47:47.947487: step: 2104/530, loss: 0.006865813862532377 2023-01-24 08:47:48.987663: step: 2108/530, loss: 3.880581971316133e-06 2023-01-24 08:47:50.026081: step: 2112/530, loss: 0.0022267343010753393 2023-01-24 08:47:51.053566: step: 2116/530, loss: 0.02534710057079792 2023-01-24 08:47:52.078869: step: 2120/530, loss: 0.0003853960952255875 ================================================== Loss: 0.003 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3691397550111359, 'r': 0.3145042694497154, 'f1': 0.3396388319672131}, 'combined': 0.2502601919758412, 'stategy': 1, 'epoch': 19} Test Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37510459577985067, 'r': 0.3916533279466088, 'f1': 0.38320037842258126}, 'combined': 0.2970261306433405, 'stategy': 1, 'epoch': 19} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3892996341075406, 'r': 0.3316803334236921, 'f1': 0.3581875731850117}, 'combined': 0.26392768550474544, 'stategy': 1, 'epoch': 19} Test Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3732746852014944, 'r': 0.37053001839854227, 'f1': 0.37189728783912734}, 'combined': 0.2882648833968356, 'stategy': 1, 'epoch': 19} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.38297703353635176, 'r': 0.33283393047371745, 'f1': 0.35614920073025197}, 'combined': 0.26242572685386983, 'stategy': 1, 'epoch': 19} Test Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.36358499223691937, 'r': 0.36391916961949006, 'f1': 0.3637520041763943}, 'combined': 0.2819513142419899, 'stategy': 1, 'epoch': 19} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 19} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.475, 'r': 0.41304347826086957, 'f1': 0.44186046511627913}, 'combined': 0.22093023255813957, 'stategy': 1, 'epoch': 19} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 19} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.37786862527716186, 'r': 0.32337523719165084, 'f1': 0.3485046012269939}, 'combined': 0.2567928640619955, 'stategy': 1, 'epoch': 12} Test for Chinese: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.37377987703702326, 'r': 0.38889597500543227, 'f1': 0.3811881268521715}, 'combined': 0.2954663949763244, 'stategy': 1, 'epoch': 12} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.4230769230769231, 'r': 0.3142857142857143, 'f1': 0.360655737704918}, 'combined': 0.24043715846994532, 'stategy': 1, 'epoch': 12} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3861756951102589, 'r': 0.32755319869883437, 'f1': 0.3544569521853916}, 'combined': 0.2611788068734464, 'stategy': 1, 'epoch': 2} Test for Korean: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3702915838099576, 'r': 0.3696109007514834, 'f1': 0.36995092917903766}, 'combined': 0.28675622261724454, 'stategy': 1, 'epoch': 2} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.5125, 'r': 0.44565217391304346, 'f1': 0.47674418604651164}, 'combined': 0.23837209302325582, 'stategy': 1, 'epoch': 2} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3851604396498889, 'r': 0.33473146368054857, 'f1': 0.3581796575830439}, 'combined': 0.26392185295592707, 'stategy': 1, 'epoch': 15} Test for Russian: {'template': {'p': 0.9418604651162791, 'r': 0.6585365853658537, 'f1': 0.7751196172248804}, 'slot': {'p': 0.3640887768447368, 'r': 0.3620809343253724, 'f1': 0.3630820797659034}, 'combined': 0.28143204268936056, 'stategy': 1, 'epoch': 15} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.6486842105263158, 'r': 0.22368421052631576, 'f1': 0.3326585695006748}, 'combined': 0.22177237966711652, 'stategy': 1, 'epoch': 15}