Command that produces this log: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 ---------------------------------------------------------------------------------------------------- > trainable params: >>> xlmr.embeddings.word_embeddings.weight: torch.Size([250002, 1024]) >>> xlmr.embeddings.position_embeddings.weight: torch.Size([514, 1024]) >>> xlmr.embeddings.token_type_embeddings.weight: torch.Size([1, 1024]) >>> xlmr.embeddings.LayerNorm.weight: torch.Size([1024]) >>> xlmr.embeddings.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.0.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.0.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.0.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.0.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.0.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.0.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.0.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.0.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.0.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.0.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.1.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.1.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.1.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.1.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.1.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.1.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.1.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.1.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.1.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.1.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.2.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.2.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.2.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.2.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.2.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.2.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.2.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.2.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.2.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.2.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.3.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.3.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.3.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.3.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.3.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.3.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.3.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.3.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.3.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.3.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.4.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.4.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.4.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.4.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.4.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.4.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.4.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.4.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.4.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.4.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.5.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.5.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.5.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.5.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.5.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.5.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.5.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.5.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.5.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.5.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.6.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.6.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.6.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.6.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.6.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.6.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.6.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.6.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.6.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.6.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.7.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.7.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.7.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.7.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.7.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.7.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.7.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.7.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.7.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.7.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.8.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.8.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.8.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.8.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.8.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.8.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.8.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.8.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.8.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.8.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.9.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.9.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.9.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.9.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.9.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.9.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.9.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.9.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.9.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.9.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.10.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.10.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.10.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.10.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.10.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.10.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.10.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.10.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.10.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.10.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.11.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.11.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.11.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.11.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.11.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.11.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.11.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.11.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.11.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.11.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.12.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.12.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.12.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.12.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.12.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.12.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.12.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.12.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.12.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.12.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.13.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.13.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.13.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.13.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.13.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.13.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.13.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.13.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.13.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.13.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.14.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.14.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.14.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.14.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.14.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.14.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.14.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.14.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.14.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.14.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.15.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.15.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.15.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.15.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.15.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.15.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.15.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.15.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.15.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.15.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.16.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.16.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.16.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.16.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.16.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.16.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.16.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.16.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.16.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.16.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.17.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.17.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.17.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.17.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.17.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.17.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.17.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.17.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.17.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.17.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.18.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.18.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.18.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.18.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.18.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.18.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.18.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.18.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.18.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.18.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.19.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.19.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.19.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.19.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.19.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.19.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.19.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.19.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.19.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.19.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.20.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.20.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.20.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.20.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.20.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.20.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.20.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.20.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.20.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.20.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.21.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.21.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.21.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.21.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.21.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.21.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.21.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.21.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.21.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.21.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.22.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.22.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.22.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.22.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.22.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.22.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.22.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.22.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.22.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.22.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.self.query.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.23.attention.self.query.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.self.key.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.23.attention.self.key.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.self.value.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.23.attention.self.value.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.output.dense.weight: torch.Size([1024, 1024]) >>> xlmr.encoder.layer.23.attention.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.23.attention.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.intermediate.dense.weight: torch.Size([4096, 1024]) >>> xlmr.encoder.layer.23.intermediate.dense.bias: torch.Size([4096]) >>> xlmr.encoder.layer.23.output.dense.weight: torch.Size([1024, 4096]) >>> xlmr.encoder.layer.23.output.dense.bias: torch.Size([1024]) >>> xlmr.encoder.layer.23.output.LayerNorm.weight: torch.Size([1024]) >>> xlmr.encoder.layer.23.output.LayerNorm.bias: torch.Size([1024]) >>> xlmr.pooler.dense.weight: torch.Size([1024, 1024]) >>> xlmr.pooler.dense.bias: torch.Size([1024]) >>> type_embedding.weight: torch.Size([123, 100]) >>> trans_rep.weight: torch.Size([1024, 1124]) >>> trans_rep.bias: torch.Size([1024]) >>> coref_type_ffn.weight: torch.Size([3, 4096]) >>> coref_type_ffn.bias: torch.Size([3]) n_trainable_params: 561067023, n_nontrainable_params: 0 ---------------------------------------------------------------------------------------------------- ****************************** Epoch: 0 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 17:00:24.015955: step: 4/530, loss: 0.011467501521110535 2023-01-22 17:00:25.102176: step: 8/530, loss: 0.014485727064311504 2023-01-22 17:00:26.170014: step: 12/530, loss: 0.02021254412829876 2023-01-22 17:00:27.248254: step: 16/530, loss: 0.014981972053647041 2023-01-22 17:00:28.333356: step: 20/530, loss: 0.013090364634990692 2023-01-22 17:00:29.399388: step: 24/530, loss: 0.021329078823328018 2023-01-22 17:00:30.484770: step: 28/530, loss: 0.015183400362730026 2023-01-22 17:00:31.622160: step: 32/530, loss: 0.03845686465501785 2023-01-22 17:00:32.705340: step: 36/530, loss: 0.04434531182050705 2023-01-22 17:00:33.808622: step: 40/530, loss: 0.03982289880514145 2023-01-22 17:00:34.911007: step: 44/530, loss: 0.015156283974647522 2023-01-22 17:00:36.007477: step: 48/530, loss: 0.03714491426944733 2023-01-22 17:00:37.097299: step: 52/530, loss: 0.04233403503894806 2023-01-22 17:00:38.186549: step: 56/530, loss: 0.08096525073051453 2023-01-22 17:00:39.277141: step: 60/530, loss: 0.027153439819812775 2023-01-22 17:00:40.391809: step: 64/530, loss: 0.04382731020450592 2023-01-22 17:00:41.507384: step: 68/530, loss: 0.025821052491664886 2023-01-22 17:00:42.583551: step: 72/530, loss: 0.05722580477595329 2023-01-22 17:00:43.652861: step: 76/530, loss: 0.014848173595964909 2023-01-22 17:00:44.781754: step: 80/530, loss: 0.03056863322854042 2023-01-22 17:00:45.878529: step: 84/530, loss: 0.02284967713057995 2023-01-22 17:00:46.965543: step: 88/530, loss: 0.01969929039478302 2023-01-22 17:00:48.058850: step: 92/530, loss: 0.027563055977225304 2023-01-22 17:00:49.145589: step: 96/530, loss: 0.04755375534296036 2023-01-22 17:00:50.230242: step: 100/530, loss: 0.017107253894209862 2023-01-22 17:00:51.311419: step: 104/530, loss: 0.01470103021711111 2023-01-22 17:00:52.412741: step: 108/530, loss: 0.05741553008556366 2023-01-22 17:00:53.488517: step: 112/530, loss: 0.05990713834762573 2023-01-22 17:00:54.552926: step: 116/530, loss: 0.010556021705269814 2023-01-22 17:00:55.649600: step: 120/530, loss: 0.022959887981414795 2023-01-22 17:00:56.741027: step: 124/530, loss: 0.01252189464867115 2023-01-22 17:00:57.822363: step: 128/530, loss: 0.019330689683556557 2023-01-22 17:00:58.885714: step: 132/530, loss: 0.0162226390093565 2023-01-22 17:00:59.972875: step: 136/530, loss: 0.061574190855026245 2023-01-22 17:01:01.081701: step: 140/530, loss: 0.027933664619922638 2023-01-22 17:01:02.207181: step: 144/530, loss: 0.015939706936478615 2023-01-22 17:01:03.309133: step: 148/530, loss: 0.08044497668743134 2023-01-22 17:01:04.393554: step: 152/530, loss: 0.03180399909615517 2023-01-22 17:01:05.474652: step: 156/530, loss: 0.016494816169142723 2023-01-22 17:01:06.547781: step: 160/530, loss: 0.01672021672129631 2023-01-22 17:01:07.634516: step: 164/530, loss: 0.023755937814712524 2023-01-22 17:01:08.714288: step: 168/530, loss: 0.014235143549740314 2023-01-22 17:01:09.800897: step: 172/530, loss: 0.018145011737942696 2023-01-22 17:01:10.905742: step: 176/530, loss: 0.019230917096138 2023-01-22 17:01:11.995675: step: 180/530, loss: 0.032779112458229065 2023-01-22 17:01:13.074852: step: 184/530, loss: 0.0101863332092762 2023-01-22 17:01:14.154958: step: 188/530, loss: 0.0157422237098217 2023-01-22 17:01:15.252923: step: 192/530, loss: 0.006937301717698574 2023-01-22 17:01:16.352300: step: 196/530, loss: 0.05183155834674835 2023-01-22 17:01:17.427820: step: 200/530, loss: 0.05829997733235359 2023-01-22 17:01:18.532384: step: 204/530, loss: 0.010822414420545101 2023-01-22 17:01:19.613649: step: 208/530, loss: 0.05365070700645447 2023-01-22 17:01:20.709775: step: 212/530, loss: 0.011589542962610722 2023-01-22 17:01:21.801991: step: 216/530, loss: 0.018661417067050934 2023-01-22 17:01:22.888113: step: 220/530, loss: 0.0364769771695137 2023-01-22 17:01:23.968460: step: 224/530, loss: 0.05967678129673004 2023-01-22 17:01:25.055185: step: 228/530, loss: 0.02332700416445732 2023-01-22 17:01:26.132098: step: 232/530, loss: 0.01643318310379982 2023-01-22 17:01:27.204250: step: 236/530, loss: 0.01622905768454075 2023-01-22 17:01:28.276123: step: 240/530, loss: 0.014846382662653923 2023-01-22 17:01:29.372476: step: 244/530, loss: 0.021980928257107735 2023-01-22 17:01:30.460451: step: 248/530, loss: 0.04995280131697655 2023-01-22 17:01:31.553455: step: 252/530, loss: 0.008162538520991802 2023-01-22 17:01:32.651957: step: 256/530, loss: 0.013937925919890404 2023-01-22 17:01:33.721480: step: 260/530, loss: 0.021493133157491684 2023-01-22 17:01:34.816496: step: 264/530, loss: 0.011338409967720509 2023-01-22 17:01:35.924344: step: 268/530, loss: 0.012696531601250172 2023-01-22 17:01:37.065660: step: 272/530, loss: 0.011421488597989082 2023-01-22 17:01:38.154752: step: 276/530, loss: 0.03716360032558441 2023-01-22 17:01:39.236582: step: 280/530, loss: 0.014100338332355022 2023-01-22 17:01:40.349101: step: 284/530, loss: 0.011375023052096367 2023-01-22 17:01:41.417082: step: 288/530, loss: 0.008520003408193588 2023-01-22 17:01:42.559263: step: 292/530, loss: 0.010339656844735146 2023-01-22 17:01:43.629959: step: 296/530, loss: 0.012516725808382034 2023-01-22 17:01:44.699839: step: 300/530, loss: 0.009284278377890587 2023-01-22 17:01:45.796294: step: 304/530, loss: 0.013679335825145245 2023-01-22 17:01:46.882054: step: 308/530, loss: 0.013499300926923752 2023-01-22 17:01:48.011792: step: 312/530, loss: 0.02213696762919426 2023-01-22 17:01:49.083238: step: 316/530, loss: 0.0557267889380455 2023-01-22 17:01:50.183030: step: 320/530, loss: 0.016188064590096474 2023-01-22 17:01:51.271100: step: 324/530, loss: 0.010495403781533241 2023-01-22 17:01:52.394800: step: 328/530, loss: 0.05542273446917534 2023-01-22 17:01:53.472884: step: 332/530, loss: 0.018293123692274094 2023-01-22 17:01:54.560232: step: 336/530, loss: 0.047707267105579376 2023-01-22 17:01:55.645496: step: 340/530, loss: 0.04012608528137207 2023-01-22 17:01:56.735930: step: 344/530, loss: 0.010144260711967945 2023-01-22 17:01:57.848731: step: 348/530, loss: 0.0537719689309597 2023-01-22 17:01:58.955865: step: 352/530, loss: 0.030783772468566895 2023-01-22 17:02:00.052591: step: 356/530, loss: 0.013567428104579449 2023-01-22 17:02:01.131555: step: 360/530, loss: 0.015386553481221199 2023-01-22 17:02:02.223826: step: 364/530, loss: 0.048650193959474564 2023-01-22 17:02:03.312652: step: 368/530, loss: 0.05116035416722298 2023-01-22 17:02:04.382307: step: 372/530, loss: 0.040121253579854965 2023-01-22 17:02:05.468901: step: 376/530, loss: 0.003961693029850721 2023-01-22 17:02:06.540867: step: 380/530, loss: 0.024890054017305374 2023-01-22 17:02:07.639557: step: 384/530, loss: 0.009636261500418186 2023-01-22 17:02:08.753276: step: 388/530, loss: 0.050982046872377396 2023-01-22 17:02:09.837466: step: 392/530, loss: 0.010965893976390362 2023-01-22 17:02:10.930736: step: 396/530, loss: 0.018137114122509956 2023-01-22 17:02:12.032001: step: 400/530, loss: 0.03513287007808685 2023-01-22 17:02:13.112038: step: 404/530, loss: 0.009723388589918613 2023-01-22 17:02:14.225397: step: 408/530, loss: 0.009628687053918839 2023-01-22 17:02:15.336851: step: 412/530, loss: 0.011322302743792534 2023-01-22 17:02:16.465855: step: 416/530, loss: 0.015155560337007046 2023-01-22 17:02:17.557172: step: 420/530, loss: 0.05574380233883858 2023-01-22 17:02:18.629023: step: 424/530, loss: 0.031009312719106674 2023-01-22 17:02:19.726151: step: 428/530, loss: 0.009676420129835606 2023-01-22 17:02:20.813926: step: 432/530, loss: 0.01221969723701477 2023-01-22 17:02:21.919730: step: 436/530, loss: 0.017525238916277885 2023-01-22 17:02:23.003418: step: 440/530, loss: 0.021521715447306633 2023-01-22 17:02:24.065476: step: 444/530, loss: 0.05986635386943817 2023-01-22 17:02:25.149949: step: 448/530, loss: 0.012541204690933228 2023-01-22 17:02:26.236535: step: 452/530, loss: 0.020448947325348854 2023-01-22 17:02:27.336311: step: 456/530, loss: 0.009558239951729774 2023-01-22 17:02:28.457277: step: 460/530, loss: 0.05682926997542381 2023-01-22 17:02:29.540713: step: 464/530, loss: 0.01390343252569437 2023-01-22 17:02:30.653668: step: 468/530, loss: 0.011025974527001381 2023-01-22 17:02:31.717844: step: 472/530, loss: 0.01932631805539131 2023-01-22 17:02:32.807724: step: 476/530, loss: 0.035168226808309555 2023-01-22 17:02:33.908327: step: 480/530, loss: 0.015916112810373306 2023-01-22 17:02:35.011094: step: 484/530, loss: 0.033374249935150146 2023-01-22 17:02:36.089673: step: 488/530, loss: 0.07296033948659897 2023-01-22 17:02:37.206046: step: 492/530, loss: 0.037825677543878555 2023-01-22 17:02:38.288195: step: 496/530, loss: 0.014952165074646473 2023-01-22 17:02:39.413182: step: 500/530, loss: 0.005028252024203539 2023-01-22 17:02:40.513840: step: 504/530, loss: 0.07204002141952515 2023-01-22 17:02:41.595685: step: 508/530, loss: 0.0398731455206871 2023-01-22 17:02:42.675258: step: 512/530, loss: 0.025840265676379204 2023-01-22 17:02:43.757009: step: 516/530, loss: 0.018875647336244583 2023-01-22 17:02:44.847654: step: 520/530, loss: 0.008626456372439861 2023-01-22 17:02:45.915934: step: 524/530, loss: 0.021149303764104843 2023-01-22 17:02:47.017274: step: 528/530, loss: 0.062265027314424515 2023-01-22 17:02:48.113952: step: 532/530, loss: 0.01840990222990513 2023-01-22 17:02:49.220624: step: 536/530, loss: 0.008780206553637981 2023-01-22 17:02:50.311682: step: 540/530, loss: 0.03259558603167534 2023-01-22 17:02:51.398115: step: 544/530, loss: 0.051471538841724396 2023-01-22 17:02:52.480377: step: 548/530, loss: 0.014503030106425285 2023-01-22 17:02:53.585574: step: 552/530, loss: 0.01766877993941307 2023-01-22 17:02:54.678943: step: 556/530, loss: 0.011895626783370972 2023-01-22 17:02:55.791080: step: 560/530, loss: 0.01722758449614048 2023-01-22 17:02:56.887474: step: 564/530, loss: 0.047568801790475845 2023-01-22 17:02:57.987176: step: 568/530, loss: 0.02621176652610302 2023-01-22 17:02:59.093072: step: 572/530, loss: 0.04431449621915817 2023-01-22 17:03:00.195843: step: 576/530, loss: 0.007582752034068108 2023-01-22 17:03:01.259243: step: 580/530, loss: 0.009157495573163033 2023-01-22 17:03:02.362404: step: 584/530, loss: 0.023113993927836418 2023-01-22 17:03:03.486842: step: 588/530, loss: 0.014447697438299656 2023-01-22 17:03:04.606206: step: 592/530, loss: 0.010446269996464252 2023-01-22 17:03:05.722222: step: 596/530, loss: 0.053101733326911926 2023-01-22 17:03:06.817085: step: 600/530, loss: 0.02219861000776291 2023-01-22 17:03:07.931669: step: 604/530, loss: 0.00992828793823719 2023-01-22 17:03:09.026827: step: 608/530, loss: 0.04490850865840912 2023-01-22 17:03:10.152108: step: 612/530, loss: 0.011792284436523914 2023-01-22 17:03:11.241427: step: 616/530, loss: 0.009993292391300201 2023-01-22 17:03:12.363113: step: 620/530, loss: 0.010060536675155163 2023-01-22 17:03:13.425730: step: 624/530, loss: 0.050234872847795486 2023-01-22 17:03:14.540339: step: 628/530, loss: 0.019075261428952217 2023-01-22 17:03:15.607952: step: 632/530, loss: 0.016102146357297897 2023-01-22 17:03:16.714022: step: 636/530, loss: 0.010150427930057049 2023-01-22 17:03:17.821830: step: 640/530, loss: 0.009431491605937481 2023-01-22 17:03:18.914340: step: 644/530, loss: 0.009330429136753082 2023-01-22 17:03:20.023958: step: 648/530, loss: 0.013603986240923405 2023-01-22 17:03:21.125365: step: 652/530, loss: 0.007064360659569502 2023-01-22 17:03:22.212082: step: 656/530, loss: 0.010857746005058289 2023-01-22 17:03:23.292382: step: 660/530, loss: 0.010749378241598606 2023-01-22 17:03:24.378142: step: 664/530, loss: 0.03511538356542587 2023-01-22 17:03:25.478374: step: 668/530, loss: 0.00687797786667943 2023-01-22 17:03:26.593556: step: 672/530, loss: 0.016551679000258446 2023-01-22 17:03:27.705558: step: 676/530, loss: 0.008278360590338707 2023-01-22 17:03:28.823728: step: 680/530, loss: 0.013280468992888927 2023-01-22 17:03:29.921711: step: 684/530, loss: 0.052824780344963074 2023-01-22 17:03:31.033772: step: 688/530, loss: 0.04155043512582779 2023-01-22 17:03:32.126972: step: 692/530, loss: 0.009191321209073067 2023-01-22 17:03:33.214584: step: 696/530, loss: 0.00856541283428669 2023-01-22 17:03:34.311209: step: 700/530, loss: 0.007178144529461861 2023-01-22 17:03:35.403426: step: 704/530, loss: 0.005115367006510496 2023-01-22 17:03:36.491457: step: 708/530, loss: 0.011410994455218315 2023-01-22 17:03:37.583536: step: 712/530, loss: 0.017877524718642235 2023-01-22 17:03:38.701546: step: 716/530, loss: 0.03520526736974716 2023-01-22 17:03:39.789073: step: 720/530, loss: 0.001963396556675434 2023-01-22 17:03:40.873304: step: 724/530, loss: 0.0020664336625486612 2023-01-22 17:03:41.953407: step: 728/530, loss: 0.017566706985235214 2023-01-22 17:03:43.059562: step: 732/530, loss: 0.029703212901949883 2023-01-22 17:03:44.160697: step: 736/530, loss: 0.015074805356562138 2023-01-22 17:03:45.249329: step: 740/530, loss: 0.05114130303263664 2023-01-22 17:03:46.328847: step: 744/530, loss: 0.06399284303188324 2023-01-22 17:03:47.426060: step: 748/530, loss: 0.018372777849435806 2023-01-22 17:03:48.500994: step: 752/530, loss: 0.010410459712147713 2023-01-22 17:03:49.610526: step: 756/530, loss: 0.06911301612854004 2023-01-22 17:03:50.702629: step: 760/530, loss: 0.004994244780391455 2023-01-22 17:03:51.799705: step: 764/530, loss: 0.03868423029780388 2023-01-22 17:03:52.893268: step: 768/530, loss: 0.008029693737626076 2023-01-22 17:03:53.975128: step: 772/530, loss: 0.01988298073410988 2023-01-22 17:03:55.084791: step: 776/530, loss: 0.018982091918587685 2023-01-22 17:03:56.182117: step: 780/530, loss: 0.035353220999240875 2023-01-22 17:03:57.267363: step: 784/530, loss: 0.006461441516876221 2023-01-22 17:03:58.367802: step: 788/530, loss: 0.008811785839498043 2023-01-22 17:03:59.463658: step: 792/530, loss: 0.049760594964027405 2023-01-22 17:04:00.571648: step: 796/530, loss: 0.011513302102684975 2023-01-22 17:04:01.671827: step: 800/530, loss: 0.007470728363841772 2023-01-22 17:04:02.781355: step: 804/530, loss: 0.03038622811436653 2023-01-22 17:04:03.889336: step: 808/530, loss: 0.02139291912317276 2023-01-22 17:04:04.998135: step: 812/530, loss: 0.039839550852775574 2023-01-22 17:04:06.104112: step: 816/530, loss: 0.007161576300859451 2023-01-22 17:04:07.199394: step: 820/530, loss: 0.014159068465232849 2023-01-22 17:04:08.301123: step: 824/530, loss: 0.019974643364548683 2023-01-22 17:04:09.395923: step: 828/530, loss: 0.013316066935658455 2023-01-22 17:04:10.495258: step: 832/530, loss: 0.022347649559378624 2023-01-22 17:04:11.597917: step: 836/530, loss: 0.03583676740527153 2023-01-22 17:04:12.701792: step: 840/530, loss: 0.012776310555636883 2023-01-22 17:04:13.792480: step: 844/530, loss: 0.012068641372025013 2023-01-22 17:04:14.913979: step: 848/530, loss: 0.013448876328766346 2023-01-22 17:04:16.053321: step: 852/530, loss: 0.018185192719101906 2023-01-22 17:04:17.146097: step: 856/530, loss: 0.01383522991091013 2023-01-22 17:04:18.247478: step: 860/530, loss: 0.04743143916130066 2023-01-22 17:04:19.333116: step: 864/530, loss: 0.01881537400186062 2023-01-22 17:04:20.435562: step: 868/530, loss: 0.013506807386875153 2023-01-22 17:04:21.530128: step: 872/530, loss: 0.007484327536076307 2023-01-22 17:04:22.633547: step: 876/530, loss: 0.007950818166136742 2023-01-22 17:04:23.718681: step: 880/530, loss: 0.009719445370137691 2023-01-22 17:04:24.830363: step: 884/530, loss: 0.014991038478910923 2023-01-22 17:04:25.943206: step: 888/530, loss: 0.008596524596214294 2023-01-22 17:04:27.044916: step: 892/530, loss: 0.013084711506962776 2023-01-22 17:04:28.136139: step: 896/530, loss: 0.014744004234671593 2023-01-22 17:04:29.247025: step: 900/530, loss: 0.023029623553156853 2023-01-22 17:04:30.334492: step: 904/530, loss: 0.019510850310325623 2023-01-22 17:04:31.442042: step: 908/530, loss: 0.009823204018175602 2023-01-22 17:04:32.530986: step: 912/530, loss: 0.009708911180496216 2023-01-22 17:04:33.623218: step: 916/530, loss: 0.004477589391171932 2023-01-22 17:04:34.738793: step: 920/530, loss: 0.017420802265405655 2023-01-22 17:04:35.828338: step: 924/530, loss: 0.008795643225312233 2023-01-22 17:04:36.932677: step: 928/530, loss: 0.02314850687980652 2023-01-22 17:04:38.015675: step: 932/530, loss: 0.028379026800394058 2023-01-22 17:04:39.112782: step: 936/530, loss: 0.01130882278084755 2023-01-22 17:04:40.212899: step: 940/530, loss: 0.007444203831255436 2023-01-22 17:04:41.316291: step: 944/530, loss: 0.012078704312443733 2023-01-22 17:04:42.415378: step: 948/530, loss: 0.013832642696797848 2023-01-22 17:04:43.522628: step: 952/530, loss: 0.008240267634391785 2023-01-22 17:04:44.620156: step: 956/530, loss: 0.007556191645562649 2023-01-22 17:04:45.716566: step: 960/530, loss: 0.025990257039666176 2023-01-22 17:04:46.828877: step: 964/530, loss: 0.014192350208759308 2023-01-22 17:04:47.924667: step: 968/530, loss: 0.011100104078650475 2023-01-22 17:04:49.032201: step: 972/530, loss: 0.006428951863199472 2023-01-22 17:04:50.107684: step: 976/530, loss: 0.05296020209789276 2023-01-22 17:04:51.204060: step: 980/530, loss: 0.009439952671527863 2023-01-22 17:04:52.345041: step: 984/530, loss: 0.009728724136948586 2023-01-22 17:04:53.422012: step: 988/530, loss: 0.04730822518467903 2023-01-22 17:04:54.542976: step: 992/530, loss: 0.052044834941625595 2023-01-22 17:04:55.627366: step: 996/530, loss: 0.02639291062951088 2023-01-22 17:04:56.705265: step: 1000/530, loss: 0.008362848311662674 2023-01-22 17:04:57.789358: step: 1004/530, loss: 0.013744687661528587 2023-01-22 17:04:58.856222: step: 1008/530, loss: 0.005262541584670544 2023-01-22 17:04:59.970162: step: 1012/530, loss: 0.011320390738546848 2023-01-22 17:05:01.034853: step: 1016/530, loss: 0.02581048011779785 2023-01-22 17:05:02.127773: step: 1020/530, loss: 0.011062169447541237 2023-01-22 17:05:03.204577: step: 1024/530, loss: 0.026677079498767853 2023-01-22 17:05:04.306039: step: 1028/530, loss: 0.0048840949311852455 2023-01-22 17:05:05.417851: step: 1032/530, loss: 0.011815915815532207 2023-01-22 17:05:06.491213: step: 1036/530, loss: 0.01807076670229435 2023-01-22 17:05:07.595670: step: 1040/530, loss: 0.041602972894907 2023-01-22 17:05:08.685712: step: 1044/530, loss: 0.05111640691757202 2023-01-22 17:05:09.770323: step: 1048/530, loss: 0.007702759001404047 2023-01-22 17:05:10.884694: step: 1052/530, loss: 0.04642478749155998 2023-01-22 17:05:11.978683: step: 1056/530, loss: 0.009657839313149452 2023-01-22 17:05:13.069422: step: 1060/530, loss: 0.008408733643591404 2023-01-22 17:05:14.160204: step: 1064/530, loss: 0.02986236847937107 2023-01-22 17:05:15.253688: step: 1068/530, loss: 0.009164144285023212 2023-01-22 17:05:16.342967: step: 1072/530, loss: 0.009531466290354729 2023-01-22 17:05:17.438203: step: 1076/530, loss: 0.006760431919246912 2023-01-22 17:05:18.533992: step: 1080/530, loss: 0.010862594470381737 2023-01-22 17:05:19.633046: step: 1084/530, loss: 0.011358842253684998 2023-01-22 17:05:20.718613: step: 1088/530, loss: 0.015605390071868896 2023-01-22 17:05:21.806202: step: 1092/530, loss: 0.025138139724731445 2023-01-22 17:05:22.914647: step: 1096/530, loss: 0.06401416659355164 2023-01-22 17:05:24.015638: step: 1100/530, loss: 0.009003587998449802 2023-01-22 17:05:25.077168: step: 1104/530, loss: 0.018553756177425385 2023-01-22 17:05:26.157918: step: 1108/530, loss: 0.009399579837918282 2023-01-22 17:05:27.233382: step: 1112/530, loss: 0.010055833496153355 2023-01-22 17:05:28.318261: step: 1116/530, loss: 0.007202986627817154 2023-01-22 17:05:29.412436: step: 1120/530, loss: 0.018063019961118698 2023-01-22 17:05:30.509141: step: 1124/530, loss: 0.005566895008087158 2023-01-22 17:05:31.604517: step: 1128/530, loss: 0.013489291071891785 2023-01-22 17:05:32.700006: step: 1132/530, loss: 0.018932178616523743 2023-01-22 17:05:33.795904: step: 1136/530, loss: 0.0192992202937603 2023-01-22 17:05:34.894894: step: 1140/530, loss: 0.06442520022392273 2023-01-22 17:05:35.981317: step: 1144/530, loss: 0.017229406163096428 2023-01-22 17:05:37.070202: step: 1148/530, loss: 0.023317674174904823 2023-01-22 17:05:38.162554: step: 1152/530, loss: 0.009954470209777355 2023-01-22 17:05:39.256429: step: 1156/530, loss: 0.015561471693217754 2023-01-22 17:05:40.345184: step: 1160/530, loss: 0.008471912704408169 2023-01-22 17:05:41.454646: step: 1164/530, loss: 0.006097727920860052 2023-01-22 17:05:42.545751: step: 1168/530, loss: 0.02479659393429756 2023-01-22 17:05:43.636341: step: 1172/530, loss: 0.021039575338363647 2023-01-22 17:05:44.721135: step: 1176/530, loss: 0.008313262835144997 2023-01-22 17:05:45.805514: step: 1180/530, loss: 0.014532352797687054 2023-01-22 17:05:46.896953: step: 1184/530, loss: 0.010721875354647636 2023-01-22 17:05:47.991262: step: 1188/530, loss: 0.0011187108466401696 2023-01-22 17:05:49.084357: step: 1192/530, loss: 0.008913950994610786 2023-01-22 17:05:50.176296: step: 1196/530, loss: 0.013864309526979923 2023-01-22 17:05:51.257330: step: 1200/530, loss: 0.021943002939224243 2023-01-22 17:05:52.350212: step: 1204/530, loss: 0.046534888446331024 2023-01-22 17:05:53.451108: step: 1208/530, loss: 0.003053515451028943 2023-01-22 17:05:54.542820: step: 1212/530, loss: 0.027452979236841202 2023-01-22 17:05:55.626216: step: 1216/530, loss: 0.03662760183215141 2023-01-22 17:05:56.729594: step: 1220/530, loss: 0.007847432047128677 2023-01-22 17:05:57.832024: step: 1224/530, loss: 0.04117194935679436 2023-01-22 17:05:58.929632: step: 1228/530, loss: 0.014644318260252476 2023-01-22 17:06:00.021870: step: 1232/530, loss: 0.01593797095119953 2023-01-22 17:06:01.116668: step: 1236/530, loss: 0.014883672818541527 2023-01-22 17:06:02.200754: step: 1240/530, loss: 0.007079263683408499 2023-01-22 17:06:03.293917: step: 1244/530, loss: 0.008620164357125759 2023-01-22 17:06:04.374244: step: 1248/530, loss: 0.01168068964034319 2023-01-22 17:06:05.484617: step: 1252/530, loss: 0.012292832136154175 2023-01-22 17:06:06.574593: step: 1256/530, loss: 0.009831907227635384 2023-01-22 17:06:07.695443: step: 1260/530, loss: 0.0096824262291193 2023-01-22 17:06:08.795650: step: 1264/530, loss: 0.008983486331999302 2023-01-22 17:06:09.889532: step: 1268/530, loss: 0.051251497119665146 2023-01-22 17:06:10.980845: step: 1272/530, loss: 0.015889881178736687 2023-01-22 17:06:12.123272: step: 1276/530, loss: 0.013440173119306564 2023-01-22 17:06:13.207400: step: 1280/530, loss: 0.010372988879680634 2023-01-22 17:06:14.288507: step: 1284/530, loss: 0.03607025742530823 2023-01-22 17:06:15.386865: step: 1288/530, loss: 0.013582274317741394 2023-01-22 17:06:16.503604: step: 1292/530, loss: 0.04075070098042488 2023-01-22 17:06:17.584021: step: 1296/530, loss: 0.004589695017784834 2023-01-22 17:06:18.682876: step: 1300/530, loss: 0.011066440492868423 2023-01-22 17:06:19.758298: step: 1304/530, loss: 0.012043549679219723 2023-01-22 17:06:20.850999: step: 1308/530, loss: 0.001740098581649363 2023-01-22 17:06:21.944615: step: 1312/530, loss: 0.013796101324260235 2023-01-22 17:06:23.021807: step: 1316/530, loss: 0.052267950028181076 2023-01-22 17:06:24.113441: step: 1320/530, loss: 0.0011448016157373786 2023-01-22 17:06:25.194380: step: 1324/530, loss: 0.013321767561137676 2023-01-22 17:06:26.294296: step: 1328/530, loss: 0.0713484063744545 2023-01-22 17:06:27.386118: step: 1332/530, loss: 0.014469791203737259 2023-01-22 17:06:28.472123: step: 1336/530, loss: 0.011115959845483303 2023-01-22 17:06:29.577162: step: 1340/530, loss: 0.034775689244270325 2023-01-22 17:06:30.672818: step: 1344/530, loss: 0.03947098180651665 2023-01-22 17:06:31.759960: step: 1348/530, loss: 0.033898014575242996 2023-01-22 17:06:32.838079: step: 1352/530, loss: 0.02264307253062725 2023-01-22 17:06:33.928129: step: 1356/530, loss: 0.011270228773355484 2023-01-22 17:06:35.032576: step: 1360/530, loss: 0.009110105223953724 2023-01-22 17:06:36.119717: step: 1364/530, loss: 0.004825693555176258 2023-01-22 17:06:37.212891: step: 1368/530, loss: 0.00863538309931755 2023-01-22 17:06:38.303900: step: 1372/530, loss: 0.08705249428749084 2023-01-22 17:06:39.386328: step: 1376/530, loss: 0.036806944757699966 2023-01-22 17:06:40.509284: step: 1380/530, loss: 0.016920851543545723 2023-01-22 17:06:41.587475: step: 1384/530, loss: 0.013329208828508854 2023-01-22 17:06:42.658285: step: 1388/530, loss: 0.014396107755601406 2023-01-22 17:06:43.750636: step: 1392/530, loss: 0.05370703712105751 2023-01-22 17:06:44.838102: step: 1396/530, loss: 0.015506411902606487 2023-01-22 17:06:45.944630: step: 1400/530, loss: 0.016293397173285484 2023-01-22 17:06:47.029765: step: 1404/530, loss: 0.008619780652225018 2023-01-22 17:06:48.127126: step: 1408/530, loss: 0.017172975465655327 2023-01-22 17:06:49.226555: step: 1412/530, loss: 0.017536213621497154 2023-01-22 17:06:50.304711: step: 1416/530, loss: 0.013121065683662891 2023-01-22 17:06:51.382143: step: 1420/530, loss: 0.009021638892591 2023-01-22 17:06:52.483844: step: 1424/530, loss: 0.019467992708086967 2023-01-22 17:06:53.565481: step: 1428/530, loss: 0.0451773963868618 2023-01-22 17:06:54.675438: step: 1432/530, loss: 0.0163405891507864 2023-01-22 17:06:55.776262: step: 1436/530, loss: 0.006332543212920427 2023-01-22 17:06:56.871271: step: 1440/530, loss: 0.013158321380615234 2023-01-22 17:06:57.955797: step: 1444/530, loss: 0.010919002816081047 2023-01-22 17:06:59.051680: step: 1448/530, loss: 0.005222956649959087 2023-01-22 17:07:00.139616: step: 1452/530, loss: 0.007199855521321297 2023-01-22 17:07:01.244088: step: 1456/530, loss: 0.0466931015253067 2023-01-22 17:07:02.355713: step: 1460/530, loss: 0.02764984965324402 2023-01-22 17:07:03.448982: step: 1464/530, loss: 0.015452233143150806 2023-01-22 17:07:04.530440: step: 1468/530, loss: 0.013781887479126453 2023-01-22 17:07:05.609461: step: 1472/530, loss: 0.008006605319678783 2023-01-22 17:07:06.711032: step: 1476/530, loss: 0.009298715740442276 2023-01-22 17:07:07.828228: step: 1480/530, loss: 0.017962105572223663 2023-01-22 17:07:08.926876: step: 1484/530, loss: 0.04525889456272125 2023-01-22 17:07:10.013620: step: 1488/530, loss: 0.0073051913641393185 2023-01-22 17:07:11.119350: step: 1492/530, loss: 0.006594618316739798 2023-01-22 17:07:12.229034: step: 1496/530, loss: 0.03404797613620758 2023-01-22 17:07:13.309143: step: 1500/530, loss: 0.006146298721432686 2023-01-22 17:07:14.401739: step: 1504/530, loss: 0.0053114937618374825 2023-01-22 17:07:15.488152: step: 1508/530, loss: 0.007468213327229023 2023-01-22 17:07:16.581847: step: 1512/530, loss: 0.016199523583054543 2023-01-22 17:07:17.656386: step: 1516/530, loss: 0.009386864490807056 2023-01-22 17:07:18.737056: step: 1520/530, loss: 0.040742166340351105 2023-01-22 17:07:19.810169: step: 1524/530, loss: 0.01466831099241972 2023-01-22 17:07:20.905017: step: 1528/530, loss: 0.06471836566925049 2023-01-22 17:07:21.996143: step: 1532/530, loss: 0.06189916282892227 2023-01-22 17:07:23.081011: step: 1536/530, loss: 0.005648388527333736 2023-01-22 17:07:24.162724: step: 1540/530, loss: 0.005295681767165661 2023-01-22 17:07:25.241867: step: 1544/530, loss: 0.038363661617040634 2023-01-22 17:07:26.336862: step: 1548/530, loss: 0.01912683993577957 2023-01-22 17:07:27.456489: step: 1552/530, loss: 0.02115822024643421 2023-01-22 17:07:28.541932: step: 1556/530, loss: 0.006661378778517246 2023-01-22 17:07:29.625343: step: 1560/530, loss: 0.0025027559604495764 2023-01-22 17:07:30.721697: step: 1564/530, loss: 0.028140855953097343 2023-01-22 17:07:31.824462: step: 1568/530, loss: 0.05170895904302597 2023-01-22 17:07:32.914811: step: 1572/530, loss: 0.015366709791123867 2023-01-22 17:07:34.007070: step: 1576/530, loss: 0.0493619404733181 2023-01-22 17:07:35.105942: step: 1580/530, loss: 0.006609445903450251 2023-01-22 17:07:36.203598: step: 1584/530, loss: 0.086870476603508 2023-01-22 17:07:37.290945: step: 1588/530, loss: 0.004183044657111168 2023-01-22 17:07:38.419276: step: 1592/530, loss: 0.02441703900694847 2023-01-22 17:07:39.496304: step: 1596/530, loss: 0.005866901483386755 2023-01-22 17:07:40.595995: step: 1600/530, loss: 0.006879615597426891 2023-01-22 17:07:41.681715: step: 1604/530, loss: 0.011241494677960873 2023-01-22 17:07:42.816177: step: 1608/530, loss: 0.006326948292553425 2023-01-22 17:07:43.934602: step: 1612/530, loss: 0.08572746813297272 2023-01-22 17:07:45.032697: step: 1616/530, loss: 0.04401139169931412 2023-01-22 17:07:46.114392: step: 1620/530, loss: 0.010090016759932041 2023-01-22 17:07:47.192559: step: 1624/530, loss: 0.027341250330209732 2023-01-22 17:07:48.276873: step: 1628/530, loss: 0.05105701833963394 2023-01-22 17:07:49.349703: step: 1632/530, loss: 0.0067165750078856945 2023-01-22 17:07:50.462849: step: 1636/530, loss: 0.008871729485690594 2023-01-22 17:07:51.569490: step: 1640/530, loss: 0.010072163306176662 2023-01-22 17:07:52.658885: step: 1644/530, loss: 0.017721718177199364 2023-01-22 17:07:53.783244: step: 1648/530, loss: 0.014519420452415943 2023-01-22 17:07:54.860028: step: 1652/530, loss: 0.003179592080414295 2023-01-22 17:07:55.951130: step: 1656/530, loss: 0.0170866921544075 2023-01-22 17:07:57.029668: step: 1660/530, loss: 0.004248795565217733 2023-01-22 17:07:58.130290: step: 1664/530, loss: 0.041401106864213943 2023-01-22 17:07:59.258396: step: 1668/530, loss: 0.010224878787994385 2023-01-22 17:08:00.350021: step: 1672/530, loss: 0.005794689524918795 2023-01-22 17:08:01.432972: step: 1676/530, loss: 0.004830840975046158 2023-01-22 17:08:02.513965: step: 1680/530, loss: 0.046073660254478455 2023-01-22 17:08:03.585308: step: 1684/530, loss: 0.02316979132592678 2023-01-22 17:08:04.676196: step: 1688/530, loss: 0.011960898526012897 2023-01-22 17:08:05.770402: step: 1692/530, loss: 0.005457218736410141 2023-01-22 17:08:06.875004: step: 1696/530, loss: 0.023861417546868324 2023-01-22 17:08:07.949568: step: 1700/530, loss: 0.007934191264212132 2023-01-22 17:08:09.052276: step: 1704/530, loss: 0.0192751195281744 2023-01-22 17:08:10.147417: step: 1708/530, loss: 0.009477551095187664 2023-01-22 17:08:11.231949: step: 1712/530, loss: 0.011693878099322319 2023-01-22 17:08:12.344133: step: 1716/530, loss: 0.012986032292246819 2023-01-22 17:08:13.427630: step: 1720/530, loss: 0.04070911556482315 2023-01-22 17:08:14.512053: step: 1724/530, loss: 0.04441099613904953 2023-01-22 17:08:15.606425: step: 1728/530, loss: 0.03590861335396767 2023-01-22 17:08:16.710315: step: 1732/530, loss: 0.007922603748738766 2023-01-22 17:08:17.797059: step: 1736/530, loss: 0.015488187782466412 2023-01-22 17:08:18.874498: step: 1740/530, loss: 0.05255468189716339 2023-01-22 17:08:19.974414: step: 1744/530, loss: 0.05340617895126343 2023-01-22 17:08:21.056636: step: 1748/530, loss: 0.016160784289240837 2023-01-22 17:08:22.147421: step: 1752/530, loss: 0.011097296141088009 2023-01-22 17:08:23.225853: step: 1756/530, loss: 0.04077597334980965 2023-01-22 17:08:24.318572: step: 1760/530, loss: 0.02521529048681259 2023-01-22 17:08:25.414801: step: 1764/530, loss: 0.016891025006771088 2023-01-22 17:08:26.496627: step: 1768/530, loss: 0.021420054137706757 2023-01-22 17:08:27.581758: step: 1772/530, loss: 0.014504202641546726 2023-01-22 17:08:28.682191: step: 1776/530, loss: 0.013056584633886814 2023-01-22 17:08:29.774793: step: 1780/530, loss: 0.008672324940562248 2023-01-22 17:08:30.889536: step: 1784/530, loss: 0.05655907839536667 2023-01-22 17:08:31.970453: step: 1788/530, loss: 0.011442478746175766 2023-01-22 17:08:33.031894: step: 1792/530, loss: 0.023429814726114273 2023-01-22 17:08:34.118900: step: 1796/530, loss: 0.006677787285298109 2023-01-22 17:08:35.206110: step: 1800/530, loss: 0.02389880083501339 2023-01-22 17:08:36.284948: step: 1804/530, loss: 0.014673844911158085 2023-01-22 17:08:37.375758: step: 1808/530, loss: 0.011427624151110649 2023-01-22 17:08:38.455289: step: 1812/530, loss: 0.017208192497491837 2023-01-22 17:08:39.550650: step: 1816/530, loss: 0.009373791515827179 2023-01-22 17:08:40.623357: step: 1820/530, loss: 0.010688582435250282 2023-01-22 17:08:41.709988: step: 1824/530, loss: 0.011597719043493271 2023-01-22 17:08:42.797615: step: 1828/530, loss: 0.011483196169137955 2023-01-22 17:08:43.880249: step: 1832/530, loss: 0.0057946061715483665 2023-01-22 17:08:44.959965: step: 1836/530, loss: 0.016938593238592148 2023-01-22 17:08:46.041630: step: 1840/530, loss: 0.021978773176670074 2023-01-22 17:08:47.108045: step: 1844/530, loss: 0.011688240803778172 2023-01-22 17:08:48.211066: step: 1848/530, loss: 0.020980799570679665 2023-01-22 17:08:49.289100: step: 1852/530, loss: 0.005678862798959017 2023-01-22 17:08:50.362829: step: 1856/530, loss: 0.007353747729212046 2023-01-22 17:08:51.465471: step: 1860/530, loss: 0.016599297523498535 2023-01-22 17:08:52.539201: step: 1864/530, loss: 0.011584038846194744 2023-01-22 17:08:53.644985: step: 1868/530, loss: 0.011547436937689781 2023-01-22 17:08:54.721731: step: 1872/530, loss: 0.011611199006438255 2023-01-22 17:08:55.806860: step: 1876/530, loss: 0.005899867508560419 2023-01-22 17:08:56.890126: step: 1880/530, loss: 0.020347844809293747 2023-01-22 17:08:57.994972: step: 1884/530, loss: 0.041970983147621155 2023-01-22 17:08:59.088073: step: 1888/530, loss: 0.023819850757718086 2023-01-22 17:09:00.178214: step: 1892/530, loss: 0.021984515711665154 2023-01-22 17:09:01.289563: step: 1896/530, loss: 0.006055832374840975 2023-01-22 17:09:02.412207: step: 1900/530, loss: 0.002389435190707445 2023-01-22 17:09:03.494853: step: 1904/530, loss: 0.02583673968911171 2023-01-22 17:09:04.573017: step: 1908/530, loss: 0.013413617387413979 2023-01-22 17:09:05.658825: step: 1912/530, loss: 0.005588800646364689 2023-01-22 17:09:06.730913: step: 1916/530, loss: 0.015275241807103157 2023-01-22 17:09:07.796792: step: 1920/530, loss: 0.007640031632035971 2023-01-22 17:09:08.920686: step: 1924/530, loss: 0.008493843488395214 2023-01-22 17:09:10.017287: step: 1928/530, loss: 0.014558842405676842 2023-01-22 17:09:11.121267: step: 1932/530, loss: 0.015088051557540894 2023-01-22 17:09:12.198760: step: 1936/530, loss: 0.01971045881509781 2023-01-22 17:09:13.284578: step: 1940/530, loss: 0.007974453270435333 2023-01-22 17:09:14.381875: step: 1944/530, loss: 0.031929511576890945 2023-01-22 17:09:15.490394: step: 1948/530, loss: 0.03817980736494064 2023-01-22 17:09:16.550820: step: 1952/530, loss: 0.014736795797944069 2023-01-22 17:09:17.655676: step: 1956/530, loss: 0.01946777105331421 2023-01-22 17:09:18.774487: step: 1960/530, loss: 0.04873862862586975 2023-01-22 17:09:19.896191: step: 1964/530, loss: 0.04807610437273979 2023-01-22 17:09:20.975271: step: 1968/530, loss: 0.005408183671534061 2023-01-22 17:09:22.054195: step: 1972/530, loss: 0.003873688168823719 2023-01-22 17:09:23.141917: step: 1976/530, loss: 0.007736499886959791 2023-01-22 17:09:24.238120: step: 1980/530, loss: 0.00979442335665226 2023-01-22 17:09:25.330155: step: 1984/530, loss: 0.005270025227218866 2023-01-22 17:09:26.409619: step: 1988/530, loss: 0.0016902843490242958 2023-01-22 17:09:27.503657: step: 1992/530, loss: 0.016470305621623993 2023-01-22 17:09:28.584492: step: 1996/530, loss: 0.016909243538975716 2023-01-22 17:09:29.688280: step: 2000/530, loss: 0.01853897050023079 2023-01-22 17:09:30.803190: step: 2004/530, loss: 0.042839545756578445 2023-01-22 17:09:31.911262: step: 2008/530, loss: 0.007836148142814636 2023-01-22 17:09:33.000573: step: 2012/530, loss: 0.04640832543373108 2023-01-22 17:09:34.120921: step: 2016/530, loss: 0.007148121017962694 2023-01-22 17:09:35.219983: step: 2020/530, loss: 0.04487069696187973 2023-01-22 17:09:36.317932: step: 2024/530, loss: 0.014467395842075348 2023-01-22 17:09:37.408132: step: 2028/530, loss: 0.01731143891811371 2023-01-22 17:09:38.489458: step: 2032/530, loss: 0.01316429115831852 2023-01-22 17:09:39.579196: step: 2036/530, loss: 0.04857649281620979 2023-01-22 17:09:40.667851: step: 2040/530, loss: 0.013822689652442932 2023-01-22 17:09:41.751283: step: 2044/530, loss: 0.05104544386267662 2023-01-22 17:09:42.850448: step: 2048/530, loss: 0.06270679086446762 2023-01-22 17:09:43.937137: step: 2052/530, loss: 0.010346686467528343 2023-01-22 17:09:45.063489: step: 2056/530, loss: 0.007750852964818478 2023-01-22 17:09:46.155416: step: 2060/530, loss: 0.008350764401257038 2023-01-22 17:09:47.241652: step: 2064/530, loss: 0.008360866457223892 2023-01-22 17:09:48.311975: step: 2068/530, loss: 0.04624565690755844 2023-01-22 17:09:49.372589: step: 2072/530, loss: 0.030611254274845123 2023-01-22 17:09:50.462625: step: 2076/530, loss: 0.02276519685983658 2023-01-22 17:09:51.523652: step: 2080/530, loss: 0.010013825260102749 2023-01-22 17:09:52.612659: step: 2084/530, loss: 0.03413398936390877 2023-01-22 17:09:53.685954: step: 2088/530, loss: 0.01107659749686718 2023-01-22 17:09:54.775865: step: 2092/530, loss: 0.008314614184200764 2023-01-22 17:09:55.861848: step: 2096/530, loss: 0.009954916313290596 2023-01-22 17:09:56.966911: step: 2100/530, loss: 0.04503287002444267 2023-01-22 17:09:58.057306: step: 2104/530, loss: 0.012182024307549 2023-01-22 17:09:59.136324: step: 2108/530, loss: 0.0066059851087629795 2023-01-22 17:10:00.207169: step: 2112/530, loss: 0.003165996866300702 2023-01-22 17:10:01.288877: step: 2116/530, loss: 0.02666446566581726 2023-01-22 17:10:02.399681: step: 2120/530, loss: 0.010328611359000206 ================================================== Loss: 0.022 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.330457410236822, 'r': 0.35177724315532666, 'f1': 0.34078420430672274}, 'combined': 0.2511041505417957, 'stategy': 1, 'epoch': 0} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3164748486044226, 'r': 0.28704988740875914, 'f1': 0.30104505826789996}, 'combined': 0.18696482566111683, 'stategy': 1, 'epoch': 0} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3385985644584724, 'r': 0.339883568498163, 'f1': 0.3392398496184316}, 'combined': 0.24996620498200223, 'stategy': 1, 'epoch': 0} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3012709339693999, 'r': 0.28488131837264724, 'f1': 0.29284698817971155}, 'combined': 0.18187339265897876, 'stategy': 1, 'epoch': 0} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3350544445433109, 'r': 0.32233890585096514, 'f1': 0.32857370093512306}, 'combined': 0.2421069375311433, 'stategy': 1, 'epoch': 0} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3252510122348801, 'r': 0.289932541014903, 'f1': 0.3065779374197252}, 'combined': 0.1904010348185662, 'stategy': 1, 'epoch': 0} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 0} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3357142857142857, 'r': 0.5108695652173914, 'f1': 0.4051724137931034}, 'combined': 0.2025862068965517, 'stategy': 1, 'epoch': 0} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 0} New best chinese model... New best korean model... New best russian model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.330457410236822, 'r': 0.35177724315532666, 'f1': 0.34078420430672274}, 'combined': 0.2511041505417957, 'stategy': 1, 'epoch': 0} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3164748486044226, 'r': 0.28704988740875914, 'f1': 0.30104505826789996}, 'combined': 0.18696482566111683, 'stategy': 1, 'epoch': 0} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 0} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3385985644584724, 'r': 0.339883568498163, 'f1': 0.3392398496184316}, 'combined': 0.24996620498200223, 'stategy': 1, 'epoch': 0} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3012709339693999, 'r': 0.28488131837264724, 'f1': 0.29284698817971155}, 'combined': 0.18187339265897876, 'stategy': 1, 'epoch': 0} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3357142857142857, 'r': 0.5108695652173914, 'f1': 0.4051724137931034}, 'combined': 0.2025862068965517, 'stategy': 1, 'epoch': 0} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3350544445433109, 'r': 0.32233890585096514, 'f1': 0.32857370093512306}, 'combined': 0.2421069375311433, 'stategy': 1, 'epoch': 0} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3252510122348801, 'r': 0.289932541014903, 'f1': 0.3065779374197252}, 'combined': 0.1904010348185662, 'stategy': 1, 'epoch': 0} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 0} ****************************** Epoch: 1 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 17:13:01.737365: step: 4/530, loss: 0.005641673691570759 2023-01-22 17:13:02.822053: step: 8/530, loss: 0.02767476812005043 2023-01-22 17:13:03.896255: step: 12/530, loss: 0.006464339327067137 2023-01-22 17:13:05.004839: step: 16/530, loss: 0.006023034919053316 2023-01-22 17:13:06.075019: step: 20/530, loss: 0.002565554343163967 2023-01-22 17:13:07.149697: step: 24/530, loss: 0.007445499766618013 2023-01-22 17:13:08.219606: step: 28/530, loss: 0.03772822394967079 2023-01-22 17:13:09.304393: step: 32/530, loss: 0.012982611544430256 2023-01-22 17:13:10.397442: step: 36/530, loss: 0.009248163551092148 2023-01-22 17:13:11.490494: step: 40/530, loss: 0.013611535541713238 2023-01-22 17:13:12.564589: step: 44/530, loss: 0.0074456194415688515 2023-01-22 17:13:13.666458: step: 48/530, loss: 0.01183254737406969 2023-01-22 17:13:14.740344: step: 52/530, loss: 0.00836742203682661 2023-01-22 17:13:15.829869: step: 56/530, loss: 0.029643826186656952 2023-01-22 17:13:16.910103: step: 60/530, loss: 0.0018335202476009727 2023-01-22 17:13:18.009205: step: 64/530, loss: 0.009220931679010391 2023-01-22 17:13:19.090431: step: 68/530, loss: 0.0027676185127347708 2023-01-22 17:13:20.158518: step: 72/530, loss: 0.045051395893096924 2023-01-22 17:13:21.239554: step: 76/530, loss: 0.024673137813806534 2023-01-22 17:13:22.325269: step: 80/530, loss: 0.015320098027586937 2023-01-22 17:13:23.409800: step: 84/530, loss: 0.012221215292811394 2023-01-22 17:13:24.480204: step: 88/530, loss: 0.031142128631472588 2023-01-22 17:13:25.565576: step: 92/530, loss: 0.012339354492723942 2023-01-22 17:13:26.651818: step: 96/530, loss: 0.03250077739357948 2023-01-22 17:13:27.751215: step: 100/530, loss: 0.013919645920395851 2023-01-22 17:13:28.847170: step: 104/530, loss: 0.011967160739004612 2023-01-22 17:13:29.940087: step: 108/530, loss: 0.009652109816670418 2023-01-22 17:13:31.036344: step: 112/530, loss: 0.008104892447590828 2023-01-22 17:13:32.125684: step: 116/530, loss: 0.023436369374394417 2023-01-22 17:13:33.219651: step: 120/530, loss: 0.007483702152967453 2023-01-22 17:13:34.318901: step: 124/530, loss: 0.011638524010777473 2023-01-22 17:13:35.412880: step: 128/530, loss: 0.011519819498062134 2023-01-22 17:13:36.500279: step: 132/530, loss: 0.02385181561112404 2023-01-22 17:13:37.590621: step: 136/530, loss: 0.018908152356743813 2023-01-22 17:13:38.709336: step: 140/530, loss: 0.010773095302283764 2023-01-22 17:13:39.797937: step: 144/530, loss: 0.013346029445528984 2023-01-22 17:13:40.868053: step: 148/530, loss: 0.004396419040858746 2023-01-22 17:13:41.959428: step: 152/530, loss: 0.024951230734586716 2023-01-22 17:13:43.059868: step: 156/530, loss: 0.039059292525053024 2023-01-22 17:13:44.143123: step: 160/530, loss: 0.00906367413699627 2023-01-22 17:13:45.238594: step: 164/530, loss: 0.006897334475070238 2023-01-22 17:13:46.349660: step: 168/530, loss: 0.04623740538954735 2023-01-22 17:13:47.433002: step: 172/530, loss: 0.01330616045743227 2023-01-22 17:13:48.497352: step: 176/530, loss: 0.020469974726438522 2023-01-22 17:13:49.571955: step: 180/530, loss: 0.016315195709466934 2023-01-22 17:13:50.655429: step: 184/530, loss: 0.009510687552392483 2023-01-22 17:13:51.764694: step: 188/530, loss: 0.030139977112412453 2023-01-22 17:13:52.836141: step: 192/530, loss: 0.03469419106841087 2023-01-22 17:13:53.922566: step: 196/530, loss: 0.011470895260572433 2023-01-22 17:13:55.003169: step: 200/530, loss: 0.004861598368734121 2023-01-22 17:13:56.097060: step: 204/530, loss: 0.02003544010221958 2023-01-22 17:13:57.203269: step: 208/530, loss: 0.013560621067881584 2023-01-22 17:13:58.332220: step: 212/530, loss: 0.021602347493171692 2023-01-22 17:13:59.425056: step: 216/530, loss: 0.03374919667840004 2023-01-22 17:14:00.510094: step: 220/530, loss: 0.033289119601249695 2023-01-22 17:14:01.581224: step: 224/530, loss: 0.04721187427639961 2023-01-22 17:14:02.697803: step: 228/530, loss: 0.013874021358788013 2023-01-22 17:14:03.786735: step: 232/530, loss: 0.010972077958285809 2023-01-22 17:14:04.860102: step: 236/530, loss: 0.010974066331982613 2023-01-22 17:14:05.944987: step: 240/530, loss: 0.021125182509422302 2023-01-22 17:14:07.037365: step: 244/530, loss: 0.008498281240463257 2023-01-22 17:14:08.113615: step: 248/530, loss: 0.00769105413928628 2023-01-22 17:14:09.202568: step: 252/530, loss: 0.012197794392704964 2023-01-22 17:14:10.279069: step: 256/530, loss: 0.011553655378520489 2023-01-22 17:14:11.364426: step: 260/530, loss: 0.012967188842594624 2023-01-22 17:14:12.440652: step: 264/530, loss: 0.009487172588706017 2023-01-22 17:14:13.525258: step: 268/530, loss: 0.003814895171672106 2023-01-22 17:14:14.612620: step: 272/530, loss: 0.0024984669871628284 2023-01-22 17:14:15.691345: step: 276/530, loss: 0.010408744215965271 2023-01-22 17:14:16.767331: step: 280/530, loss: 0.006640077568590641 2023-01-22 17:14:17.860958: step: 284/530, loss: 0.0037364831659942865 2023-01-22 17:14:18.953278: step: 288/530, loss: 0.02296803705394268 2023-01-22 17:14:20.022273: step: 292/530, loss: 0.005384999327361584 2023-01-22 17:14:21.108743: step: 296/530, loss: 0.004077731631696224 2023-01-22 17:14:22.179701: step: 300/530, loss: 0.006421379745006561 2023-01-22 17:14:23.249329: step: 304/530, loss: 0.006202185992151499 2023-01-22 17:14:24.337407: step: 308/530, loss: 0.026412248611450195 2023-01-22 17:14:25.457195: step: 312/530, loss: 0.060694605112075806 2023-01-22 17:14:26.551515: step: 316/530, loss: 0.020239736884832382 2023-01-22 17:14:27.648848: step: 320/530, loss: 0.005850775167346001 2023-01-22 17:14:28.753607: step: 324/530, loss: 0.005612388718873262 2023-01-22 17:14:29.848715: step: 328/530, loss: 0.040948543697595596 2023-01-22 17:14:30.957696: step: 332/530, loss: 0.006373019888997078 2023-01-22 17:14:32.028442: step: 336/530, loss: 0.02074727974832058 2023-01-22 17:14:33.109587: step: 340/530, loss: 0.01446513645350933 2023-01-22 17:14:34.229306: step: 344/530, loss: 0.03704356774687767 2023-01-22 17:14:35.341121: step: 348/530, loss: 0.016241004690527916 2023-01-22 17:14:36.420043: step: 352/530, loss: 0.014843384735286236 2023-01-22 17:14:37.521950: step: 356/530, loss: 0.005968667101114988 2023-01-22 17:14:38.610264: step: 360/530, loss: 0.021548090502619743 2023-01-22 17:14:39.713875: step: 364/530, loss: 0.010564169846475124 2023-01-22 17:14:40.809862: step: 368/530, loss: 0.008715122006833553 2023-01-22 17:14:41.895011: step: 372/530, loss: 0.044845305383205414 2023-01-22 17:14:42.991625: step: 376/530, loss: 0.005612906068563461 2023-01-22 17:14:44.092916: step: 380/530, loss: 0.015625333413481712 2023-01-22 17:14:45.188917: step: 384/530, loss: 0.003909599035978317 2023-01-22 17:14:46.274407: step: 388/530, loss: 0.007939442060887814 2023-01-22 17:14:47.364103: step: 392/530, loss: 0.012792473658919334 2023-01-22 17:14:48.474823: step: 396/530, loss: 0.004712843336164951 2023-01-22 17:14:49.560481: step: 400/530, loss: 0.046316131949424744 2023-01-22 17:14:50.679045: step: 404/530, loss: 0.019022682681679726 2023-01-22 17:14:51.769578: step: 408/530, loss: 0.06996455043554306 2023-01-22 17:14:52.873658: step: 412/530, loss: 0.00816689059138298 2023-01-22 17:14:53.978730: step: 416/530, loss: 0.003402122063562274 2023-01-22 17:14:55.090389: step: 420/530, loss: 0.022883590310811996 2023-01-22 17:14:56.188122: step: 424/530, loss: 0.006130310241132975 2023-01-22 17:14:57.299593: step: 428/530, loss: 0.020629115402698517 2023-01-22 17:14:58.409903: step: 432/530, loss: 0.10651036351919174 2023-01-22 17:14:59.529674: step: 436/530, loss: 0.002941350219771266 2023-01-22 17:15:00.626611: step: 440/530, loss: 0.03869142010807991 2023-01-22 17:15:01.742310: step: 444/530, loss: 0.015508608892560005 2023-01-22 17:15:02.849903: step: 448/530, loss: 0.013619472272694111 2023-01-22 17:15:03.971492: step: 452/530, loss: 0.006740827113389969 2023-01-22 17:15:05.042548: step: 456/530, loss: 0.00532924197614193 2023-01-22 17:15:06.153879: step: 460/530, loss: 0.024177664890885353 2023-01-22 17:15:07.230080: step: 464/530, loss: 0.001887515769340098 2023-01-22 17:15:08.304577: step: 468/530, loss: 0.015710581094026566 2023-01-22 17:15:09.396171: step: 472/530, loss: 0.005297767464071512 2023-01-22 17:15:10.490430: step: 476/530, loss: 0.024334866553544998 2023-01-22 17:15:11.594244: step: 480/530, loss: 0.004942451138049364 2023-01-22 17:15:12.698561: step: 484/530, loss: 0.026859039440751076 2023-01-22 17:15:13.792037: step: 488/530, loss: 0.005093375686556101 2023-01-22 17:15:14.879152: step: 492/530, loss: 0.03999800980091095 2023-01-22 17:15:15.954288: step: 496/530, loss: 0.00826770719140768 2023-01-22 17:15:17.068550: step: 500/530, loss: 0.005403068382292986 2023-01-22 17:15:18.171261: step: 504/530, loss: 0.04293103888630867 2023-01-22 17:15:19.254408: step: 508/530, loss: 0.010611155070364475 2023-01-22 17:15:20.361225: step: 512/530, loss: 0.020945990458130836 2023-01-22 17:15:21.483177: step: 516/530, loss: 0.01142231747508049 2023-01-22 17:15:22.592318: step: 520/530, loss: 0.01530852634459734 2023-01-22 17:15:23.684592: step: 524/530, loss: 0.01927567832171917 2023-01-22 17:15:24.769974: step: 528/530, loss: 0.01029086671769619 2023-01-22 17:15:25.876616: step: 532/530, loss: 0.05991935729980469 2023-01-22 17:15:26.957267: step: 536/530, loss: 0.00935330055654049 2023-01-22 17:15:28.059104: step: 540/530, loss: 0.012328356504440308 2023-01-22 17:15:29.149698: step: 544/530, loss: 0.008024824783205986 2023-01-22 17:15:30.229217: step: 548/530, loss: 0.007618793286383152 2023-01-22 17:15:31.317602: step: 552/530, loss: 0.0005801370134577155 2023-01-22 17:15:32.421102: step: 556/530, loss: 0.020705144852399826 2023-01-22 17:15:33.504307: step: 560/530, loss: 0.05678887292742729 2023-01-22 17:15:34.606608: step: 564/530, loss: 0.004876886494457722 2023-01-22 17:15:35.719746: step: 568/530, loss: 0.03397480398416519 2023-01-22 17:15:36.833959: step: 572/530, loss: 0.01163378357887268 2023-01-22 17:15:37.904108: step: 576/530, loss: 0.02361510507762432 2023-01-22 17:15:39.028602: step: 580/530, loss: 0.030911602079868317 2023-01-22 17:15:40.138807: step: 584/530, loss: 0.000158442446263507 2023-01-22 17:15:41.229534: step: 588/530, loss: 0.005778936203569174 2023-01-22 17:15:42.340057: step: 592/530, loss: 0.004600215703248978 2023-01-22 17:15:43.410724: step: 596/530, loss: 0.004718068987131119 2023-01-22 17:15:44.502620: step: 600/530, loss: 0.004555044695734978 2023-01-22 17:15:45.602061: step: 604/530, loss: 0.013402585871517658 2023-01-22 17:15:46.703397: step: 608/530, loss: 0.009843009524047375 2023-01-22 17:15:47.785670: step: 612/530, loss: 0.00898763444274664 2023-01-22 17:15:48.889234: step: 616/530, loss: 0.008238019421696663 2023-01-22 17:15:49.997450: step: 620/530, loss: 0.03368796408176422 2023-01-22 17:15:51.086511: step: 624/530, loss: 0.008473996073007584 2023-01-22 17:15:52.153117: step: 628/530, loss: 0.007081137038767338 2023-01-22 17:15:53.263364: step: 632/530, loss: 0.011353718116879463 2023-01-22 17:15:54.348878: step: 636/530, loss: 0.030242454260587692 2023-01-22 17:15:55.459953: step: 640/530, loss: 0.008260573260486126 2023-01-22 17:15:56.550305: step: 644/530, loss: 0.015393915586173534 2023-01-22 17:15:57.656445: step: 648/530, loss: 0.0032675284892320633 2023-01-22 17:15:58.750402: step: 652/530, loss: 0.012374993413686752 2023-01-22 17:15:59.850699: step: 656/530, loss: 0.00668248301371932 2023-01-22 17:16:00.962023: step: 660/530, loss: 0.0027193506248295307 2023-01-22 17:16:02.037428: step: 664/530, loss: 0.007382545154541731 2023-01-22 17:16:03.110088: step: 668/530, loss: 0.0024907432962208986 2023-01-22 17:16:04.214306: step: 672/530, loss: 0.00687566539272666 2023-01-22 17:16:05.309366: step: 676/530, loss: 0.012593916617333889 2023-01-22 17:16:06.398660: step: 680/530, loss: 0.023399043828248978 2023-01-22 17:16:07.498647: step: 684/530, loss: 0.009080097079277039 2023-01-22 17:16:08.597842: step: 688/530, loss: 0.006220946088433266 2023-01-22 17:16:09.714929: step: 692/530, loss: 0.09992773830890656 2023-01-22 17:16:10.814039: step: 696/530, loss: 0.005490303970873356 2023-01-22 17:16:11.908593: step: 700/530, loss: 0.02275363728404045 2023-01-22 17:16:13.017893: step: 704/530, loss: 0.00788944959640503 2023-01-22 17:16:14.141275: step: 708/530, loss: 0.08822882920503616 2023-01-22 17:16:15.252848: step: 712/530, loss: 0.05410638451576233 2023-01-22 17:16:16.334145: step: 716/530, loss: 0.00497577665373683 2023-01-22 17:16:17.415895: step: 720/530, loss: 0.04873286560177803 2023-01-22 17:16:18.513866: step: 724/530, loss: 0.004274641629308462 2023-01-22 17:16:19.602659: step: 728/530, loss: 0.005349225830286741 2023-01-22 17:16:20.700982: step: 732/530, loss: 0.009203272871673107 2023-01-22 17:16:21.775253: step: 736/530, loss: 0.011367706581950188 2023-01-22 17:16:22.866803: step: 740/530, loss: 0.03039545565843582 2023-01-22 17:16:23.972799: step: 744/530, loss: 0.0032586485613137484 2023-01-22 17:16:25.073333: step: 748/530, loss: 0.02519851364195347 2023-01-22 17:16:26.179430: step: 752/530, loss: 0.014162487350404263 2023-01-22 17:16:27.294229: step: 756/530, loss: 0.0062086861580610275 2023-01-22 17:16:28.383177: step: 760/530, loss: 0.007211018819361925 2023-01-22 17:16:29.477784: step: 764/530, loss: 0.0024865069426596165 2023-01-22 17:16:30.564547: step: 768/530, loss: 0.0297025665640831 2023-01-22 17:16:31.638194: step: 772/530, loss: 0.009920384734869003 2023-01-22 17:16:32.735297: step: 776/530, loss: 0.011691642925143242 2023-01-22 17:16:33.834474: step: 780/530, loss: 0.004452267196029425 2023-01-22 17:16:34.948572: step: 784/530, loss: 0.027387509122490883 2023-01-22 17:16:36.045870: step: 788/530, loss: 0.010054368525743484 2023-01-22 17:16:37.146074: step: 792/530, loss: 0.005780488718301058 2023-01-22 17:16:38.242513: step: 796/530, loss: 0.009561055339872837 2023-01-22 17:16:39.366668: step: 800/530, loss: 0.0407571941614151 2023-01-22 17:16:40.464583: step: 804/530, loss: 0.012976707890629768 2023-01-22 17:16:41.557432: step: 808/530, loss: 0.041171710938215256 2023-01-22 17:16:42.673934: step: 812/530, loss: 0.006434359587728977 2023-01-22 17:16:43.787925: step: 816/530, loss: 0.019613947719335556 2023-01-22 17:16:44.888748: step: 820/530, loss: 0.01882244274020195 2023-01-22 17:16:46.026759: step: 824/530, loss: 0.04118381068110466 2023-01-22 17:16:47.111097: step: 828/530, loss: 0.04458343982696533 2023-01-22 17:16:48.194517: step: 832/530, loss: 0.009364611469209194 2023-01-22 17:16:49.302390: step: 836/530, loss: 0.003201334970071912 2023-01-22 17:16:50.420202: step: 840/530, loss: 0.012826669961214066 2023-01-22 17:16:51.495662: step: 844/530, loss: 0.007696354761719704 2023-01-22 17:16:52.582275: step: 848/530, loss: 0.013038534671068192 2023-01-22 17:16:53.686873: step: 852/530, loss: 0.0034489654935896397 2023-01-22 17:16:54.780666: step: 856/530, loss: 0.019957341253757477 2023-01-22 17:16:55.879159: step: 860/530, loss: 0.04034833982586861 2023-01-22 17:16:56.972563: step: 864/530, loss: 0.005544763058423996 2023-01-22 17:16:58.095514: step: 868/530, loss: 0.011408579535782337 2023-01-22 17:16:59.170355: step: 872/530, loss: 0.0009432925726287067 2023-01-22 17:17:00.262222: step: 876/530, loss: 0.02067532017827034 2023-01-22 17:17:01.339357: step: 880/530, loss: 0.03105892613530159 2023-01-22 17:17:02.427064: step: 884/530, loss: 0.0001108178767026402 2023-01-22 17:17:03.553284: step: 888/530, loss: 0.0308159701526165 2023-01-22 17:17:04.641914: step: 892/530, loss: 0.010535906068980694 2023-01-22 17:17:05.730759: step: 896/530, loss: 0.03460075333714485 2023-01-22 17:17:06.818478: step: 900/530, loss: 0.004548558034002781 2023-01-22 17:17:07.899249: step: 904/530, loss: 0.003941976930946112 2023-01-22 17:17:08.999276: step: 908/530, loss: 0.04560186341404915 2023-01-22 17:17:10.116354: step: 912/530, loss: 0.053826577961444855 2023-01-22 17:17:11.229657: step: 916/530, loss: 0.020927051082253456 2023-01-22 17:17:12.293429: step: 920/530, loss: 0.008506862446665764 2023-01-22 17:17:13.412093: step: 924/530, loss: 0.0068391673266887665 2023-01-22 17:17:14.518338: step: 928/530, loss: 0.006463491357862949 2023-01-22 17:17:15.589953: step: 932/530, loss: 0.020972708240151405 2023-01-22 17:17:16.674574: step: 936/530, loss: 0.0030379327945411205 2023-01-22 17:17:17.758270: step: 940/530, loss: 0.01844375766813755 2023-01-22 17:17:18.833113: step: 944/530, loss: 0.00045030046021565795 2023-01-22 17:17:19.934447: step: 948/530, loss: 0.013975881040096283 2023-01-22 17:17:21.009795: step: 952/530, loss: 0.015563739463686943 2023-01-22 17:17:22.094365: step: 956/530, loss: 0.0052184234373271465 2023-01-22 17:17:23.176310: step: 960/530, loss: 0.04436177387833595 2023-01-22 17:17:24.276340: step: 964/530, loss: 0.005312021821737289 2023-01-22 17:17:25.352958: step: 968/530, loss: 0.0015295686898753047 2023-01-22 17:17:26.457129: step: 972/530, loss: 0.010709281079471111 2023-01-22 17:17:27.515927: step: 976/530, loss: 0.00014532609202433378 2023-01-22 17:17:28.614836: step: 980/530, loss: 0.01103973388671875 2023-01-22 17:17:29.702724: step: 984/530, loss: 0.0076539963483810425 2023-01-22 17:17:30.781539: step: 988/530, loss: 0.004451177082955837 2023-01-22 17:17:31.905250: step: 992/530, loss: 0.035717714577913284 2023-01-22 17:17:32.995097: step: 996/530, loss: 0.05799010768532753 2023-01-22 17:17:34.078889: step: 1000/530, loss: 0.010364919900894165 2023-01-22 17:17:35.173612: step: 1004/530, loss: 0.004060240462422371 2023-01-22 17:17:36.258328: step: 1008/530, loss: 0.035794422030448914 2023-01-22 17:17:37.354537: step: 1012/530, loss: 0.005741428583860397 2023-01-22 17:17:38.470733: step: 1016/530, loss: 0.005371949169784784 2023-01-22 17:17:39.565736: step: 1020/530, loss: 0.008296807296574116 2023-01-22 17:17:40.649729: step: 1024/530, loss: 0.0060907816514372826 2023-01-22 17:17:41.744905: step: 1028/530, loss: 0.003747503738850355 2023-01-22 17:17:42.828617: step: 1032/530, loss: 0.032581131905317307 2023-01-22 17:17:43.946264: step: 1036/530, loss: 0.006987593602389097 2023-01-22 17:17:45.014319: step: 1040/530, loss: 0.02342052012681961 2023-01-22 17:17:46.073524: step: 1044/530, loss: 0.0023827464319765568 2023-01-22 17:17:47.198060: step: 1048/530, loss: 0.04525222256779671 2023-01-22 17:17:48.291784: step: 1052/530, loss: 0.007199571933597326 2023-01-22 17:17:49.388479: step: 1056/530, loss: 0.01801137812435627 2023-01-22 17:17:50.490719: step: 1060/530, loss: 0.03630020469427109 2023-01-22 17:17:51.570741: step: 1064/530, loss: 0.0016164183616638184 2023-01-22 17:17:52.666673: step: 1068/530, loss: 0.0035438472405076027 2023-01-22 17:17:53.743891: step: 1072/530, loss: 0.010327319614589214 2023-01-22 17:17:54.839288: step: 1076/530, loss: 0.006465037353336811 2023-01-22 17:17:55.944009: step: 1080/530, loss: 0.0003414069360587746 2023-01-22 17:17:57.038606: step: 1084/530, loss: 0.006829671561717987 2023-01-22 17:17:58.114512: step: 1088/530, loss: 0.04112397879362106 2023-01-22 17:17:59.184434: step: 1092/530, loss: 0.007807550020515919 2023-01-22 17:18:00.278218: step: 1096/530, loss: 0.022542793303728104 2023-01-22 17:18:01.348382: step: 1100/530, loss: 0.006746973842382431 2023-01-22 17:18:02.451908: step: 1104/530, loss: 0.00983869656920433 2023-01-22 17:18:03.533355: step: 1108/530, loss: 0.049351684749126434 2023-01-22 17:18:04.626142: step: 1112/530, loss: 0.023587143048644066 2023-01-22 17:18:05.735630: step: 1116/530, loss: 0.00761682353913784 2023-01-22 17:18:06.824070: step: 1120/530, loss: 0.004863751120865345 2023-01-22 17:18:07.947182: step: 1124/530, loss: 0.007675236091017723 2023-01-22 17:18:09.025630: step: 1128/530, loss: 0.007254406344145536 2023-01-22 17:18:10.120600: step: 1132/530, loss: 0.032132767140865326 2023-01-22 17:18:11.195887: step: 1136/530, loss: 0.0 2023-01-22 17:18:12.286028: step: 1140/530, loss: 0.013009486719965935 2023-01-22 17:18:13.367181: step: 1144/530, loss: 0.009483582340180874 2023-01-22 17:18:14.477527: step: 1148/530, loss: 0.008291544392704964 2023-01-22 17:18:15.567876: step: 1152/530, loss: 0.07039010524749756 2023-01-22 17:18:16.659996: step: 1156/530, loss: 0.006580561399459839 2023-01-22 17:18:17.760346: step: 1160/530, loss: 0.011134467087686062 2023-01-22 17:18:18.846132: step: 1164/530, loss: 0.005670149344950914 2023-01-22 17:18:19.934103: step: 1168/530, loss: 0.007107221055775881 2023-01-22 17:18:21.028963: step: 1172/530, loss: 0.008636192418634892 2023-01-22 17:18:22.116244: step: 1176/530, loss: 0.007439135108143091 2023-01-22 17:18:23.203670: step: 1180/530, loss: 0.014782206155359745 2023-01-22 17:18:24.300079: step: 1184/530, loss: 0.010683221742510796 2023-01-22 17:18:25.400545: step: 1188/530, loss: 0.006635103840380907 2023-01-22 17:18:26.479535: step: 1192/530, loss: 0.006144394166767597 2023-01-22 17:18:27.582471: step: 1196/530, loss: 0.0116724893450737 2023-01-22 17:18:28.683745: step: 1200/530, loss: 0.008740604855120182 2023-01-22 17:18:29.772579: step: 1204/530, loss: 0.003188355825841427 2023-01-22 17:18:30.867338: step: 1208/530, loss: 0.026846351101994514 2023-01-22 17:18:31.944483: step: 1212/530, loss: 0.009961804375052452 2023-01-22 17:18:33.026287: step: 1216/530, loss: 0.012602888979017735 2023-01-22 17:18:34.106750: step: 1220/530, loss: 0.00370414718054235 2023-01-22 17:18:35.182967: step: 1224/530, loss: 0.0043518319725990295 2023-01-22 17:18:36.296492: step: 1228/530, loss: 0.003109956393018365 2023-01-22 17:18:37.419926: step: 1232/530, loss: 0.012438689358532429 2023-01-22 17:18:38.521065: step: 1236/530, loss: 0.02567046508193016 2023-01-22 17:18:39.600422: step: 1240/530, loss: 0.004578316118568182 2023-01-22 17:18:40.700395: step: 1244/530, loss: 0.00847189873456955 2023-01-22 17:18:41.812745: step: 1248/530, loss: 0.012865513563156128 2023-01-22 17:18:42.906572: step: 1252/530, loss: 0.005565828178077936 2023-01-22 17:18:44.014667: step: 1256/530, loss: 0.08082952350378036 2023-01-22 17:18:45.078989: step: 1260/530, loss: 0.007097425404936075 2023-01-22 17:18:46.174180: step: 1264/530, loss: 0.053296253085136414 2023-01-22 17:18:47.288800: step: 1268/530, loss: 0.05518532544374466 2023-01-22 17:18:48.378608: step: 1272/530, loss: 0.0029264793265610933 2023-01-22 17:18:49.441414: step: 1276/530, loss: 0.0028281453996896744 2023-01-22 17:18:50.564009: step: 1280/530, loss: 0.06469020992517471 2023-01-22 17:18:51.637337: step: 1284/530, loss: 0.002533006016165018 2023-01-22 17:18:52.705059: step: 1288/530, loss: 0.02022383362054825 2023-01-22 17:18:53.771969: step: 1292/530, loss: 0.012499403208494186 2023-01-22 17:18:54.868729: step: 1296/530, loss: 0.00623535830527544 2023-01-22 17:18:55.957979: step: 1300/530, loss: 0.0021335294004529715 2023-01-22 17:18:57.060844: step: 1304/530, loss: 0.04678473621606827 2023-01-22 17:18:58.149985: step: 1308/530, loss: 0.023786287754774094 2023-01-22 17:18:59.236807: step: 1312/530, loss: 0.01839214190840721 2023-01-22 17:19:00.342242: step: 1316/530, loss: 0.00917195063084364 2023-01-22 17:19:01.437042: step: 1320/530, loss: 0.011823109351098537 2023-01-22 17:19:02.556603: step: 1324/530, loss: 0.007667298428714275 2023-01-22 17:19:03.638034: step: 1328/530, loss: 0.06011826545000076 2023-01-22 17:19:04.742986: step: 1332/530, loss: 0.04796822369098663 2023-01-22 17:19:05.823094: step: 1336/530, loss: 0.006836344953626394 2023-01-22 17:19:06.919900: step: 1340/530, loss: 0.00395851070061326 2023-01-22 17:19:07.983791: step: 1344/530, loss: 0.006227710284292698 2023-01-22 17:19:09.069103: step: 1348/530, loss: 0.02330593764781952 2023-01-22 17:19:10.155391: step: 1352/530, loss: 0.00745026022195816 2023-01-22 17:19:11.247357: step: 1356/530, loss: 0.004284335300326347 2023-01-22 17:19:12.322633: step: 1360/530, loss: 0.003827574197202921 2023-01-22 17:19:13.381824: step: 1364/530, loss: 0.0037481170147657394 2023-01-22 17:19:14.502635: step: 1368/530, loss: 0.012344997376203537 2023-01-22 17:19:15.591518: step: 1372/530, loss: 0.012376873753964901 2023-01-22 17:19:16.677857: step: 1376/530, loss: 0.004207395017147064 2023-01-22 17:19:17.768096: step: 1380/530, loss: 0.004015093669295311 2023-01-22 17:19:18.846491: step: 1384/530, loss: 0.00776244979351759 2023-01-22 17:19:19.923923: step: 1388/530, loss: 0.006806132383644581 2023-01-22 17:19:21.029742: step: 1392/530, loss: 0.012347176671028137 2023-01-22 17:19:22.132912: step: 1396/530, loss: 0.04131225496530533 2023-01-22 17:19:23.220509: step: 1400/530, loss: 0.005150005221366882 2023-01-22 17:19:24.306567: step: 1404/530, loss: 0.026020819321274757 2023-01-22 17:19:25.381246: step: 1408/530, loss: 0.009125958196818829 2023-01-22 17:19:26.494453: step: 1412/530, loss: 0.010478360578417778 2023-01-22 17:19:27.589107: step: 1416/530, loss: 0.012633388862013817 2023-01-22 17:19:28.688960: step: 1420/530, loss: 0.011061619967222214 2023-01-22 17:19:29.780983: step: 1424/530, loss: 0.005792701151221991 2023-01-22 17:19:30.875461: step: 1428/530, loss: 0.011377145536243916 2023-01-22 17:19:31.979368: step: 1432/530, loss: 0.024892304092645645 2023-01-22 17:19:33.076554: step: 1436/530, loss: 0.006165762897580862 2023-01-22 17:19:34.191870: step: 1440/530, loss: 0.03086588717997074 2023-01-22 17:19:35.282208: step: 1444/530, loss: 0.010979481041431427 2023-01-22 17:19:36.383874: step: 1448/530, loss: 0.02529328502714634 2023-01-22 17:19:37.443448: step: 1452/530, loss: 0.006963388528674841 2023-01-22 17:19:38.574610: step: 1456/530, loss: 0.051081933081150055 2023-01-22 17:19:39.671913: step: 1460/530, loss: 0.017252610996365547 2023-01-22 17:19:40.750603: step: 1464/530, loss: 0.00937830563634634 2023-01-22 17:19:41.864445: step: 1468/530, loss: 0.03347708657383919 2023-01-22 17:19:42.936367: step: 1472/530, loss: 0.0019538993947207928 2023-01-22 17:19:44.016429: step: 1476/530, loss: 0.0055658030323684216 2023-01-22 17:19:45.125681: step: 1480/530, loss: 0.016274578869342804 2023-01-22 17:19:46.232530: step: 1484/530, loss: 0.012164952233433723 2023-01-22 17:19:47.328122: step: 1488/530, loss: 0.0 2023-01-22 17:19:48.425395: step: 1492/530, loss: 0.04196206480264664 2023-01-22 17:19:49.527688: step: 1496/530, loss: 0.011771033518016338 2023-01-22 17:19:50.636887: step: 1500/530, loss: 0.011590060777962208 2023-01-22 17:19:51.711083: step: 1504/530, loss: 0.01295036356896162 2023-01-22 17:19:52.803232: step: 1508/530, loss: 0.034659143537282944 2023-01-22 17:19:53.880299: step: 1512/530, loss: 0.002883182605728507 2023-01-22 17:19:54.974468: step: 1516/530, loss: 0.0041257720440626144 2023-01-22 17:19:56.087162: step: 1520/530, loss: 0.026274969801306725 2023-01-22 17:19:57.159687: step: 1524/530, loss: 0.03965918719768524 2023-01-22 17:19:58.245370: step: 1528/530, loss: 0.009315415285527706 2023-01-22 17:19:59.323917: step: 1532/530, loss: 0.01658005639910698 2023-01-22 17:20:00.388820: step: 1536/530, loss: 0.005782548803836107 2023-01-22 17:20:01.472664: step: 1540/530, loss: 0.010098210535943508 2023-01-22 17:20:02.576780: step: 1544/530, loss: 0.044509027153253555 2023-01-22 17:20:03.635795: step: 1548/530, loss: 0.004450908862054348 2023-01-22 17:20:04.744780: step: 1552/530, loss: 0.0024891409557312727 2023-01-22 17:20:05.864339: step: 1556/530, loss: 0.006433618720620871 2023-01-22 17:20:06.957974: step: 1560/530, loss: 0.01959502324461937 2023-01-22 17:20:08.033841: step: 1564/530, loss: 0.005832815542817116 2023-01-22 17:20:09.151262: step: 1568/530, loss: 0.00603628670796752 2023-01-22 17:20:10.255285: step: 1572/530, loss: 0.008451227098703384 2023-01-22 17:20:11.368413: step: 1576/530, loss: 0.0048043313436210155 2023-01-22 17:20:12.466984: step: 1580/530, loss: 0.024757657200098038 2023-01-22 17:20:13.565517: step: 1584/530, loss: 0.04192760959267616 2023-01-22 17:20:14.672297: step: 1588/530, loss: 0.008118299767374992 2023-01-22 17:20:15.769711: step: 1592/530, loss: 0.005396769382059574 2023-01-22 17:20:16.860630: step: 1596/530, loss: 0.041538264602422714 2023-01-22 17:20:17.949792: step: 1600/530, loss: 0.007196536287665367 2023-01-22 17:20:19.043955: step: 1604/530, loss: 0.00934265274554491 2023-01-22 17:20:20.129294: step: 1608/530, loss: 0.009051230736076832 2023-01-22 17:20:21.217252: step: 1612/530, loss: 0.004858491476625204 2023-01-22 17:20:22.301365: step: 1616/530, loss: 0.002977528842166066 2023-01-22 17:20:23.399884: step: 1620/530, loss: 0.037747953087091446 2023-01-22 17:20:24.490344: step: 1624/530, loss: 0.03636101260781288 2023-01-22 17:20:25.574158: step: 1628/530, loss: 0.006396973505616188 2023-01-22 17:20:26.669189: step: 1632/530, loss: 0.02565055340528488 2023-01-22 17:20:27.748359: step: 1636/530, loss: 0.0019030816620215774 2023-01-22 17:20:28.832950: step: 1640/530, loss: 0.013001527637243271 2023-01-22 17:20:29.940819: step: 1644/530, loss: 0.054762933403253555 2023-01-22 17:20:31.049931: step: 1648/530, loss: 0.00581360375508666 2023-01-22 17:20:32.114784: step: 1652/530, loss: 0.005165275186300278 2023-01-22 17:20:33.209403: step: 1656/530, loss: 0.0051534841768443584 2023-01-22 17:20:34.293251: step: 1660/530, loss: 0.040944743901491165 2023-01-22 17:20:35.379824: step: 1664/530, loss: 0.012922110967338085 2023-01-22 17:20:36.479714: step: 1668/530, loss: 0.01060144416987896 2023-01-22 17:20:37.560595: step: 1672/530, loss: 0.009440352208912373 2023-01-22 17:20:38.631364: step: 1676/530, loss: 0.006665647029876709 2023-01-22 17:20:39.729814: step: 1680/530, loss: 0.04775189608335495 2023-01-22 17:20:40.816476: step: 1684/530, loss: 0.01774897426366806 2023-01-22 17:20:41.904439: step: 1688/530, loss: 0.03745989128947258 2023-01-22 17:20:42.997072: step: 1692/530, loss: 0.011849308386445045 2023-01-22 17:20:44.074240: step: 1696/530, loss: 0.006372003350406885 2023-01-22 17:20:45.163256: step: 1700/530, loss: 0.007675140164792538 2023-01-22 17:20:46.264125: step: 1704/530, loss: 0.014992504380643368 2023-01-22 17:20:47.360732: step: 1708/530, loss: 0.006380526348948479 2023-01-22 17:20:48.462501: step: 1712/530, loss: 0.017169829457998276 2023-01-22 17:20:49.532861: step: 1716/530, loss: 0.024744641035795212 2023-01-22 17:20:50.640778: step: 1720/530, loss: 0.048928651958703995 2023-01-22 17:20:51.724722: step: 1724/530, loss: 0.005339645780622959 2023-01-22 17:20:52.813306: step: 1728/530, loss: 0.004798244684934616 2023-01-22 17:20:53.902845: step: 1732/530, loss: 0.021579215303063393 2023-01-22 17:20:55.001099: step: 1736/530, loss: 0.028703859075903893 2023-01-22 17:20:56.091910: step: 1740/530, loss: 0.0072754002176225185 2023-01-22 17:20:57.207923: step: 1744/530, loss: 0.04253525286912918 2023-01-22 17:20:58.301924: step: 1748/530, loss: 0.003510440466925502 2023-01-22 17:20:59.428578: step: 1752/530, loss: 0.005049799103289843 2023-01-22 17:21:00.519566: step: 1756/530, loss: 0.018389668315649033 2023-01-22 17:21:01.616064: step: 1760/530, loss: 0.0036845372524112463 2023-01-22 17:21:02.687852: step: 1764/530, loss: 0.0026990945916622877 2023-01-22 17:21:03.783269: step: 1768/530, loss: 0.03512921556830406 2023-01-22 17:21:04.890189: step: 1772/530, loss: 0.005441419780254364 2023-01-22 17:21:05.977917: step: 1776/530, loss: 0.006914149038493633 2023-01-22 17:21:07.069963: step: 1780/530, loss: 0.004507198929786682 2023-01-22 17:21:08.153646: step: 1784/530, loss: 0.01564428210258484 2023-01-22 17:21:09.233278: step: 1788/530, loss: 0.0042689889669418335 2023-01-22 17:21:10.310697: step: 1792/530, loss: 0.004463187884539366 2023-01-22 17:21:11.393595: step: 1796/530, loss: 0.009166345000267029 2023-01-22 17:21:12.505311: step: 1800/530, loss: 0.004761158023029566 2023-01-22 17:21:13.587956: step: 1804/530, loss: 0.009483604691922665 2023-01-22 17:21:14.693305: step: 1808/530, loss: 0.008102762512862682 2023-01-22 17:21:15.780569: step: 1812/530, loss: 0.0076997848227620125 2023-01-22 17:21:16.870793: step: 1816/530, loss: 0.010463826358318329 2023-01-22 17:21:17.965886: step: 1820/530, loss: 0.0031284149736166 2023-01-22 17:21:19.033708: step: 1824/530, loss: 0.004331889096647501 2023-01-22 17:21:20.116054: step: 1828/530, loss: 0.009172449819743633 2023-01-22 17:21:21.220517: step: 1832/530, loss: 0.06897719949483871 2023-01-22 17:21:22.300098: step: 1836/530, loss: 0.0036861842963844538 2023-01-22 17:21:23.408753: step: 1840/530, loss: 0.0324915274977684 2023-01-22 17:21:24.502858: step: 1844/530, loss: 0.03383469209074974 2023-01-22 17:21:25.596929: step: 1848/530, loss: 0.00970512069761753 2023-01-22 17:21:26.687610: step: 1852/530, loss: 0.011853737756609917 2023-01-22 17:21:27.799459: step: 1856/530, loss: 0.0028102637734264135 2023-01-22 17:21:28.874168: step: 1860/530, loss: 0.1190100684762001 2023-01-22 17:21:29.954820: step: 1864/530, loss: 0.019448217004537582 2023-01-22 17:21:31.035998: step: 1868/530, loss: 0.010541149415075779 2023-01-22 17:21:32.129917: step: 1872/530, loss: 0.004271318670362234 2023-01-22 17:21:33.226169: step: 1876/530, loss: 0.007992695085704327 2023-01-22 17:21:34.326516: step: 1880/530, loss: 0.0023088206071406603 2023-01-22 17:21:35.435569: step: 1884/530, loss: 0.01651832088828087 2023-01-22 17:21:36.548998: step: 1888/530, loss: 0.014331793412566185 2023-01-22 17:21:37.639493: step: 1892/530, loss: 0.0037648214492946863 2023-01-22 17:21:38.762233: step: 1896/530, loss: 0.009419191628694534 2023-01-22 17:21:39.888306: step: 1900/530, loss: 0.00566993560642004 2023-01-22 17:21:41.006850: step: 1904/530, loss: 0.010001144371926785 2023-01-22 17:21:42.081094: step: 1908/530, loss: 0.00864218920469284 2023-01-22 17:21:43.184577: step: 1912/530, loss: 0.010635146871209145 2023-01-22 17:21:44.284593: step: 1916/530, loss: 0.012258029542863369 2023-01-22 17:21:45.363808: step: 1920/530, loss: 0.004968596156686544 2023-01-22 17:21:46.459482: step: 1924/530, loss: 0.04668574780225754 2023-01-22 17:21:47.546722: step: 1928/530, loss: 0.034046854823827744 2023-01-22 17:21:48.653678: step: 1932/530, loss: 0.03584835305809975 2023-01-22 17:21:49.743480: step: 1936/530, loss: 0.04924082010984421 2023-01-22 17:21:50.812531: step: 1940/530, loss: 0.008164254017174244 2023-01-22 17:21:51.897744: step: 1944/530, loss: 0.011303422041237354 2023-01-22 17:21:53.020547: step: 1948/530, loss: 0.009488912299275398 2023-01-22 17:21:54.096892: step: 1952/530, loss: 0.003806962864473462 2023-01-22 17:21:55.199553: step: 1956/530, loss: 0.027558019384741783 2023-01-22 17:21:56.305351: step: 1960/530, loss: 0.007914615795016289 2023-01-22 17:21:57.378998: step: 1964/530, loss: 0.0032007251866161823 2023-01-22 17:21:58.492924: step: 1968/530, loss: 0.03232016786932945 2023-01-22 17:21:59.562856: step: 1972/530, loss: 0.0053441342897713184 2023-01-22 17:22:00.653516: step: 1976/530, loss: 0.01302309799939394 2023-01-22 17:22:01.739644: step: 1980/530, loss: 0.022190343588590622 2023-01-22 17:22:02.834221: step: 1984/530, loss: 0.006786705460399389 2023-01-22 17:22:03.946948: step: 1988/530, loss: 0.012712826021015644 2023-01-22 17:22:05.034132: step: 1992/530, loss: 0.007025027181953192 2023-01-22 17:22:06.115629: step: 1996/530, loss: 0.0010213572531938553 2023-01-22 17:22:07.217378: step: 2000/530, loss: 0.01323331892490387 2023-01-22 17:22:08.323631: step: 2004/530, loss: 0.017328208312392235 2023-01-22 17:22:09.412789: step: 2008/530, loss: 0.019475113600492477 2023-01-22 17:22:10.485549: step: 2012/530, loss: 0.04903915524482727 2023-01-22 17:22:11.578654: step: 2016/530, loss: 0.006896850187331438 2023-01-22 17:22:12.662513: step: 2020/530, loss: 0.024892330169677734 2023-01-22 17:22:13.754670: step: 2024/530, loss: 0.01610695756971836 2023-01-22 17:22:14.855698: step: 2028/530, loss: 0.03003283403813839 2023-01-22 17:22:15.941890: step: 2032/530, loss: 0.0017887263093143702 2023-01-22 17:22:17.045878: step: 2036/530, loss: 0.008579340763390064 2023-01-22 17:22:18.142039: step: 2040/530, loss: 0.035815708339214325 2023-01-22 17:22:19.230704: step: 2044/530, loss: 0.007980084046721458 2023-01-22 17:22:20.359644: step: 2048/530, loss: 0.044137533754110336 2023-01-22 17:22:21.441700: step: 2052/530, loss: 0.0021754472982138395 2023-01-22 17:22:22.537430: step: 2056/530, loss: 0.0056371125392615795 2023-01-22 17:22:23.622868: step: 2060/530, loss: 0.00535947410389781 2023-01-22 17:22:24.711851: step: 2064/530, loss: 0.03193186968564987 2023-01-22 17:22:25.820861: step: 2068/530, loss: 0.0052633220329880714 2023-01-22 17:22:26.900906: step: 2072/530, loss: 0.022842828184366226 2023-01-22 17:22:27.986345: step: 2076/530, loss: 0.01033526286482811 2023-01-22 17:22:29.069762: step: 2080/530, loss: 0.0030002822168171406 2023-01-22 17:22:30.171786: step: 2084/530, loss: 0.010663585737347603 2023-01-22 17:22:31.259111: step: 2088/530, loss: 0.0029286956414580345 2023-01-22 17:22:32.361122: step: 2092/530, loss: 0.010178258642554283 2023-01-22 17:22:33.466287: step: 2096/530, loss: 0.019944066181778908 2023-01-22 17:22:34.556619: step: 2100/530, loss: 0.007491804659366608 2023-01-22 17:22:35.642094: step: 2104/530, loss: 0.004933681804686785 2023-01-22 17:22:36.729297: step: 2108/530, loss: 0.006967674940824509 2023-01-22 17:22:37.828731: step: 2112/530, loss: 0.01465792115777731 2023-01-22 17:22:38.913301: step: 2116/530, loss: 0.004928010981529951 2023-01-22 17:22:40.000798: step: 2120/530, loss: 0.012756621465086937 ================================================== Loss: 0.016 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34074334029772785, 'r': 0.3536747763621578, 'f1': 0.34708865389731314}, 'combined': 0.2557495344506518, 'stategy': 1, 'epoch': 1} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33347831328300875, 'r': 0.2823515689122211, 'f1': 0.30579264720970056}, 'combined': 0.1899133282670772, 'stategy': 1, 'epoch': 1} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.35259574920970843, 'r': 0.339883568498163, 'f1': 0.34612297700199396}, 'combined': 0.2550379830541008, 'stategy': 1, 'epoch': 1} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.31976221915024255, 'r': 0.2833896620757837, 'f1': 0.30047923267815135}, 'combined': 0.18661341818958874, 'stategy': 1, 'epoch': 1} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3422990007715465, 'r': 0.32281328915267293, 'f1': 0.3322707097333176}, 'combined': 0.24483104927718138, 'stategy': 1, 'epoch': 1} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34442683573720273, 'r': 0.2894000631638035, 'f1': 0.31452482748992144}, 'combined': 0.19533647180953018, 'stategy': 1, 'epoch': 1} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 1} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3870967741935484, 'r': 0.5217391304347826, 'f1': 0.4444444444444444}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 1} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 1} New best chinese model... New best korean model... New best russian model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34074334029772785, 'r': 0.3536747763621578, 'f1': 0.34708865389731314}, 'combined': 0.2557495344506518, 'stategy': 1, 'epoch': 1} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33347831328300875, 'r': 0.2823515689122211, 'f1': 0.30579264720970056}, 'combined': 0.1899133282670772, 'stategy': 1, 'epoch': 1} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 1} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.35259574920970843, 'r': 0.339883568498163, 'f1': 0.34612297700199396}, 'combined': 0.2550379830541008, 'stategy': 1, 'epoch': 1} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.31976221915024255, 'r': 0.2833896620757837, 'f1': 0.30047923267815135}, 'combined': 0.18661341818958874, 'stategy': 1, 'epoch': 1} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3870967741935484, 'r': 0.5217391304347826, 'f1': 0.4444444444444444}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 1} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3422990007715465, 'r': 0.32281328915267293, 'f1': 0.3322707097333176}, 'combined': 0.24483104927718138, 'stategy': 1, 'epoch': 1} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34442683573720273, 'r': 0.2894000631638035, 'f1': 0.31452482748992144}, 'combined': 0.19533647180953018, 'stategy': 1, 'epoch': 1} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 1} ****************************** Epoch: 2 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 17:25:24.822310: step: 4/530, loss: 0.012391503900289536 2023-01-22 17:25:25.901499: step: 8/530, loss: 0.007634381297975779 2023-01-22 17:25:26.992837: step: 12/530, loss: 0.0344882532954216 2023-01-22 17:25:28.085262: step: 16/530, loss: 0.008949057199060917 2023-01-22 17:25:29.173323: step: 20/530, loss: 0.014058766886591911 2023-01-22 17:25:30.260095: step: 24/530, loss: 0.01798669435083866 2023-01-22 17:25:31.344494: step: 28/530, loss: 0.03188132122159004 2023-01-22 17:25:32.459770: step: 32/530, loss: 0.017498953267931938 2023-01-22 17:25:33.549345: step: 36/530, loss: 0.004909016191959381 2023-01-22 17:25:34.632293: step: 40/530, loss: 0.005497514270246029 2023-01-22 17:25:35.713297: step: 44/530, loss: 0.014802170917391777 2023-01-22 17:25:36.811748: step: 48/530, loss: 0.0059297094121575356 2023-01-22 17:25:37.903114: step: 52/530, loss: 0.006121484097093344 2023-01-22 17:25:39.013914: step: 56/530, loss: 0.033066362142562866 2023-01-22 17:25:40.118799: step: 60/530, loss: 0.017747612670063972 2023-01-22 17:25:41.208046: step: 64/530, loss: 0.003740782616659999 2023-01-22 17:25:42.295961: step: 68/530, loss: 0.0008440447854809463 2023-01-22 17:25:43.361316: step: 72/530, loss: 0.044839028269052505 2023-01-22 17:25:44.481737: step: 76/530, loss: 0.0036292097065597773 2023-01-22 17:25:45.570894: step: 80/530, loss: 0.0031144428066909313 2023-01-22 17:25:46.655018: step: 84/530, loss: 0.003786178771406412 2023-01-22 17:25:47.723061: step: 88/530, loss: 0.06664510071277618 2023-01-22 17:25:48.796274: step: 92/530, loss: 0.010051997378468513 2023-01-22 17:25:49.903076: step: 96/530, loss: 0.005361826159060001 2023-01-22 17:25:50.978484: step: 100/530, loss: 0.004370855167508125 2023-01-22 17:25:52.048675: step: 104/530, loss: 0.009892871603369713 2023-01-22 17:25:53.128308: step: 108/530, loss: 0.006972011178731918 2023-01-22 17:25:54.219670: step: 112/530, loss: 0.049745917320251465 2023-01-22 17:25:55.322831: step: 116/530, loss: 0.005181717686355114 2023-01-22 17:25:56.403300: step: 120/530, loss: 0.04260662570595741 2023-01-22 17:25:57.475021: step: 124/530, loss: 0.019936926662921906 2023-01-22 17:25:58.538990: step: 128/530, loss: 0.009502381086349487 2023-01-22 17:25:59.637976: step: 132/530, loss: 0.0027861290145665407 2023-01-22 17:26:00.717741: step: 136/530, loss: 0.007031664252281189 2023-01-22 17:26:01.795265: step: 140/530, loss: 0.00249624066054821 2023-01-22 17:26:02.879791: step: 144/530, loss: 0.008162613026797771 2023-01-22 17:26:03.982555: step: 148/530, loss: 0.006209488958120346 2023-01-22 17:26:05.082727: step: 152/530, loss: 0.014237584546208382 2023-01-22 17:26:06.164328: step: 156/530, loss: 0.005376539193093777 2023-01-22 17:26:07.240575: step: 160/530, loss: 0.005726292729377747 2023-01-22 17:26:08.317392: step: 164/530, loss: 0.045714814215898514 2023-01-22 17:26:09.389071: step: 168/530, loss: 0.004599275533109903 2023-01-22 17:26:10.480326: step: 172/530, loss: 0.019371014088392258 2023-01-22 17:26:11.573863: step: 176/530, loss: 0.00452074920758605 2023-01-22 17:26:12.660878: step: 180/530, loss: 0.00240876991301775 2023-01-22 17:26:13.731510: step: 184/530, loss: 0.009490301832556725 2023-01-22 17:26:14.808687: step: 188/530, loss: 0.015913814306259155 2023-01-22 17:26:15.877453: step: 192/530, loss: 0.003869971027597785 2023-01-22 17:26:16.980747: step: 196/530, loss: 0.005710897035896778 2023-01-22 17:26:18.090045: step: 200/530, loss: 0.009119526483118534 2023-01-22 17:26:19.163623: step: 204/530, loss: 0.00745429378002882 2023-01-22 17:26:20.272616: step: 208/530, loss: 0.011853475123643875 2023-01-22 17:26:21.355709: step: 212/530, loss: 0.013891429640352726 2023-01-22 17:26:22.449988: step: 216/530, loss: 0.0012209659907966852 2023-01-22 17:26:23.556720: step: 220/530, loss: 0.016997987404465675 2023-01-22 17:26:24.652983: step: 224/530, loss: 0.006589137949049473 2023-01-22 17:26:25.733282: step: 228/530, loss: 0.005170939024537802 2023-01-22 17:26:26.813019: step: 232/530, loss: 0.007014515344053507 2023-01-22 17:26:27.887193: step: 236/530, loss: 0.0014491764595732093 2023-01-22 17:26:28.994289: step: 240/530, loss: 0.017552219331264496 2023-01-22 17:26:30.100126: step: 244/530, loss: 0.0005964357405900955 2023-01-22 17:26:31.200567: step: 248/530, loss: 0.022998103871941566 2023-01-22 17:26:32.293156: step: 252/530, loss: 0.002045807894319296 2023-01-22 17:26:33.382664: step: 256/530, loss: 0.030318327248096466 2023-01-22 17:26:34.447042: step: 260/530, loss: 0.005669730249792337 2023-01-22 17:26:35.548937: step: 264/530, loss: 0.012015166692435741 2023-01-22 17:26:36.618200: step: 268/530, loss: 0.0019308619666844606 2023-01-22 17:26:37.696775: step: 272/530, loss: 0.02902081608772278 2023-01-22 17:26:38.785371: step: 276/530, loss: 0.0015481747686862946 2023-01-22 17:26:39.839663: step: 280/530, loss: 0.015439937822520733 2023-01-22 17:26:40.932895: step: 284/530, loss: 0.002557411091402173 2023-01-22 17:26:42.049457: step: 288/530, loss: 0.010464164428412914 2023-01-22 17:26:43.128656: step: 292/530, loss: 0.005846427753567696 2023-01-22 17:26:44.211603: step: 296/530, loss: 0.0033386549912393093 2023-01-22 17:26:45.296947: step: 300/530, loss: 0.004703700542449951 2023-01-22 17:26:46.411495: step: 304/530, loss: 0.0037038058508187532 2023-01-22 17:26:47.519655: step: 308/530, loss: 0.023519383743405342 2023-01-22 17:26:48.614246: step: 312/530, loss: 0.004581342451274395 2023-01-22 17:26:49.725630: step: 316/530, loss: 0.01667645014822483 2023-01-22 17:26:50.809860: step: 320/530, loss: 0.009866605512797832 2023-01-22 17:26:51.896525: step: 324/530, loss: 0.006697378121316433 2023-01-22 17:26:53.003009: step: 328/530, loss: 0.0029570343904197216 2023-01-22 17:26:54.110204: step: 332/530, loss: 0.00546490540727973 2023-01-22 17:26:55.187980: step: 336/530, loss: 0.010721621103584766 2023-01-22 17:26:56.294965: step: 340/530, loss: 0.01307881623506546 2023-01-22 17:26:57.403576: step: 344/530, loss: 0.0055169640108942986 2023-01-22 17:26:58.476532: step: 348/530, loss: 0.012309126555919647 2023-01-22 17:26:59.562853: step: 352/530, loss: 0.003929964732378721 2023-01-22 17:27:00.634497: step: 356/530, loss: 0.0027418392710387707 2023-01-22 17:27:01.752773: step: 360/530, loss: 0.004157582297921181 2023-01-22 17:27:02.864502: step: 364/530, loss: 0.002446571597829461 2023-01-22 17:27:03.952753: step: 368/530, loss: 0.007255947683006525 2023-01-22 17:27:05.034615: step: 372/530, loss: 0.004091478884220123 2023-01-22 17:27:06.128318: step: 376/530, loss: 0.0076437462121248245 2023-01-22 17:27:07.222307: step: 380/530, loss: 0.029653025791049004 2023-01-22 17:27:08.318621: step: 384/530, loss: 0.009166298434138298 2023-01-22 17:27:09.405158: step: 388/530, loss: 0.01233306247740984 2023-01-22 17:27:10.486813: step: 392/530, loss: 0.0054398709908127785 2023-01-22 17:27:11.600764: step: 396/530, loss: 0.010394660755991936 2023-01-22 17:27:12.685511: step: 400/530, loss: 0.01157502643764019 2023-01-22 17:27:13.773105: step: 404/530, loss: 0.004937803838402033 2023-01-22 17:27:14.881952: step: 408/530, loss: 0.041797030717134476 2023-01-22 17:27:15.967871: step: 412/530, loss: 0.006708246655762196 2023-01-22 17:27:17.050538: step: 416/530, loss: 0.022681649774312973 2023-01-22 17:27:18.151103: step: 420/530, loss: 0.011472459882497787 2023-01-22 17:27:19.240440: step: 424/530, loss: 0.003999972715973854 2023-01-22 17:27:20.326303: step: 428/530, loss: 0.006213391199707985 2023-01-22 17:27:21.432372: step: 432/530, loss: 0.008885979652404785 2023-01-22 17:27:22.525757: step: 436/530, loss: 0.03559815138578415 2023-01-22 17:27:23.606982: step: 440/530, loss: 0.0028997703921049833 2023-01-22 17:27:24.699389: step: 444/530, loss: 0.007490651682019234 2023-01-22 17:27:25.776266: step: 448/530, loss: 0.006587234791368246 2023-01-22 17:27:26.871456: step: 452/530, loss: 0.01258843019604683 2023-01-22 17:27:27.957548: step: 456/530, loss: 0.0022444056812673807 2023-01-22 17:27:29.050776: step: 460/530, loss: 0.004761658143252134 2023-01-22 17:27:30.151559: step: 464/530, loss: 0.005991101264953613 2023-01-22 17:27:31.216125: step: 468/530, loss: 0.011496379040181637 2023-01-22 17:27:32.330918: step: 472/530, loss: 0.0033064144663512707 2023-01-22 17:27:33.419933: step: 476/530, loss: 0.0015110295498743653 2023-01-22 17:27:34.494262: step: 480/530, loss: 0.002834895858541131 2023-01-22 17:27:35.593145: step: 484/530, loss: 0.04340868070721626 2023-01-22 17:27:36.688743: step: 488/530, loss: 0.026502616703510284 2023-01-22 17:27:37.807865: step: 492/530, loss: 0.03256915137171745 2023-01-22 17:27:38.889043: step: 496/530, loss: 0.042726702988147736 2023-01-22 17:27:39.997143: step: 500/530, loss: 0.03379477187991142 2023-01-22 17:27:41.103781: step: 504/530, loss: 0.0456722155213356 2023-01-22 17:27:42.218533: step: 508/530, loss: 0.008975841104984283 2023-01-22 17:27:43.310206: step: 512/530, loss: 0.010568582452833652 2023-01-22 17:27:44.404835: step: 516/530, loss: 0.004530169069766998 2023-01-22 17:27:45.486956: step: 520/530, loss: 0.0050271437503397465 2023-01-22 17:27:46.577147: step: 524/530, loss: 0.0059117465279996395 2023-01-22 17:27:47.640898: step: 528/530, loss: 0.007956920191645622 2023-01-22 17:27:48.725383: step: 532/530, loss: 0.00443342886865139 2023-01-22 17:27:49.833072: step: 536/530, loss: 0.0077603361569345 2023-01-22 17:27:50.929274: step: 540/530, loss: 0.04145801439881325 2023-01-22 17:27:52.011941: step: 544/530, loss: 0.0022467821836471558 2023-01-22 17:27:53.111202: step: 548/530, loss: 0.0038608901668339968 2023-01-22 17:27:54.233097: step: 552/530, loss: 0.012951676733791828 2023-01-22 17:27:55.337105: step: 556/530, loss: 0.00817587785422802 2023-01-22 17:27:56.434809: step: 560/530, loss: 0.018627174198627472 2023-01-22 17:27:57.538132: step: 564/530, loss: 0.054581452161073685 2023-01-22 17:27:58.632630: step: 568/530, loss: 0.006028099916875362 2023-01-22 17:27:59.726678: step: 572/530, loss: 0.007498130202293396 2023-01-22 17:28:00.844647: step: 576/530, loss: 0.0036621009930968285 2023-01-22 17:28:01.942026: step: 580/530, loss: 0.02529073692858219 2023-01-22 17:28:03.051145: step: 584/530, loss: 0.003978257533162832 2023-01-22 17:28:04.148212: step: 588/530, loss: 0.023453691974282265 2023-01-22 17:28:05.275602: step: 592/530, loss: 0.004406873136758804 2023-01-22 17:28:06.402929: step: 596/530, loss: 0.00697239488363266 2023-01-22 17:28:07.505070: step: 600/530, loss: 0.003588011721149087 2023-01-22 17:28:08.612420: step: 604/530, loss: 0.006585159804672003 2023-01-22 17:28:09.711414: step: 608/530, loss: 0.0055506532080471516 2023-01-22 17:28:10.809099: step: 612/530, loss: 0.006966990884393454 2023-01-22 17:28:11.906031: step: 616/530, loss: 0.006100517697632313 2023-01-22 17:28:13.014511: step: 620/530, loss: 0.009459367953240871 2023-01-22 17:28:14.107484: step: 624/530, loss: 0.005740609485656023 2023-01-22 17:28:15.199206: step: 628/530, loss: 0.005944130476564169 2023-01-22 17:28:16.289473: step: 632/530, loss: 0.042672835290431976 2023-01-22 17:28:17.391378: step: 636/530, loss: 0.0050724768079817295 2023-01-22 17:28:18.489955: step: 640/530, loss: 0.022977346554398537 2023-01-22 17:28:19.568758: step: 644/530, loss: 0.0024776621721684933 2023-01-22 17:28:20.671078: step: 648/530, loss: 0.00833917036652565 2023-01-22 17:28:21.749464: step: 652/530, loss: 0.003180461237207055 2023-01-22 17:28:22.876008: step: 656/530, loss: 0.009908239357173443 2023-01-22 17:28:23.989239: step: 660/530, loss: 0.010503917932510376 2023-01-22 17:28:25.071486: step: 664/530, loss: 0.0063460045494139194 2023-01-22 17:28:26.173762: step: 668/530, loss: 0.04455850273370743 2023-01-22 17:28:27.281540: step: 672/530, loss: 0.0043808892369270325 2023-01-22 17:28:28.358218: step: 676/530, loss: 0.007582313846796751 2023-01-22 17:28:29.456020: step: 680/530, loss: 0.009835908189415932 2023-01-22 17:28:30.575045: step: 684/530, loss: 0.005511335097253323 2023-01-22 17:28:31.671095: step: 688/530, loss: 0.008358702063560486 2023-01-22 17:28:32.775044: step: 692/530, loss: 0.0029729404486715794 2023-01-22 17:28:33.862244: step: 696/530, loss: 0.034365374594926834 2023-01-22 17:28:34.940323: step: 700/530, loss: 0.008347341790795326 2023-01-22 17:28:36.028472: step: 704/530, loss: 0.0070320009253919125 2023-01-22 17:28:37.109882: step: 708/530, loss: 0.004852325655519962 2023-01-22 17:28:38.219821: step: 712/530, loss: 0.004159483592957258 2023-01-22 17:28:39.299947: step: 716/530, loss: 0.05728793889284134 2023-01-22 17:28:40.387117: step: 720/530, loss: 0.014387681148946285 2023-01-22 17:28:41.452567: step: 724/530, loss: 0.0014776451280340552 2023-01-22 17:28:42.557302: step: 728/530, loss: 0.006308345589786768 2023-01-22 17:28:43.646898: step: 732/530, loss: 0.0032411569263786077 2023-01-22 17:28:44.748938: step: 736/530, loss: 0.022740010172128677 2023-01-22 17:28:45.879950: step: 740/530, loss: 0.0197331253439188 2023-01-22 17:28:46.959333: step: 744/530, loss: 0.004414266441017389 2023-01-22 17:28:48.034658: step: 748/530, loss: 0.00426337867975235 2023-01-22 17:28:49.137528: step: 752/530, loss: 0.006704048719257116 2023-01-22 17:28:50.216962: step: 756/530, loss: 0.002996407449245453 2023-01-22 17:28:51.313708: step: 760/530, loss: 0.02191072888672352 2023-01-22 17:28:52.394603: step: 764/530, loss: 0.008164918050169945 2023-01-22 17:28:53.478824: step: 768/530, loss: 0.0041312649846076965 2023-01-22 17:28:54.566073: step: 772/530, loss: 0.012271516025066376 2023-01-22 17:28:55.669203: step: 776/530, loss: 0.028820911422371864 2023-01-22 17:28:56.744187: step: 780/530, loss: 0.004298738669604063 2023-01-22 17:28:57.857195: step: 784/530, loss: 0.029807010665535927 2023-01-22 17:28:58.950849: step: 788/530, loss: 0.004857347346842289 2023-01-22 17:29:00.059617: step: 792/530, loss: 0.008187413215637207 2023-01-22 17:29:01.181854: step: 796/530, loss: 0.03593704476952553 2023-01-22 17:29:02.278040: step: 800/530, loss: 0.0028564122039824724 2023-01-22 17:29:03.369252: step: 804/530, loss: 0.006321623455733061 2023-01-22 17:29:04.466278: step: 808/530, loss: 0.031741488724946976 2023-01-22 17:29:05.555561: step: 812/530, loss: 0.02111353911459446 2023-01-22 17:29:06.655667: step: 816/530, loss: 0.013843242079019547 2023-01-22 17:29:07.771361: step: 820/530, loss: 0.009732394479215145 2023-01-22 17:29:08.883357: step: 824/530, loss: 0.00735677033662796 2023-01-22 17:29:09.977187: step: 828/530, loss: 0.014589892700314522 2023-01-22 17:29:11.075337: step: 832/530, loss: 0.0028226105496287346 2023-01-22 17:29:12.180944: step: 836/530, loss: 0.0016596870264038444 2023-01-22 17:29:13.273252: step: 840/530, loss: 0.003013663226738572 2023-01-22 17:29:14.351596: step: 844/530, loss: 0.008269528858363628 2023-01-22 17:29:15.444407: step: 848/530, loss: 0.0035748162772506475 2023-01-22 17:29:16.549134: step: 852/530, loss: 0.011307514272630215 2023-01-22 17:29:17.649928: step: 856/530, loss: 0.0037999527994543314 2023-01-22 17:29:18.753568: step: 860/530, loss: 0.005010879132896662 2023-01-22 17:29:19.852941: step: 864/530, loss: 0.030367949977517128 2023-01-22 17:29:20.972333: step: 868/530, loss: 0.005125672556459904 2023-01-22 17:29:22.065825: step: 872/530, loss: 0.005078231915831566 2023-01-22 17:29:23.161181: step: 876/530, loss: 0.0036739930510520935 2023-01-22 17:29:24.256394: step: 880/530, loss: 0.0037847235798835754 2023-01-22 17:29:25.328871: step: 884/530, loss: 0.032393958419561386 2023-01-22 17:29:26.433198: step: 888/530, loss: 0.04867049679160118 2023-01-22 17:29:27.540867: step: 892/530, loss: 0.017797769978642464 2023-01-22 17:29:28.651905: step: 896/530, loss: 0.02136847749352455 2023-01-22 17:29:29.746391: step: 900/530, loss: 0.03316077962517738 2023-01-22 17:29:30.813869: step: 904/530, loss: 0.0027223387733101845 2023-01-22 17:29:31.909496: step: 908/530, loss: 0.0022718573454767466 2023-01-22 17:29:33.010228: step: 912/530, loss: 0.01857251673936844 2023-01-22 17:29:34.089361: step: 916/530, loss: 0.00319062452763319 2023-01-22 17:29:35.177701: step: 920/530, loss: 0.008814864791929722 2023-01-22 17:29:36.270655: step: 924/530, loss: 0.022224988788366318 2023-01-22 17:29:37.378634: step: 928/530, loss: 0.021893490105867386 2023-01-22 17:29:38.465054: step: 932/530, loss: 0.007734906394034624 2023-01-22 17:29:39.578897: step: 936/530, loss: 0.0033426606096327305 2023-01-22 17:29:40.672349: step: 940/530, loss: 0.008457035757601261 2023-01-22 17:29:41.757284: step: 944/530, loss: 0.01598880998790264 2023-01-22 17:29:42.868238: step: 948/530, loss: 0.012407969683408737 2023-01-22 17:29:43.972059: step: 952/530, loss: 0.011005377396941185 2023-01-22 17:29:45.104806: step: 956/530, loss: 0.009087464772164822 2023-01-22 17:29:46.183041: step: 960/530, loss: 0.006762050092220306 2023-01-22 17:29:47.289863: step: 964/530, loss: 0.005455736070871353 2023-01-22 17:29:48.405949: step: 968/530, loss: 0.0029754224233329296 2023-01-22 17:29:49.486301: step: 972/530, loss: 0.013980239629745483 2023-01-22 17:29:50.575268: step: 976/530, loss: 0.010633447207510471 2023-01-22 17:29:51.656573: step: 980/530, loss: 0.009286978282034397 2023-01-22 17:29:52.740681: step: 984/530, loss: 0.005178204737603664 2023-01-22 17:29:53.831049: step: 988/530, loss: 0.01092336792498827 2023-01-22 17:29:54.933490: step: 992/530, loss: 0.005870092660188675 2023-01-22 17:29:56.017916: step: 996/530, loss: 0.004301386419683695 2023-01-22 17:29:57.114100: step: 1000/530, loss: 0.022751811891794205 2023-01-22 17:29:58.193200: step: 1004/530, loss: 0.006232579238712788 2023-01-22 17:29:59.277853: step: 1008/530, loss: 0.06963155418634415 2023-01-22 17:30:00.363128: step: 1012/530, loss: 0.004631880205124617 2023-01-22 17:30:01.473783: step: 1016/530, loss: 0.008173738606274128 2023-01-22 17:30:02.559634: step: 1020/530, loss: 0.0032272457610815763 2023-01-22 17:30:03.653729: step: 1024/530, loss: 0.004275115672498941 2023-01-22 17:30:04.735076: step: 1028/530, loss: 0.008450631983578205 2023-01-22 17:30:05.827553: step: 1032/530, loss: 0.0003325218567624688 2023-01-22 17:30:06.920587: step: 1036/530, loss: 0.011116856709122658 2023-01-22 17:30:07.988230: step: 1040/530, loss: 0.0034582875669002533 2023-01-22 17:30:09.066331: step: 1044/530, loss: 0.0018107590731233358 2023-01-22 17:30:10.157119: step: 1048/530, loss: 0.026982396841049194 2023-01-22 17:30:11.255387: step: 1052/530, loss: 0.002509910613298416 2023-01-22 17:30:12.341758: step: 1056/530, loss: 0.012826124206185341 2023-01-22 17:30:13.427858: step: 1060/530, loss: 0.031740766018629074 2023-01-22 17:30:14.511282: step: 1064/530, loss: 0.028774620965123177 2023-01-22 17:30:15.594671: step: 1068/530, loss: 0.0026212071534246206 2023-01-22 17:30:16.681084: step: 1072/530, loss: 0.0076530794613063335 2023-01-22 17:30:17.750781: step: 1076/530, loss: 0.06592535227537155 2023-01-22 17:30:18.859218: step: 1080/530, loss: 0.0094529427587986 2023-01-22 17:30:19.957640: step: 1084/530, loss: 0.005001086741685867 2023-01-22 17:30:21.050726: step: 1088/530, loss: 0.014370698481798172 2023-01-22 17:30:22.131099: step: 1092/530, loss: 0.0329345166683197 2023-01-22 17:30:23.228770: step: 1096/530, loss: 0.03442564979195595 2023-01-22 17:30:24.319778: step: 1100/530, loss: 0.03979559242725372 2023-01-22 17:30:25.421828: step: 1104/530, loss: 0.007194514852017164 2023-01-22 17:30:26.558094: step: 1108/530, loss: 0.020551208406686783 2023-01-22 17:30:27.670145: step: 1112/530, loss: 0.006106766872107983 2023-01-22 17:30:28.770759: step: 1116/530, loss: 0.003778885118663311 2023-01-22 17:30:29.872967: step: 1120/530, loss: 0.06535742431879044 2023-01-22 17:30:30.950212: step: 1124/530, loss: 0.04842514917254448 2023-01-22 17:30:32.030201: step: 1128/530, loss: 0.06867803633213043 2023-01-22 17:30:33.113286: step: 1132/530, loss: 0.00756215862929821 2023-01-22 17:30:34.212887: step: 1136/530, loss: 0.01421402208507061 2023-01-22 17:30:35.307884: step: 1140/530, loss: 0.034601762890815735 2023-01-22 17:30:36.399793: step: 1144/530, loss: 0.006792508997023106 2023-01-22 17:30:37.496391: step: 1148/530, loss: 0.010737613774836063 2023-01-22 17:30:38.575561: step: 1152/530, loss: 0.01484235655516386 2023-01-22 17:30:39.670622: step: 1156/530, loss: 0.024346277117729187 2023-01-22 17:30:40.765315: step: 1160/530, loss: 0.027085792273283005 2023-01-22 17:30:41.870519: step: 1164/530, loss: 0.0024853956419974566 2023-01-22 17:30:42.982406: step: 1168/530, loss: 0.08352573215961456 2023-01-22 17:30:44.076128: step: 1172/530, loss: 0.03397878259420395 2023-01-22 17:30:45.175945: step: 1176/530, loss: 0.00481100007891655 2023-01-22 17:30:46.303268: step: 1180/530, loss: 0.024954786524176598 2023-01-22 17:30:47.372192: step: 1184/530, loss: 0.03177491948008537 2023-01-22 17:30:48.468025: step: 1188/530, loss: 0.010879147797822952 2023-01-22 17:30:49.554163: step: 1192/530, loss: 0.004253412131220102 2023-01-22 17:30:50.649495: step: 1196/530, loss: 0.003874037181958556 2023-01-22 17:30:51.749370: step: 1200/530, loss: 0.030718030408024788 2023-01-22 17:30:52.836587: step: 1204/530, loss: 0.009647996164858341 2023-01-22 17:30:53.924423: step: 1208/530, loss: 0.013988994993269444 2023-01-22 17:30:55.023986: step: 1212/530, loss: 0.0038821506313979626 2023-01-22 17:30:56.150026: step: 1216/530, loss: 0.007743278983980417 2023-01-22 17:30:57.253349: step: 1220/530, loss: 0.010174600407481194 2023-01-22 17:30:58.321503: step: 1224/530, loss: 0.004546063952147961 2023-01-22 17:30:59.408655: step: 1228/530, loss: 0.03946392983198166 2023-01-22 17:31:00.513898: step: 1232/530, loss: 0.0052576204761862755 2023-01-22 17:31:01.602531: step: 1236/530, loss: 0.00017730020044837147 2023-01-22 17:31:02.689320: step: 1240/530, loss: 0.0027113768737763166 2023-01-22 17:31:03.770577: step: 1244/530, loss: 0.0044046686962246895 2023-01-22 17:31:04.844063: step: 1248/530, loss: 0.004420549608767033 2023-01-22 17:31:05.932858: step: 1252/530, loss: 0.025432948023080826 2023-01-22 17:31:07.039580: step: 1256/530, loss: 0.012925539165735245 2023-01-22 17:31:08.131925: step: 1260/530, loss: 0.004398446064442396 2023-01-22 17:31:09.233185: step: 1264/530, loss: 0.001315298955887556 2023-01-22 17:31:10.321491: step: 1268/530, loss: 0.017206929624080658 2023-01-22 17:31:11.429872: step: 1272/530, loss: 0.00601047370582819 2023-01-22 17:31:12.532838: step: 1276/530, loss: 0.006891086231917143 2023-01-22 17:31:13.591641: step: 1280/530, loss: 0.0047853486612439156 2023-01-22 17:31:14.709960: step: 1284/530, loss: 0.01606903038918972 2023-01-22 17:31:15.772843: step: 1288/530, loss: 0.0858551561832428 2023-01-22 17:31:16.862065: step: 1292/530, loss: 0.04245857521891594 2023-01-22 17:31:17.951982: step: 1296/530, loss: 0.006317073479294777 2023-01-22 17:31:19.055507: step: 1300/530, loss: 0.003843980608507991 2023-01-22 17:31:20.173358: step: 1304/530, loss: 0.004499596543610096 2023-01-22 17:31:21.264958: step: 1308/530, loss: 0.013047484681010246 2023-01-22 17:31:22.363464: step: 1312/530, loss: 0.014584006741642952 2023-01-22 17:31:23.445936: step: 1316/530, loss: 0.004421008750796318 2023-01-22 17:31:24.536489: step: 1320/530, loss: 0.006567663978785276 2023-01-22 17:31:25.636166: step: 1324/530, loss: 0.012001038528978825 2023-01-22 17:31:26.720071: step: 1328/530, loss: 0.006867594551295042 2023-01-22 17:31:27.797408: step: 1332/530, loss: 0.0037352575454860926 2023-01-22 17:31:28.861372: step: 1336/530, loss: 0.0037329038605093956 2023-01-22 17:31:29.948223: step: 1340/530, loss: 0.003762504318729043 2023-01-22 17:31:31.060653: step: 1344/530, loss: 0.011309497058391571 2023-01-22 17:31:32.152503: step: 1348/530, loss: 0.011775614693760872 2023-01-22 17:31:33.242949: step: 1352/530, loss: 0.01116671971976757 2023-01-22 17:31:34.322417: step: 1356/530, loss: 0.009452038444578648 2023-01-22 17:31:35.421173: step: 1360/530, loss: 0.0030575324781239033 2023-01-22 17:31:36.503538: step: 1364/530, loss: 0.006513847969472408 2023-01-22 17:31:37.571708: step: 1368/530, loss: 0.0021709268912672997 2023-01-22 17:31:38.651546: step: 1372/530, loss: 0.0028043787460774183 2023-01-22 17:31:39.760094: step: 1376/530, loss: 0.002050436334684491 2023-01-22 17:31:40.840713: step: 1380/530, loss: 0.007309226784855127 2023-01-22 17:31:41.932672: step: 1384/530, loss: 0.0631498470902443 2023-01-22 17:31:43.021199: step: 1388/530, loss: 0.009299755096435547 2023-01-22 17:31:44.106025: step: 1392/530, loss: 0.0006266501150093973 2023-01-22 17:31:45.173739: step: 1396/530, loss: 0.002885455032810569 2023-01-22 17:31:46.263600: step: 1400/530, loss: 0.027987513691186905 2023-01-22 17:31:47.342990: step: 1404/530, loss: 0.006226013880223036 2023-01-22 17:31:48.419696: step: 1408/530, loss: 0.003627366153523326 2023-01-22 17:31:49.543451: step: 1412/530, loss: 0.0046201786026358604 2023-01-22 17:31:50.648284: step: 1416/530, loss: 0.026542022824287415 2023-01-22 17:31:51.724712: step: 1420/530, loss: 0.006074593402445316 2023-01-22 17:31:52.794021: step: 1424/530, loss: 0.003745131194591522 2023-01-22 17:31:53.884575: step: 1428/530, loss: 0.038597483187913895 2023-01-22 17:31:54.980622: step: 1432/530, loss: 0.032367486506700516 2023-01-22 17:31:56.048785: step: 1436/530, loss: 0.005088086239993572 2023-01-22 17:31:57.116290: step: 1440/530, loss: 0.010617496445775032 2023-01-22 17:31:58.220055: step: 1444/530, loss: 0.010132071562111378 2023-01-22 17:31:59.315272: step: 1448/530, loss: 0.008153957314789295 2023-01-22 17:32:00.408563: step: 1452/530, loss: 0.00618277071043849 2023-01-22 17:32:01.488714: step: 1456/530, loss: 0.0038366348017007113 2023-01-22 17:32:02.597418: step: 1460/530, loss: 0.023068279027938843 2023-01-22 17:32:03.688961: step: 1464/530, loss: 0.008380578830838203 2023-01-22 17:32:04.779766: step: 1468/530, loss: 0.03498849272727966 2023-01-22 17:32:05.889052: step: 1472/530, loss: 0.004794488660991192 2023-01-22 17:32:06.967521: step: 1476/530, loss: 0.013601918704807758 2023-01-22 17:32:08.049248: step: 1480/530, loss: 0.03223627805709839 2023-01-22 17:32:09.148858: step: 1484/530, loss: 0.004585186019539833 2023-01-22 17:32:10.244182: step: 1488/530, loss: 0.012364663183689117 2023-01-22 17:32:11.321275: step: 1492/530, loss: 0.005103865638375282 2023-01-22 17:32:12.417491: step: 1496/530, loss: 0.014150340110063553 2023-01-22 17:32:13.486617: step: 1500/530, loss: 0.01660972833633423 2023-01-22 17:32:14.601010: step: 1504/530, loss: 0.004308665636926889 2023-01-22 17:32:15.694069: step: 1508/530, loss: 0.019259531050920486 2023-01-22 17:32:16.756687: step: 1512/530, loss: 0.0035142023116350174 2023-01-22 17:32:17.867520: step: 1516/530, loss: 0.008946807123720646 2023-01-22 17:32:18.965264: step: 1520/530, loss: 0.016206560656428337 2023-01-22 17:32:20.042141: step: 1524/530, loss: 0.01725117862224579 2023-01-22 17:32:21.120143: step: 1528/530, loss: 0.004326906520873308 2023-01-22 17:32:22.253182: step: 1532/530, loss: 0.0019213708583265543 2023-01-22 17:32:23.333840: step: 1536/530, loss: 0.008800514973700047 2023-01-22 17:32:24.412724: step: 1540/530, loss: 0.005787848029285669 2023-01-22 17:32:25.508181: step: 1544/530, loss: 0.007245591841638088 2023-01-22 17:32:26.594854: step: 1548/530, loss: 0.011111351661384106 2023-01-22 17:32:27.689487: step: 1552/530, loss: 0.002489902311936021 2023-01-22 17:32:28.785733: step: 1556/530, loss: 0.008993119932711124 2023-01-22 17:32:29.906213: step: 1560/530, loss: 0.010299931280314922 2023-01-22 17:32:30.983968: step: 1564/530, loss: 0.03347787633538246 2023-01-22 17:32:32.083327: step: 1568/530, loss: 0.02024606615304947 2023-01-22 17:32:33.173207: step: 1572/530, loss: 0.0033000423572957516 2023-01-22 17:32:34.285246: step: 1576/530, loss: 0.017095889896154404 2023-01-22 17:32:35.368302: step: 1580/530, loss: 0.09861433506011963 2023-01-22 17:32:36.463738: step: 1584/530, loss: 0.008935102261602879 2023-01-22 17:32:37.565428: step: 1588/530, loss: 0.008086437359452248 2023-01-22 17:32:38.653062: step: 1592/530, loss: 0.0017422897508367896 2023-01-22 17:32:39.728349: step: 1596/530, loss: 0.023042909801006317 2023-01-22 17:32:40.824148: step: 1600/530, loss: 0.008903463371098042 2023-01-22 17:32:41.925819: step: 1604/530, loss: 0.008396804332733154 2023-01-22 17:32:42.979316: step: 1608/530, loss: 0.005524285603314638 2023-01-22 17:32:44.072338: step: 1612/530, loss: 0.022530753165483475 2023-01-22 17:32:45.162049: step: 1616/530, loss: 0.016370324417948723 2023-01-22 17:32:46.246684: step: 1620/530, loss: 0.04579024389386177 2023-01-22 17:32:47.345892: step: 1624/530, loss: 0.007668602745980024 2023-01-22 17:32:48.444770: step: 1628/530, loss: 0.003944729920476675 2023-01-22 17:32:49.509726: step: 1632/530, loss: 0.0032784356735646725 2023-01-22 17:32:50.599989: step: 1636/530, loss: 0.005256242118775845 2023-01-22 17:32:51.708953: step: 1640/530, loss: 0.005322916433215141 2023-01-22 17:32:52.798633: step: 1644/530, loss: 0.0020510840695351362 2023-01-22 17:32:53.918428: step: 1648/530, loss: 0.004503228235989809 2023-01-22 17:32:54.998705: step: 1652/530, loss: 0.015600706450641155 2023-01-22 17:32:56.087724: step: 1656/530, loss: 0.008826656267046928 2023-01-22 17:32:57.158850: step: 1660/530, loss: 0.0005036370130255818 2023-01-22 17:32:58.252757: step: 1664/530, loss: 0.047386832535266876 2023-01-22 17:32:59.361380: step: 1668/530, loss: 0.023287741467356682 2023-01-22 17:33:00.483746: step: 1672/530, loss: 0.007491467986255884 2023-01-22 17:33:01.576180: step: 1676/530, loss: 0.004142443649470806 2023-01-22 17:33:02.658071: step: 1680/530, loss: 0.007098161615431309 2023-01-22 17:33:03.735290: step: 1684/530, loss: 0.002737255534157157 2023-01-22 17:33:04.838605: step: 1688/530, loss: 0.03544925898313522 2023-01-22 17:33:05.921256: step: 1692/530, loss: 0.03142731636762619 2023-01-22 17:33:07.017260: step: 1696/530, loss: 0.032398588955402374 2023-01-22 17:33:08.110783: step: 1700/530, loss: 0.0012969091767445207 2023-01-22 17:33:09.206700: step: 1704/530, loss: 0.002732472028583288 2023-01-22 17:33:10.291710: step: 1708/530, loss: 0.04723600298166275 2023-01-22 17:33:11.379669: step: 1712/530, loss: 0.00844617560505867 2023-01-22 17:33:12.473749: step: 1716/530, loss: 0.0008941101841628551 2023-01-22 17:33:13.591355: step: 1720/530, loss: 0.020552800968289375 2023-01-22 17:33:14.687597: step: 1724/530, loss: 0.009452478028833866 2023-01-22 17:33:15.804124: step: 1728/530, loss: 0.015093473717570305 2023-01-22 17:33:16.937938: step: 1732/530, loss: 0.029983708634972572 2023-01-22 17:33:18.045196: step: 1736/530, loss: 0.014131785370409489 2023-01-22 17:33:19.114420: step: 1740/530, loss: 0.009197235107421875 2023-01-22 17:33:20.217891: step: 1744/530, loss: 0.010480126366019249 2023-01-22 17:33:21.289614: step: 1748/530, loss: 0.009321744553744793 2023-01-22 17:33:22.395405: step: 1752/530, loss: 0.009413870051503181 2023-01-22 17:33:23.512839: step: 1756/530, loss: 0.01103140227496624 2023-01-22 17:33:24.594065: step: 1760/530, loss: 0.007739428896456957 2023-01-22 17:33:25.678015: step: 1764/530, loss: 0.01679868996143341 2023-01-22 17:33:26.770736: step: 1768/530, loss: 0.010832425206899643 2023-01-22 17:33:27.843814: step: 1772/530, loss: 0.0047462922520935535 2023-01-22 17:33:28.934370: step: 1776/530, loss: 0.004021686967462301 2023-01-22 17:33:30.006776: step: 1780/530, loss: 0.0 2023-01-22 17:33:31.086424: step: 1784/530, loss: 0.005754449404776096 2023-01-22 17:33:32.181999: step: 1788/530, loss: 0.030051853507757187 2023-01-22 17:33:33.292872: step: 1792/530, loss: 0.07881727069616318 2023-01-22 17:33:34.381906: step: 1796/530, loss: 0.006806483957916498 2023-01-22 17:33:35.501499: step: 1800/530, loss: 0.029210636392235756 2023-01-22 17:33:36.595471: step: 1804/530, loss: 0.0006344731664285064 2023-01-22 17:33:37.683952: step: 1808/530, loss: 0.005361342802643776 2023-01-22 17:33:38.765607: step: 1812/530, loss: 0.008182952180504799 2023-01-22 17:33:39.849512: step: 1816/530, loss: 0.004938941914588213 2023-01-22 17:33:40.951729: step: 1820/530, loss: 0.012819604948163033 2023-01-22 17:33:42.057730: step: 1824/530, loss: 0.049621012061834335 2023-01-22 17:33:43.153232: step: 1828/530, loss: 0.004920081701129675 2023-01-22 17:33:44.250084: step: 1832/530, loss: 0.04681029170751572 2023-01-22 17:33:45.378785: step: 1836/530, loss: 0.010457811877131462 2023-01-22 17:33:46.498510: step: 1840/530, loss: 0.004233458545058966 2023-01-22 17:33:47.579727: step: 1844/530, loss: 0.025596261024475098 2023-01-22 17:33:48.648295: step: 1848/530, loss: 0.00549063365906477 2023-01-22 17:33:49.735487: step: 1852/530, loss: 0.00705106183886528 2023-01-22 17:33:50.818336: step: 1856/530, loss: 0.0004364947963040322 2023-01-22 17:33:51.927620: step: 1860/530, loss: 0.01021557580679655 2023-01-22 17:33:53.019301: step: 1864/530, loss: 0.0017422246746718884 2023-01-22 17:33:54.102196: step: 1868/530, loss: 0.0041860612109303474 2023-01-22 17:33:55.173933: step: 1872/530, loss: 0.04310573637485504 2023-01-22 17:33:56.291029: step: 1876/530, loss: 0.020023928955197334 2023-01-22 17:33:57.386150: step: 1880/530, loss: 0.00489689689129591 2023-01-22 17:33:58.484727: step: 1884/530, loss: 0.027558067813515663 2023-01-22 17:33:59.589969: step: 1888/530, loss: 0.006431622430682182 2023-01-22 17:34:00.681903: step: 1892/530, loss: 0.021379824727773666 2023-01-22 17:34:01.756208: step: 1896/530, loss: 0.009161487221717834 2023-01-22 17:34:02.834609: step: 1900/530, loss: 0.008073671720921993 2023-01-22 17:34:03.912457: step: 1904/530, loss: 0.004906642250716686 2023-01-22 17:34:04.990878: step: 1908/530, loss: 0.0034442346077412367 2023-01-22 17:34:06.070359: step: 1912/530, loss: 0.0037114170845597982 2023-01-22 17:34:07.152757: step: 1916/530, loss: 0.0037614472676068544 2023-01-22 17:34:08.207015: step: 1920/530, loss: 0.029696006327867508 2023-01-22 17:34:09.303694: step: 1924/530, loss: 0.011749030090868473 2023-01-22 17:34:10.382238: step: 1928/530, loss: 0.011213784106075764 2023-01-22 17:34:11.470099: step: 1932/530, loss: 0.0029136526864022017 2023-01-22 17:34:12.598269: step: 1936/530, loss: 0.0045543755404651165 2023-01-22 17:34:13.677550: step: 1940/530, loss: 0.013390528038144112 2023-01-22 17:34:14.771919: step: 1944/530, loss: 0.017309991642832756 2023-01-22 17:34:15.919171: step: 1948/530, loss: 0.05734814703464508 2023-01-22 17:34:17.008431: step: 1952/530, loss: 0.01196904294192791 2023-01-22 17:34:18.071028: step: 1956/530, loss: 0.022607866674661636 2023-01-22 17:34:19.156900: step: 1960/530, loss: 0.018757633864879608 2023-01-22 17:34:20.260853: step: 1964/530, loss: 0.009620281867682934 2023-01-22 17:34:21.374977: step: 1968/530, loss: 0.005232736933976412 2023-01-22 17:34:22.503288: step: 1972/530, loss: 0.008973057381808758 2023-01-22 17:34:23.586071: step: 1976/530, loss: 0.0034213506150990725 2023-01-22 17:34:24.686410: step: 1980/530, loss: 0.006188738625496626 2023-01-22 17:34:25.780807: step: 1984/530, loss: 0.004274419974535704 2023-01-22 17:34:26.873829: step: 1988/530, loss: 0.0032662139274179935 2023-01-22 17:34:27.965713: step: 1992/530, loss: 0.003156520426273346 2023-01-22 17:34:29.042994: step: 1996/530, loss: 0.010001575574278831 2023-01-22 17:34:30.153538: step: 2000/530, loss: 0.010153896175324917 2023-01-22 17:34:31.236288: step: 2004/530, loss: 0.02358771115541458 2023-01-22 17:34:32.327677: step: 2008/530, loss: 0.006304414942860603 2023-01-22 17:34:33.426952: step: 2012/530, loss: 0.027232374995946884 2023-01-22 17:34:34.515643: step: 2016/530, loss: 0.0059166159480810165 2023-01-22 17:34:35.601951: step: 2020/530, loss: 0.002335348166525364 2023-01-22 17:34:36.689389: step: 2024/530, loss: 0.005618598777800798 2023-01-22 17:34:37.782762: step: 2028/530, loss: 0.008079351857304573 2023-01-22 17:34:38.883463: step: 2032/530, loss: 0.0045247129164636135 2023-01-22 17:34:39.965124: step: 2036/530, loss: 0.018133796751499176 2023-01-22 17:34:41.052135: step: 2040/530, loss: 0.007943114265799522 2023-01-22 17:34:42.130899: step: 2044/530, loss: 0.014843118377029896 2023-01-22 17:34:43.214902: step: 2048/530, loss: 0.0059630656614899635 2023-01-22 17:34:44.317709: step: 2052/530, loss: 0.006998266093432903 2023-01-22 17:34:45.410391: step: 2056/530, loss: 0.012137621641159058 2023-01-22 17:34:46.487972: step: 2060/530, loss: 0.002685179701074958 2023-01-22 17:34:47.597991: step: 2064/530, loss: 0.005768399219959974 2023-01-22 17:34:48.700665: step: 2068/530, loss: 0.019703621044754982 2023-01-22 17:34:49.821502: step: 2072/530, loss: 0.0068180011585354805 2023-01-22 17:34:50.917410: step: 2076/530, loss: 0.0011532928328961134 2023-01-22 17:34:52.008274: step: 2080/530, loss: 0.007384370546787977 2023-01-22 17:34:53.117073: step: 2084/530, loss: 0.00564651470631361 2023-01-22 17:34:54.193159: step: 2088/530, loss: 0.004955998156219721 2023-01-22 17:34:55.301137: step: 2092/530, loss: 0.006114862393587828 2023-01-22 17:34:56.388731: step: 2096/530, loss: 0.006418767850846052 2023-01-22 17:34:57.464461: step: 2100/530, loss: 0.003920678980648518 2023-01-22 17:34:58.551239: step: 2104/530, loss: 0.0072768740355968475 2023-01-22 17:34:59.648295: step: 2108/530, loss: 0.006788167636841536 2023-01-22 17:35:00.769998: step: 2112/530, loss: 0.0168886911123991 2023-01-22 17:35:01.864959: step: 2116/530, loss: 0.012799182906746864 2023-01-22 17:35:02.976673: step: 2120/530, loss: 0.089204341173172 ================================================== Loss: 0.013 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33298328673106253, 'r': 0.3550979262672811, 'f1': 0.34368522891250164}, 'combined': 0.25324174761973806, 'stategy': 1, 'epoch': 2} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3335734214933513, 'r': 0.28507164804179574, 'f1': 0.3074212652482725}, 'combined': 0.19092478578576927, 'stategy': 1, 'epoch': 2} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3442776211104259, 'r': 0.3403579517998708, 'f1': 0.3423065660277327}, 'combined': 0.2522258907572767, 'stategy': 1, 'epoch': 2} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.32101106394999596, 'r': 0.2873541175813515, 'f1': 0.3032515792011966}, 'combined': 0.18833519129337475, 'stategy': 1, 'epoch': 2} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33685551847137524, 'r': 0.32471082235950405, 'f1': 0.3306716973593404}, 'combined': 0.24365282963319815, 'stategy': 1, 'epoch': 2} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34500193493964737, 'r': 0.2928940415084864, 'f1': 0.3168197160150526}, 'combined': 0.1967617183672432, 'stategy': 1, 'epoch': 2} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3138888888888889, 'r': 0.4035714285714286, 'f1': 0.35312499999999997}, 'combined': 0.23541666666666664, 'stategy': 1, 'epoch': 2} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.36363636363636365, 'r': 0.5217391304347826, 'f1': 0.42857142857142855}, 'combined': 0.21428571428571427, 'stategy': 1, 'epoch': 2} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 2} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34074334029772785, 'r': 0.3536747763621578, 'f1': 0.34708865389731314}, 'combined': 0.2557495344506518, 'stategy': 1, 'epoch': 1} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33347831328300875, 'r': 0.2823515689122211, 'f1': 0.30579264720970056}, 'combined': 0.1899133282670772, 'stategy': 1, 'epoch': 1} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 1} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.35259574920970843, 'r': 0.339883568498163, 'f1': 0.34612297700199396}, 'combined': 0.2550379830541008, 'stategy': 1, 'epoch': 1} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.31976221915024255, 'r': 0.2833896620757837, 'f1': 0.30047923267815135}, 'combined': 0.18661341818958874, 'stategy': 1, 'epoch': 1} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3870967741935484, 'r': 0.5217391304347826, 'f1': 0.4444444444444444}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 1} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3422990007715465, 'r': 0.32281328915267293, 'f1': 0.3322707097333176}, 'combined': 0.24483104927718138, 'stategy': 1, 'epoch': 1} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34442683573720273, 'r': 0.2894000631638035, 'f1': 0.31452482748992144}, 'combined': 0.19533647180953018, 'stategy': 1, 'epoch': 1} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 1} ****************************** Epoch: 3 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 17:37:34.607963: step: 4/530, loss: 0.002227536402642727 2023-01-22 17:37:35.685528: step: 8/530, loss: 0.016790607944130898 2023-01-22 17:37:36.758141: step: 12/530, loss: 0.004460806958377361 2023-01-22 17:37:37.840234: step: 16/530, loss: 0.0032792179845273495 2023-01-22 17:37:38.910148: step: 20/530, loss: 0.003597506321966648 2023-01-22 17:37:39.990669: step: 24/530, loss: 0.010008974000811577 2023-01-22 17:37:41.090765: step: 28/530, loss: 0.009772967547178268 2023-01-22 17:37:42.174065: step: 32/530, loss: 0.009915060363709927 2023-01-22 17:37:43.280067: step: 36/530, loss: 0.006194828078150749 2023-01-22 17:37:44.392157: step: 40/530, loss: 0.00501536438241601 2023-01-22 17:37:45.492273: step: 44/530, loss: 0.006514077540487051 2023-01-22 17:37:46.598787: step: 48/530, loss: 0.013056674972176552 2023-01-22 17:37:47.673890: step: 52/530, loss: 0.0034928987734019756 2023-01-22 17:37:48.756926: step: 56/530, loss: 0.01233162172138691 2023-01-22 17:37:49.824459: step: 60/530, loss: 0.00442137848585844 2023-01-22 17:37:50.880164: step: 64/530, loss: 0.002346806926652789 2023-01-22 17:37:51.980168: step: 68/530, loss: 0.030737319961190224 2023-01-22 17:37:53.065418: step: 72/530, loss: 0.009473285637795925 2023-01-22 17:37:54.182123: step: 76/530, loss: 0.029489140957593918 2023-01-22 17:37:55.259174: step: 80/530, loss: 0.006130874156951904 2023-01-22 17:37:56.344014: step: 84/530, loss: 0.00369679881259799 2023-01-22 17:37:57.427200: step: 88/530, loss: 0.04161631315946579 2023-01-22 17:37:58.514622: step: 92/530, loss: 0.057136762887239456 2023-01-22 17:37:59.614449: step: 96/530, loss: 0.0024038327392190695 2023-01-22 17:38:00.730881: step: 100/530, loss: 0.006832140497863293 2023-01-22 17:38:01.811198: step: 104/530, loss: 0.04319263994693756 2023-01-22 17:38:02.917992: step: 108/530, loss: 0.007719225715845823 2023-01-22 17:38:04.031296: step: 112/530, loss: 0.03820951282978058 2023-01-22 17:38:05.111716: step: 116/530, loss: 0.007090891245752573 2023-01-22 17:38:06.198175: step: 120/530, loss: 0.0029282455798238516 2023-01-22 17:38:07.296841: step: 124/530, loss: 0.0031002552714198828 2023-01-22 17:38:08.369290: step: 128/530, loss: 0.01766994036734104 2023-01-22 17:38:09.486063: step: 132/530, loss: 0.10048720985651016 2023-01-22 17:38:10.578249: step: 136/530, loss: 0.007003552280366421 2023-01-22 17:38:11.654431: step: 140/530, loss: 0.0016844915226101875 2023-01-22 17:38:12.733500: step: 144/530, loss: 0.0023643632885068655 2023-01-22 17:38:13.827643: step: 148/530, loss: 0.004746571183204651 2023-01-22 17:38:14.927583: step: 152/530, loss: 0.004188341088593006 2023-01-22 17:38:16.031528: step: 156/530, loss: 0.013090483844280243 2023-01-22 17:38:17.137187: step: 160/530, loss: 0.0031739817932248116 2023-01-22 17:38:18.217757: step: 164/530, loss: 0.005898940376937389 2023-01-22 17:38:19.297336: step: 168/530, loss: 0.02599339932203293 2023-01-22 17:38:20.416285: step: 172/530, loss: 0.010433711111545563 2023-01-22 17:38:21.508895: step: 176/530, loss: 0.016894489526748657 2023-01-22 17:38:22.601161: step: 180/530, loss: 0.0037484883796423674 2023-01-22 17:38:23.717584: step: 184/530, loss: 0.040714994072914124 2023-01-22 17:38:24.805673: step: 188/530, loss: 0.00013284954184200615 2023-01-22 17:38:25.906673: step: 192/530, loss: 0.009761529043316841 2023-01-22 17:38:26.986482: step: 196/530, loss: 0.0040414780378341675 2023-01-22 17:38:28.085854: step: 200/530, loss: 0.0032499758526682854 2023-01-22 17:38:29.191845: step: 204/530, loss: 0.006838515866547823 2023-01-22 17:38:30.288523: step: 208/530, loss: 0.0016300976276397705 2023-01-22 17:38:31.375947: step: 212/530, loss: 0.017263047397136688 2023-01-22 17:38:32.484720: step: 216/530, loss: 0.005723776761442423 2023-01-22 17:38:33.563285: step: 220/530, loss: 0.007065284997224808 2023-01-22 17:38:34.683380: step: 224/530, loss: 0.0019440948963165283 2023-01-22 17:38:35.780425: step: 228/530, loss: 0.0034122595097869635 2023-01-22 17:38:36.881351: step: 232/530, loss: 0.014555097557604313 2023-01-22 17:38:37.976791: step: 236/530, loss: 0.029644416645169258 2023-01-22 17:38:39.068171: step: 240/530, loss: 0.009609824046492577 2023-01-22 17:38:40.168056: step: 244/530, loss: 0.00654362328350544 2023-01-22 17:38:41.317602: step: 248/530, loss: 0.061627987772226334 2023-01-22 17:38:42.411341: step: 252/530, loss: 0.03641989454627037 2023-01-22 17:38:43.510672: step: 256/530, loss: 0.004374881274998188 2023-01-22 17:38:44.636318: step: 260/530, loss: 0.030204875394701958 2023-01-22 17:38:45.725382: step: 264/530, loss: 0.004012828227132559 2023-01-22 17:38:46.820798: step: 268/530, loss: 0.006058164872229099 2023-01-22 17:38:47.909867: step: 272/530, loss: 0.002543671755120158 2023-01-22 17:38:48.998038: step: 276/530, loss: 0.006091054528951645 2023-01-22 17:38:50.118353: step: 280/530, loss: 0.024719322100281715 2023-01-22 17:38:51.204842: step: 284/530, loss: 0.014802731573581696 2023-01-22 17:38:52.342345: step: 288/530, loss: 0.014300837181508541 2023-01-22 17:38:53.457644: step: 292/530, loss: 0.009814117103815079 2023-01-22 17:38:54.572053: step: 296/530, loss: 0.0059904539957642555 2023-01-22 17:38:55.670522: step: 300/530, loss: 0.023650934919714928 2023-01-22 17:38:56.753400: step: 304/530, loss: 0.009037637151777744 2023-01-22 17:38:57.861559: step: 308/530, loss: 0.014698131009936333 2023-01-22 17:38:58.945467: step: 312/530, loss: 0.00847918912768364 2023-01-22 17:39:00.029327: step: 316/530, loss: 0.01754039339721203 2023-01-22 17:39:01.096404: step: 320/530, loss: 0.00804224144667387 2023-01-22 17:39:02.192947: step: 324/530, loss: 0.005646221339702606 2023-01-22 17:39:03.296941: step: 328/530, loss: 0.004300011321902275 2023-01-22 17:39:04.420384: step: 332/530, loss: 0.005537185352295637 2023-01-22 17:39:05.499617: step: 336/530, loss: 0.012691509909927845 2023-01-22 17:39:06.584408: step: 340/530, loss: 0.009244035929441452 2023-01-22 17:39:07.667781: step: 344/530, loss: 0.003927251324057579 2023-01-22 17:39:08.754453: step: 348/530, loss: 0.011134376749396324 2023-01-22 17:39:09.855241: step: 352/530, loss: 0.009228087030351162 2023-01-22 17:39:10.939999: step: 356/530, loss: 0.005150577053427696 2023-01-22 17:39:12.055729: step: 360/530, loss: 0.006937472149729729 2023-01-22 17:39:13.148186: step: 364/530, loss: 0.0025320244021713734 2023-01-22 17:39:14.219379: step: 368/530, loss: 0.009534927085042 2023-01-22 17:39:15.335661: step: 372/530, loss: 0.00988983828574419 2023-01-22 17:39:16.440749: step: 376/530, loss: 0.004799413960427046 2023-01-22 17:39:17.523457: step: 380/530, loss: 0.004854446742683649 2023-01-22 17:39:18.609458: step: 384/530, loss: 0.0008865715935826302 2023-01-22 17:39:19.742853: step: 388/530, loss: 0.010974948294460773 2023-01-22 17:39:20.836489: step: 392/530, loss: 0.005058357026427984 2023-01-22 17:39:21.929319: step: 396/530, loss: 0.0010100967483595014 2023-01-22 17:39:23.023866: step: 400/530, loss: 0.019582092761993408 2023-01-22 17:39:24.115072: step: 404/530, loss: 0.0027957975398749113 2023-01-22 17:39:25.221286: step: 408/530, loss: 0.009675396606326103 2023-01-22 17:39:26.313406: step: 412/530, loss: 0.005329884588718414 2023-01-22 17:39:27.427264: step: 416/530, loss: 0.010127348825335503 2023-01-22 17:39:28.528783: step: 420/530, loss: 0.006457071285694838 2023-01-22 17:39:29.628776: step: 424/530, loss: 0.029611095786094666 2023-01-22 17:39:30.749107: step: 428/530, loss: 0.015631312504410744 2023-01-22 17:39:31.832279: step: 432/530, loss: 0.006112556904554367 2023-01-22 17:39:32.938113: step: 436/530, loss: 0.0060873571783304214 2023-01-22 17:39:34.025732: step: 440/530, loss: 0.002243014285340905 2023-01-22 17:39:35.118165: step: 444/530, loss: 0.01817476376891136 2023-01-22 17:39:36.217464: step: 448/530, loss: 0.00849417969584465 2023-01-22 17:39:37.315023: step: 452/530, loss: 0.005257307086139917 2023-01-22 17:39:38.414946: step: 456/530, loss: 0.005071935709565878 2023-01-22 17:39:39.512374: step: 460/530, loss: 0.007713960018008947 2023-01-22 17:39:40.613296: step: 464/530, loss: 0.0037115723825991154 2023-01-22 17:39:41.701792: step: 468/530, loss: 0.0075607746839523315 2023-01-22 17:39:42.799922: step: 472/530, loss: 0.008396073244512081 2023-01-22 17:39:43.910099: step: 476/530, loss: 0.003240798832848668 2023-01-22 17:39:44.981249: step: 480/530, loss: 0.0022829517256468534 2023-01-22 17:39:46.097152: step: 484/530, loss: 0.0071618156507611275 2023-01-22 17:39:47.200885: step: 488/530, loss: 0.0022120859939604998 2023-01-22 17:39:48.282758: step: 492/530, loss: 0.005249615292996168 2023-01-22 17:39:49.374656: step: 496/530, loss: 0.008912590332329273 2023-01-22 17:39:50.490815: step: 500/530, loss: 0.004269557073712349 2023-01-22 17:39:51.574915: step: 504/530, loss: 0.004679122939705849 2023-01-22 17:39:52.675177: step: 508/530, loss: 0.002990277949720621 2023-01-22 17:39:53.777570: step: 512/530, loss: 0.008443482220172882 2023-01-22 17:39:54.887510: step: 516/530, loss: 0.002614922821521759 2023-01-22 17:39:55.972666: step: 520/530, loss: 0.015633730217814445 2023-01-22 17:39:57.083721: step: 524/530, loss: 0.010473628528416157 2023-01-22 17:39:58.174861: step: 528/530, loss: 0.0025497088208794594 2023-01-22 17:39:59.259448: step: 532/530, loss: 0.0094808554276824 2023-01-22 17:40:00.363463: step: 536/530, loss: 0.03716466948390007 2023-01-22 17:40:01.460632: step: 540/530, loss: 0.00557212857529521 2023-01-22 17:40:02.571390: step: 544/530, loss: 0.009412577375769615 2023-01-22 17:40:03.652181: step: 548/530, loss: 0.013018887490034103 2023-01-22 17:40:04.755569: step: 552/530, loss: 0.008328845724463463 2023-01-22 17:40:05.825794: step: 556/530, loss: 0.005064348690211773 2023-01-22 17:40:06.922559: step: 560/530, loss: 0.006493042688816786 2023-01-22 17:40:08.038690: step: 564/530, loss: 0.013318916782736778 2023-01-22 17:40:09.150735: step: 568/530, loss: 0.005416987929493189 2023-01-22 17:40:10.232980: step: 572/530, loss: 0.006717041600495577 2023-01-22 17:40:11.331340: step: 576/530, loss: 0.0030994806438684464 2023-01-22 17:40:12.452975: step: 580/530, loss: 0.006757744122296572 2023-01-22 17:40:13.542116: step: 584/530, loss: 0.008027574978768826 2023-01-22 17:40:14.656535: step: 588/530, loss: 0.007547580637037754 2023-01-22 17:40:15.745703: step: 592/530, loss: 0.0038620911072939634 2023-01-22 17:40:16.859703: step: 596/530, loss: 0.006576234009116888 2023-01-22 17:40:17.938176: step: 600/530, loss: 0.009168741293251514 2023-01-22 17:40:19.026399: step: 604/530, loss: 0.008811403065919876 2023-01-22 17:40:20.123786: step: 608/530, loss: 0.006936532910913229 2023-01-22 17:40:21.218906: step: 612/530, loss: 0.011735818348824978 2023-01-22 17:40:22.312246: step: 616/530, loss: 0.04981715977191925 2023-01-22 17:40:23.412598: step: 620/530, loss: 0.016454385593533516 2023-01-22 17:40:24.494340: step: 624/530, loss: 0.030957506969571114 2023-01-22 17:40:25.609388: step: 628/530, loss: 0.0008294227300211787 2023-01-22 17:40:26.714021: step: 632/530, loss: 0.01704142801463604 2023-01-22 17:40:27.817824: step: 636/530, loss: 0.02974986471235752 2023-01-22 17:40:28.901169: step: 640/530, loss: 0.004496879409998655 2023-01-22 17:40:29.982561: step: 644/530, loss: 0.0016910843551158905 2023-01-22 17:40:31.059520: step: 648/530, loss: 0.008565268479287624 2023-01-22 17:40:32.175337: step: 652/530, loss: 0.01379690133035183 2023-01-22 17:40:33.264244: step: 656/530, loss: 0.010884171351790428 2023-01-22 17:40:34.356897: step: 660/530, loss: 0.009911797009408474 2023-01-22 17:40:35.446393: step: 664/530, loss: 0.0036713872104883194 2023-01-22 17:40:36.525537: step: 668/530, loss: 0.015017013065516949 2023-01-22 17:40:37.610489: step: 672/530, loss: 0.01850060746073723 2023-01-22 17:40:38.693956: step: 676/530, loss: 0.028786921873688698 2023-01-22 17:40:39.782272: step: 680/530, loss: 0.004183605313301086 2023-01-22 17:40:40.880712: step: 684/530, loss: 0.0015425084857270122 2023-01-22 17:40:42.027256: step: 688/530, loss: 0.006054719444364309 2023-01-22 17:40:43.154970: step: 692/530, loss: 0.0034743899013847113 2023-01-22 17:40:44.253563: step: 696/530, loss: 0.00018592907872516662 2023-01-22 17:40:45.360027: step: 700/530, loss: 0.007415073923766613 2023-01-22 17:40:46.468824: step: 704/530, loss: 0.006361925508826971 2023-01-22 17:40:47.558531: step: 708/530, loss: 0.0045522344298660755 2023-01-22 17:40:48.649601: step: 712/530, loss: 0.005137616768479347 2023-01-22 17:40:49.711411: step: 716/530, loss: 0.003768669441342354 2023-01-22 17:40:50.796682: step: 720/530, loss: 0.0023649167269468307 2023-01-22 17:40:51.869969: step: 724/530, loss: 0.0017330496339127421 2023-01-22 17:40:52.950055: step: 728/530, loss: 0.0021172247361391783 2023-01-22 17:40:54.048052: step: 732/530, loss: 0.00999140739440918 2023-01-22 17:40:55.127081: step: 736/530, loss: 0.0037728685420006514 2023-01-22 17:40:56.217291: step: 740/530, loss: 0.009008875116705894 2023-01-22 17:40:57.340451: step: 744/530, loss: 0.003614150919020176 2023-01-22 17:40:58.421658: step: 748/530, loss: 0.013678636401891708 2023-01-22 17:40:59.514609: step: 752/530, loss: 0.0148874931037426 2023-01-22 17:41:00.623980: step: 756/530, loss: 0.011193053796887398 2023-01-22 17:41:01.712145: step: 760/530, loss: 0.007567123509943485 2023-01-22 17:41:02.815578: step: 764/530, loss: 0.0033964584581553936 2023-01-22 17:41:03.887675: step: 768/530, loss: 0.013261942192912102 2023-01-22 17:41:04.987859: step: 772/530, loss: 0.00231935759074986 2023-01-22 17:41:06.079365: step: 776/530, loss: 0.00519409216940403 2023-01-22 17:41:07.189296: step: 780/530, loss: 0.007931515574455261 2023-01-22 17:41:08.282919: step: 784/530, loss: 0.005752062890678644 2023-01-22 17:41:09.358049: step: 788/530, loss: 0.0019751957152038813 2023-01-22 17:41:10.446802: step: 792/530, loss: 0.008055678568780422 2023-01-22 17:41:11.538215: step: 796/530, loss: 0.008411243557929993 2023-01-22 17:41:12.652673: step: 800/530, loss: 0.003742727916687727 2023-01-22 17:41:13.726945: step: 804/530, loss: 0.004822937306016684 2023-01-22 17:41:14.794116: step: 808/530, loss: 0.0022399635054171085 2023-01-22 17:41:15.895149: step: 812/530, loss: 0.019668443128466606 2023-01-22 17:41:16.967855: step: 816/530, loss: 0.0051964991725981236 2023-01-22 17:41:18.070993: step: 820/530, loss: 0.018342772498726845 2023-01-22 17:41:19.163315: step: 824/530, loss: 0.0077751497738063335 2023-01-22 17:41:20.266483: step: 828/530, loss: 0.006631223019212484 2023-01-22 17:41:21.345908: step: 832/530, loss: 0.0105736143887043 2023-01-22 17:41:22.437591: step: 836/530, loss: 0.0051844073459506035 2023-01-22 17:41:23.519264: step: 840/530, loss: 0.007381302770227194 2023-01-22 17:41:24.607342: step: 844/530, loss: 0.0031810072250664234 2023-01-22 17:41:25.688000: step: 848/530, loss: 0.008050918579101562 2023-01-22 17:41:26.785020: step: 852/530, loss: 0.013539256528019905 2023-01-22 17:41:27.862860: step: 856/530, loss: 0.013206942938268185 2023-01-22 17:41:28.953598: step: 860/530, loss: 0.0062510352581739426 2023-01-22 17:41:30.036190: step: 864/530, loss: 0.008488173596560955 2023-01-22 17:41:31.149245: step: 868/530, loss: 0.008705228567123413 2023-01-22 17:41:32.262377: step: 872/530, loss: 0.020819269120693207 2023-01-22 17:41:33.360466: step: 876/530, loss: 0.0020449236035346985 2023-01-22 17:41:34.444838: step: 880/530, loss: 0.014308874495327473 2023-01-22 17:41:35.531886: step: 884/530, loss: 0.0024342637043446302 2023-01-22 17:41:36.607471: step: 888/530, loss: 0.008903756737709045 2023-01-22 17:41:37.670829: step: 892/530, loss: 0.02250978909432888 2023-01-22 17:41:38.784867: step: 896/530, loss: 0.003295569447800517 2023-01-22 17:41:39.887803: step: 900/530, loss: 0.007382961921393871 2023-01-22 17:41:40.967686: step: 904/530, loss: 0.003065861063078046 2023-01-22 17:41:42.044686: step: 908/530, loss: 0.010868741199374199 2023-01-22 17:41:43.148636: step: 912/530, loss: 0.004745489917695522 2023-01-22 17:41:44.235260: step: 916/530, loss: 0.01935676485300064 2023-01-22 17:41:45.324384: step: 920/530, loss: 0.011972932144999504 2023-01-22 17:41:46.407211: step: 924/530, loss: 0.00022512185387313366 2023-01-22 17:41:47.504522: step: 928/530, loss: 0.010233130306005478 2023-01-22 17:41:48.574921: step: 932/530, loss: 0.0018110991222783923 2023-01-22 17:41:49.657818: step: 936/530, loss: 0.007435475941747427 2023-01-22 17:41:50.732672: step: 940/530, loss: 0.002791812876239419 2023-01-22 17:41:51.832892: step: 944/530, loss: 0.004688797052949667 2023-01-22 17:41:52.919570: step: 948/530, loss: 0.005692686419934034 2023-01-22 17:41:54.016171: step: 952/530, loss: 0.018047353252768517 2023-01-22 17:41:55.111268: step: 956/530, loss: 0.0005185452173464 2023-01-22 17:41:56.227265: step: 960/530, loss: 0.04479311406612396 2023-01-22 17:41:57.310687: step: 964/530, loss: 0.038241881877183914 2023-01-22 17:41:58.404782: step: 968/530, loss: 0.009267397224903107 2023-01-22 17:41:59.474495: step: 972/530, loss: 0.0055338190868496895 2023-01-22 17:42:00.546370: step: 976/530, loss: 0.003924527671188116 2023-01-22 17:42:01.636414: step: 980/530, loss: 0.004754830151796341 2023-01-22 17:42:02.727011: step: 984/530, loss: 0.03573412075638771 2023-01-22 17:42:03.811932: step: 988/530, loss: 0.008589028380811214 2023-01-22 17:42:04.883057: step: 992/530, loss: 0.006674485746771097 2023-01-22 17:42:05.968255: step: 996/530, loss: 0.0007309062057174742 2023-01-22 17:42:07.089501: step: 1000/530, loss: 0.013067721389234066 2023-01-22 17:42:08.170896: step: 1004/530, loss: 0.012321450747549534 2023-01-22 17:42:09.240438: step: 1008/530, loss: 0.011038108728826046 2023-01-22 17:42:10.318617: step: 1012/530, loss: 0.015308350324630737 2023-01-22 17:42:11.415063: step: 1016/530, loss: 0.00011961118434555829 2023-01-22 17:42:12.544930: step: 1020/530, loss: 0.006224613171070814 2023-01-22 17:42:13.642124: step: 1024/530, loss: 0.006144258659332991 2023-01-22 17:42:14.757332: step: 1028/530, loss: 0.004497601184993982 2023-01-22 17:42:15.841665: step: 1032/530, loss: 0.007542679086327553 2023-01-22 17:42:16.931385: step: 1036/530, loss: 0.0030587154906243086 2023-01-22 17:42:18.017172: step: 1040/530, loss: 0.00018483679741621017 2023-01-22 17:42:19.109144: step: 1044/530, loss: 0.007949182763695717 2023-01-22 17:42:20.212989: step: 1048/530, loss: 0.04049225151538849 2023-01-22 17:42:21.292878: step: 1052/530, loss: 0.035482801496982574 2023-01-22 17:42:22.384045: step: 1056/530, loss: 0.0017006665002554655 2023-01-22 17:42:23.473801: step: 1060/530, loss: 0.05259407311677933 2023-01-22 17:42:24.567235: step: 1064/530, loss: 0.010258263908326626 2023-01-22 17:42:25.673427: step: 1068/530, loss: 0.004466751124709845 2023-01-22 17:42:26.747643: step: 1072/530, loss: 0.01392581406980753 2023-01-22 17:42:27.825937: step: 1076/530, loss: 0.0017227617790922523 2023-01-22 17:42:28.932149: step: 1080/530, loss: 0.004666168242692947 2023-01-22 17:42:30.029973: step: 1084/530, loss: 0.010201828554272652 2023-01-22 17:42:31.120715: step: 1088/530, loss: 0.0020840181969106197 2023-01-22 17:42:32.186902: step: 1092/530, loss: 0.005235451273620129 2023-01-22 17:42:33.269592: step: 1096/530, loss: 0.013133256696164608 2023-01-22 17:42:34.362796: step: 1100/530, loss: 0.020084798336029053 2023-01-22 17:42:35.460250: step: 1104/530, loss: 0.009468114003539085 2023-01-22 17:42:36.563636: step: 1108/530, loss: 0.00959616620093584 2023-01-22 17:42:37.677945: step: 1112/530, loss: 0.007817719131708145 2023-01-22 17:42:38.771711: step: 1116/530, loss: 0.011656277813017368 2023-01-22 17:42:39.874985: step: 1120/530, loss: 0.03768749535083771 2023-01-22 17:42:40.973594: step: 1124/530, loss: 0.0026087763253599405 2023-01-22 17:42:42.075740: step: 1128/530, loss: 0.024585768580436707 2023-01-22 17:42:43.143669: step: 1132/530, loss: 0.010689685121178627 2023-01-22 17:42:44.250313: step: 1136/530, loss: 0.010371686890721321 2023-01-22 17:42:45.348691: step: 1140/530, loss: 0.011005585081875324 2023-01-22 17:42:46.433374: step: 1144/530, loss: 0.005857882089912891 2023-01-22 17:42:47.516165: step: 1148/530, loss: 0.004124849569052458 2023-01-22 17:42:48.617520: step: 1152/530, loss: 1.5140353752940428e-06 2023-01-22 17:42:49.704128: step: 1156/530, loss: 0.012998753227293491 2023-01-22 17:42:50.792760: step: 1160/530, loss: 0.003946313168853521 2023-01-22 17:42:51.900339: step: 1164/530, loss: 0.029805080965161324 2023-01-22 17:42:53.006125: step: 1168/530, loss: 0.006880226545035839 2023-01-22 17:42:54.113489: step: 1172/530, loss: 0.08833377063274384 2023-01-22 17:42:55.198485: step: 1176/530, loss: 0.004376439843326807 2023-01-22 17:42:56.294476: step: 1180/530, loss: 0.02380470745265484 2023-01-22 17:42:57.372396: step: 1184/530, loss: 0.012658650055527687 2023-01-22 17:42:58.471276: step: 1188/530, loss: 0.008989873342216015 2023-01-22 17:42:59.544066: step: 1192/530, loss: 0.0018720749067142606 2023-01-22 17:43:00.632558: step: 1196/530, loss: 0.004735585767775774 2023-01-22 17:43:01.731574: step: 1200/530, loss: 0.02861524559557438 2023-01-22 17:43:02.821154: step: 1204/530, loss: 0.006515833083540201 2023-01-22 17:43:03.895773: step: 1208/530, loss: 0.0020132747013121843 2023-01-22 17:43:04.994930: step: 1212/530, loss: 0.0008755850722081959 2023-01-22 17:43:06.081579: step: 1216/530, loss: 7.4505797087454084e-09 2023-01-22 17:43:07.157546: step: 1220/530, loss: 0.06438211351633072 2023-01-22 17:43:08.242417: step: 1224/530, loss: 0.04198005422949791 2023-01-22 17:43:09.313879: step: 1228/530, loss: 0.0 2023-01-22 17:43:10.406777: step: 1232/530, loss: 0.00632608262822032 2023-01-22 17:43:11.498876: step: 1236/530, loss: 0.02386266179382801 2023-01-22 17:43:12.574408: step: 1240/530, loss: 0.005555871408432722 2023-01-22 17:43:13.672460: step: 1244/530, loss: 0.014315348118543625 2023-01-22 17:43:14.750552: step: 1248/530, loss: 0.02399740181863308 2023-01-22 17:43:15.838662: step: 1252/530, loss: 0.003911165986210108 2023-01-22 17:43:16.957893: step: 1256/530, loss: 0.00886138528585434 2023-01-22 17:43:18.042403: step: 1260/530, loss: 0.011854602955281734 2023-01-22 17:43:19.129982: step: 1264/530, loss: 0.02003047801554203 2023-01-22 17:43:20.226101: step: 1268/530, loss: 0.0033985127229243517 2023-01-22 17:43:21.316506: step: 1272/530, loss: 0.027946490794420242 2023-01-22 17:43:22.405215: step: 1276/530, loss: 0.0068738083355128765 2023-01-22 17:43:23.487229: step: 1280/530, loss: 0.004011850338429213 2023-01-22 17:43:24.589421: step: 1284/530, loss: 0.02610250562429428 2023-01-22 17:43:25.692179: step: 1288/530, loss: 0.01805303804576397 2023-01-22 17:43:26.763289: step: 1292/530, loss: 0.009144733659923077 2023-01-22 17:43:27.863783: step: 1296/530, loss: 0.004507117904722691 2023-01-22 17:43:28.992326: step: 1300/530, loss: 0.03221559897065163 2023-01-22 17:43:30.068574: step: 1304/530, loss: 0.0018386135343462229 2023-01-22 17:43:31.136887: step: 1308/530, loss: 0.006673126481473446 2023-01-22 17:43:32.231794: step: 1312/530, loss: 0.009045238606631756 2023-01-22 17:43:33.321812: step: 1316/530, loss: 0.0011634668335318565 2023-01-22 17:43:34.412899: step: 1320/530, loss: 0.004658046644181013 2023-01-22 17:43:35.503519: step: 1324/530, loss: 0.0025051843840628862 2023-01-22 17:43:36.593481: step: 1328/530, loss: 0.002556690014898777 2023-01-22 17:43:37.676260: step: 1332/530, loss: 0.0105762779712677 2023-01-22 17:43:38.767738: step: 1336/530, loss: 0.03093128465116024 2023-01-22 17:43:39.850456: step: 1340/530, loss: 0.006454716436564922 2023-01-22 17:43:40.930259: step: 1344/530, loss: 0.0022223638370633125 2023-01-22 17:43:42.039576: step: 1348/530, loss: 0.014794566668570042 2023-01-22 17:43:43.125579: step: 1352/530, loss: 0.006150797475129366 2023-01-22 17:43:44.212409: step: 1356/530, loss: 0.047473419457674026 2023-01-22 17:43:45.328496: step: 1360/530, loss: 0.009126752614974976 2023-01-22 17:43:46.430403: step: 1364/530, loss: 0.005281102377921343 2023-01-22 17:43:47.518627: step: 1368/530, loss: 0.03255490958690643 2023-01-22 17:43:48.635341: step: 1372/530, loss: 0.004429229535162449 2023-01-22 17:43:49.744941: step: 1376/530, loss: 0.030390240252017975 2023-01-22 17:43:50.847870: step: 1380/530, loss: 0.011396808549761772 2023-01-22 17:43:51.936645: step: 1384/530, loss: 0.02816726453602314 2023-01-22 17:43:53.036342: step: 1388/530, loss: 0.010108868591487408 2023-01-22 17:43:54.120869: step: 1392/530, loss: 0.0 2023-01-22 17:43:55.218093: step: 1396/530, loss: 0.0062020099721848965 2023-01-22 17:43:56.314473: step: 1400/530, loss: 0.03659898787736893 2023-01-22 17:43:57.386249: step: 1404/530, loss: 0.024742981418967247 2023-01-22 17:43:58.474158: step: 1408/530, loss: 0.0029463020619004965 2023-01-22 17:43:59.599093: step: 1412/530, loss: 0.055403999984264374 2023-01-22 17:44:00.705248: step: 1416/530, loss: 0.014414084143936634 2023-01-22 17:44:01.777099: step: 1420/530, loss: 4.377431469038129e-05 2023-01-22 17:44:02.875097: step: 1424/530, loss: 0.00045292737195268273 2023-01-22 17:44:03.947147: step: 1428/530, loss: 0.0013491526478901505 2023-01-22 17:44:05.040918: step: 1432/530, loss: 0.01840001344680786 2023-01-22 17:44:06.162026: step: 1436/530, loss: 0.009388620965182781 2023-01-22 17:44:07.244299: step: 1440/530, loss: 0.001821655547246337 2023-01-22 17:44:08.334543: step: 1444/530, loss: 0.008030835539102554 2023-01-22 17:44:09.426137: step: 1448/530, loss: 0.003816197859123349 2023-01-22 17:44:10.522941: step: 1452/530, loss: 0.009518238715827465 2023-01-22 17:44:11.585532: step: 1456/530, loss: 0.0078024608083069324 2023-01-22 17:44:12.665965: step: 1460/530, loss: 0.005686014890670776 2023-01-22 17:44:13.767024: step: 1464/530, loss: 0.008159623481333256 2023-01-22 17:44:14.862997: step: 1468/530, loss: 0.005434315651655197 2023-01-22 17:44:15.943174: step: 1472/530, loss: 0.00561576196923852 2023-01-22 17:44:17.033487: step: 1476/530, loss: 0.0095906313508749 2023-01-22 17:44:18.135884: step: 1480/530, loss: 0.017152147367596626 2023-01-22 17:44:19.208718: step: 1484/530, loss: 0.004590487573295832 2023-01-22 17:44:20.307955: step: 1488/530, loss: 0.0005239572492428124 2023-01-22 17:44:21.386753: step: 1492/530, loss: 0.004447967745363712 2023-01-22 17:44:22.473214: step: 1496/530, loss: 0.015526765026152134 2023-01-22 17:44:23.572526: step: 1500/530, loss: 0.051587581634521484 2023-01-22 17:44:24.659695: step: 1504/530, loss: 0.006166251376271248 2023-01-22 17:44:25.744617: step: 1508/530, loss: 0.005185808055102825 2023-01-22 17:44:26.852612: step: 1512/530, loss: 0.018353205174207687 2023-01-22 17:44:27.953816: step: 1516/530, loss: 0.029015248641371727 2023-01-22 17:44:29.025249: step: 1520/530, loss: 0.004135618451982737 2023-01-22 17:44:30.102151: step: 1524/530, loss: 0.0033073234371840954 2023-01-22 17:44:31.197604: step: 1528/530, loss: 0.002053049160167575 2023-01-22 17:44:32.294197: step: 1532/530, loss: 0.0036400973331183195 2023-01-22 17:44:33.393796: step: 1536/530, loss: 0.003317296039313078 2023-01-22 17:44:34.503417: step: 1540/530, loss: 0.004234801512211561 2023-01-22 17:44:35.586580: step: 1544/530, loss: 0.017313288524746895 2023-01-22 17:44:36.669766: step: 1548/530, loss: 0.012317666783928871 2023-01-22 17:44:37.767077: step: 1552/530, loss: 0.005927101708948612 2023-01-22 17:44:38.876524: step: 1556/530, loss: 0.0037845014594495296 2023-01-22 17:44:39.980015: step: 1560/530, loss: 0.008884548209607601 2023-01-22 17:44:41.075430: step: 1564/530, loss: 0.022238239645957947 2023-01-22 17:44:42.182850: step: 1568/530, loss: 0.012891136109828949 2023-01-22 17:44:43.268459: step: 1572/530, loss: 0.030476849526166916 2023-01-22 17:44:44.381714: step: 1576/530, loss: 0.0029098056256771088 2023-01-22 17:44:45.489920: step: 1580/530, loss: 0.01052937377244234 2023-01-22 17:44:46.593807: step: 1584/530, loss: 0.04979405179619789 2023-01-22 17:44:47.705239: step: 1588/530, loss: 0.0023765319492667913 2023-01-22 17:44:48.796612: step: 1592/530, loss: 0.004143412224948406 2023-01-22 17:44:49.890574: step: 1596/530, loss: 0.006798804271966219 2023-01-22 17:44:50.985938: step: 1600/530, loss: 0.009213268756866455 2023-01-22 17:44:52.073537: step: 1604/530, loss: 0.0126715749502182 2023-01-22 17:44:53.173986: step: 1608/530, loss: 0.05339021980762482 2023-01-22 17:44:54.265429: step: 1612/530, loss: 0.011374258436262608 2023-01-22 17:44:55.353324: step: 1616/530, loss: 0.005303275305777788 2023-01-22 17:44:56.452166: step: 1620/530, loss: 0.008439534343779087 2023-01-22 17:44:57.529830: step: 1624/530, loss: 0.003532485105097294 2023-01-22 17:44:58.606002: step: 1628/530, loss: 0.007714767009019852 2023-01-22 17:44:59.693297: step: 1632/530, loss: 0.005036373157054186 2023-01-22 17:45:00.798310: step: 1636/530, loss: 0.010950824245810509 2023-01-22 17:45:01.898523: step: 1640/530, loss: 0.0017168091144412756 2023-01-22 17:45:02.962775: step: 1644/530, loss: 0.019485170021653175 2023-01-22 17:45:04.050440: step: 1648/530, loss: 0.009485960006713867 2023-01-22 17:45:05.128309: step: 1652/530, loss: 0.005088926292955875 2023-01-22 17:45:06.215586: step: 1656/530, loss: 0.031124968081712723 2023-01-22 17:45:07.304385: step: 1660/530, loss: 0.028705941513180733 2023-01-22 17:45:08.394805: step: 1664/530, loss: 0.00893686804920435 2023-01-22 17:45:09.461549: step: 1668/530, loss: 0.002964981598779559 2023-01-22 17:45:10.542193: step: 1672/530, loss: 0.0036536783445626497 2023-01-22 17:45:11.631128: step: 1676/530, loss: 0.005702549125999212 2023-01-22 17:45:12.698766: step: 1680/530, loss: 0.012292525731027126 2023-01-22 17:45:13.805005: step: 1684/530, loss: 0.004351802170276642 2023-01-22 17:45:14.904607: step: 1688/530, loss: 0.006031625904142857 2023-01-22 17:45:15.985518: step: 1692/530, loss: 0.006322294473648071 2023-01-22 17:45:17.083357: step: 1696/530, loss: 0.007334110792726278 2023-01-22 17:45:18.191564: step: 1700/530, loss: 0.008161856792867184 2023-01-22 17:45:19.298801: step: 1704/530, loss: 0.01021916326135397 2023-01-22 17:45:20.396806: step: 1708/530, loss: 0.0014939174288883805 2023-01-22 17:45:21.473785: step: 1712/530, loss: 0.002128892345353961 2023-01-22 17:45:22.571215: step: 1716/530, loss: 0.01101960614323616 2023-01-22 17:45:23.660523: step: 1720/530, loss: 0.025418000295758247 2023-01-22 17:45:24.762899: step: 1724/530, loss: 0.013953392393887043 2023-01-22 17:45:25.860237: step: 1728/530, loss: 0.005516911391168833 2023-01-22 17:45:26.942668: step: 1732/530, loss: 0.005705171264708042 2023-01-22 17:45:28.025749: step: 1736/530, loss: 0.006698850076645613 2023-01-22 17:45:29.155157: step: 1740/530, loss: 0.0030481084249913692 2023-01-22 17:45:30.249538: step: 1744/530, loss: 0.014505933038890362 2023-01-22 17:45:31.323745: step: 1748/530, loss: 0.039191834628582 2023-01-22 17:45:32.413897: step: 1752/530, loss: 0.022778907790780067 2023-01-22 17:45:33.517885: step: 1756/530, loss: 0.00712298508733511 2023-01-22 17:45:34.600726: step: 1760/530, loss: 0.010292649269104004 2023-01-22 17:45:35.677479: step: 1764/530, loss: 0.004079221282154322 2023-01-22 17:45:36.772482: step: 1768/530, loss: 0.01893676444888115 2023-01-22 17:45:37.867047: step: 1772/530, loss: 0.0 2023-01-22 17:45:38.943788: step: 1776/530, loss: 0.005525399465113878 2023-01-22 17:45:40.049220: step: 1780/530, loss: 0.007351726293563843 2023-01-22 17:45:41.136992: step: 1784/530, loss: 0.0016253157518804073 2023-01-22 17:45:42.223786: step: 1788/530, loss: 0.004539277404546738 2023-01-22 17:45:43.348164: step: 1792/530, loss: 0.01693624258041382 2023-01-22 17:45:44.427994: step: 1796/530, loss: 0.0058190119452774525 2023-01-22 17:45:45.507778: step: 1800/530, loss: 0.009923038072884083 2023-01-22 17:45:46.588493: step: 1804/530, loss: 0.03290071710944176 2023-01-22 17:45:47.672068: step: 1808/530, loss: 0.003919346258044243 2023-01-22 17:45:48.753969: step: 1812/530, loss: 0.005124642513692379 2023-01-22 17:45:49.837929: step: 1816/530, loss: 0.0020729973912239075 2023-01-22 17:45:50.928896: step: 1820/530, loss: 0.005176374223083258 2023-01-22 17:45:52.015901: step: 1824/530, loss: 0.003863455494865775 2023-01-22 17:45:53.127482: step: 1828/530, loss: 0.0201641246676445 2023-01-22 17:45:54.247895: step: 1832/530, loss: 0.03788105025887489 2023-01-22 17:45:55.332507: step: 1836/530, loss: 0.0016798643628135324 2023-01-22 17:45:56.441280: step: 1840/530, loss: 0.016978899016976357 2023-01-22 17:45:57.556532: step: 1844/530, loss: 0.01821254752576351 2023-01-22 17:45:58.629012: step: 1848/530, loss: 0.0035666811745613813 2023-01-22 17:45:59.748740: step: 1852/530, loss: 0.1473417729139328 2023-01-22 17:46:00.830964: step: 1856/530, loss: 0.022895826026797295 2023-01-22 17:46:01.914725: step: 1860/530, loss: 0.004063081461936235 2023-01-22 17:46:02.986831: step: 1864/530, loss: 0.039851684123277664 2023-01-22 17:46:04.063882: step: 1868/530, loss: 0.013828875496983528 2023-01-22 17:46:05.140986: step: 1872/530, loss: 0.0001568260049680248 2023-01-22 17:46:06.221031: step: 1876/530, loss: 0.0032759520690888166 2023-01-22 17:46:07.322496: step: 1880/530, loss: 0.001493890886195004 2023-01-22 17:46:08.405982: step: 1884/530, loss: 0.0003120404726359993 2023-01-22 17:46:09.482997: step: 1888/530, loss: 0.00673631951212883 2023-01-22 17:46:10.595424: step: 1892/530, loss: 0.010273081250488758 2023-01-22 17:46:11.679977: step: 1896/530, loss: 0.0015573864802718163 2023-01-22 17:46:12.792332: step: 1900/530, loss: 0.010385089553892612 2023-01-22 17:46:13.871152: step: 1904/530, loss: 0.002454180736094713 2023-01-22 17:46:14.947204: step: 1908/530, loss: 0.002259141532704234 2023-01-22 17:46:16.027445: step: 1912/530, loss: 0.009372632019221783 2023-01-22 17:46:17.127896: step: 1916/530, loss: 0.01044060941785574 2023-01-22 17:46:18.220350: step: 1920/530, loss: 0.009234768338501453 2023-01-22 17:46:19.305510: step: 1924/530, loss: 0.0029348856769502163 2023-01-22 17:46:20.400055: step: 1928/530, loss: 0.0034264831338077784 2023-01-22 17:46:21.478460: step: 1932/530, loss: 0.018970796838402748 2023-01-22 17:46:22.567810: step: 1936/530, loss: 0.005571961402893066 2023-01-22 17:46:23.658105: step: 1940/530, loss: 0.002216230146586895 2023-01-22 17:46:24.775937: step: 1944/530, loss: 0.01605202630162239 2023-01-22 17:46:25.850903: step: 1948/530, loss: 0.005035205744206905 2023-01-22 17:46:26.932428: step: 1952/530, loss: 0.005195165518671274 2023-01-22 17:46:28.027427: step: 1956/530, loss: 0.004524275194853544 2023-01-22 17:46:29.123265: step: 1960/530, loss: 0.003987927455455065 2023-01-22 17:46:30.217540: step: 1964/530, loss: 0.010138333775103092 2023-01-22 17:46:31.301017: step: 1968/530, loss: 0.01195729710161686 2023-01-22 17:46:32.403733: step: 1972/530, loss: 0.03733308985829353 2023-01-22 17:46:33.507618: step: 1976/530, loss: 0.01076783612370491 2023-01-22 17:46:34.615727: step: 1980/530, loss: 0.020792188122868538 2023-01-22 17:46:35.700688: step: 1984/530, loss: 0.0 2023-01-22 17:46:36.830192: step: 1988/530, loss: 0.004448098596185446 2023-01-22 17:46:37.934122: step: 1992/530, loss: 0.007634727284312248 2023-01-22 17:46:39.022254: step: 1996/530, loss: 0.003218783298507333 2023-01-22 17:46:40.112491: step: 2000/530, loss: 0.0037025760393589735 2023-01-22 17:46:41.211799: step: 2004/530, loss: 0.005660674534738064 2023-01-22 17:46:42.274099: step: 2008/530, loss: 0.03520983085036278 2023-01-22 17:46:43.373565: step: 2012/530, loss: 0.012717806734144688 2023-01-22 17:46:44.479805: step: 2016/530, loss: 0.005978054832667112 2023-01-22 17:46:45.576087: step: 2020/530, loss: 0.004329439718276262 2023-01-22 17:46:46.667946: step: 2024/530, loss: 0.014939241111278534 2023-01-22 17:46:47.742112: step: 2028/530, loss: 0.027365699410438538 2023-01-22 17:46:48.832615: step: 2032/530, loss: 0.0020701545290648937 2023-01-22 17:46:49.922460: step: 2036/530, loss: 0.02141907624900341 2023-01-22 17:46:51.007125: step: 2040/530, loss: 0.011363283731043339 2023-01-22 17:46:52.092407: step: 2044/530, loss: 0.007223441265523434 2023-01-22 17:46:53.192344: step: 2048/530, loss: 0.012013864703476429 2023-01-22 17:46:54.288627: step: 2052/530, loss: 0.0017661800375208259 2023-01-22 17:46:55.360023: step: 2056/530, loss: 0.012152872048318386 2023-01-22 17:46:56.460877: step: 2060/530, loss: 0.004492082633078098 2023-01-22 17:46:57.546160: step: 2064/530, loss: 0.011100994423031807 2023-01-22 17:46:58.628530: step: 2068/530, loss: 0.01058836281299591 2023-01-22 17:46:59.722296: step: 2072/530, loss: 0.004957281518727541 2023-01-22 17:47:00.791285: step: 2076/530, loss: 0.0019252515630796552 2023-01-22 17:47:01.868389: step: 2080/530, loss: 0.01359036099165678 2023-01-22 17:47:02.961895: step: 2084/530, loss: 0.003083687974140048 2023-01-22 17:47:04.054671: step: 2088/530, loss: 0.013326723128557205 2023-01-22 17:47:05.153795: step: 2092/530, loss: 0.004173072054982185 2023-01-22 17:47:06.263511: step: 2096/530, loss: 0.055387236177921295 2023-01-22 17:47:07.354738: step: 2100/530, loss: 0.0202984306961298 2023-01-22 17:47:08.432550: step: 2104/530, loss: 0.0010682246647775173 2023-01-22 17:47:09.531214: step: 2108/530, loss: 0.02901669405400753 2023-01-22 17:47:10.635782: step: 2112/530, loss: 0.006395253352820873 2023-01-22 17:47:11.709264: step: 2116/530, loss: 0.0033668573014438152 2023-01-22 17:47:12.808533: step: 2120/530, loss: 0.010745705105364323 ================================================== Loss: 0.011 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34946305457735094, 'r': 0.3474737013254875, 'f1': 0.3484655387222301}, 'combined': 0.25676408116374844, 'stategy': 1, 'epoch': 3} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3180010973724229, 'r': 0.2903214766317966, 'f1': 0.3035315541620955}, 'combined': 0.1885090704796172, 'stategy': 1, 'epoch': 3} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34039493836931506, 'r': 0.331352188583413, 'f1': 0.33581269881434356}, 'combined': 0.24744093596846367, 'stategy': 1, 'epoch': 3} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3460110194391069, 'r': 0.2995574176190491, 'f1': 0.3211128720085679}, 'combined': 0.19942799419479482, 'stategy': 1, 'epoch': 3} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3870967741935484, 'r': 0.5217391304347826, 'f1': 0.4444444444444444}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 3} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 3} New best chinese model... New best korean model... New best russian model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34946305457735094, 'r': 0.3474737013254875, 'f1': 0.3484655387222301}, 'combined': 0.25676408116374844, 'stategy': 1, 'epoch': 3} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3180010973724229, 'r': 0.2903214766317966, 'f1': 0.3035315541620955}, 'combined': 0.1885090704796172, 'stategy': 1, 'epoch': 3} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3870967741935484, 'r': 0.5217391304347826, 'f1': 0.4444444444444444}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 3} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34039493836931506, 'r': 0.331352188583413, 'f1': 0.33581269881434356}, 'combined': 0.24744093596846367, 'stategy': 1, 'epoch': 3} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3460110194391069, 'r': 0.2995574176190491, 'f1': 0.3211128720085679}, 'combined': 0.19942799419479482, 'stategy': 1, 'epoch': 3} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 3} ****************************** Epoch: 4 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 17:50:04.615489: step: 4/530, loss: 0.09927669167518616 2023-01-22 17:50:05.717431: step: 8/530, loss: 0.005641601979732513 2023-01-22 17:50:06.787677: step: 12/530, loss: 0.0013777896529063582 2023-01-22 17:50:07.863020: step: 16/530, loss: 0.00665803300216794 2023-01-22 17:50:08.951437: step: 20/530, loss: 0.006408526562154293 2023-01-22 17:50:10.035312: step: 24/530, loss: 0.00570447975769639 2023-01-22 17:50:11.130842: step: 28/530, loss: 0.008242086507380009 2023-01-22 17:50:12.210678: step: 32/530, loss: 0.013434949330985546 2023-01-22 17:50:13.298566: step: 36/530, loss: 0.007572309114038944 2023-01-22 17:50:14.386878: step: 40/530, loss: 0.006733869668096304 2023-01-22 17:50:15.494635: step: 44/530, loss: 0.011334957554936409 2023-01-22 17:50:16.592578: step: 48/530, loss: 0.0306736771017313 2023-01-22 17:50:17.693749: step: 52/530, loss: 0.004868673160672188 2023-01-22 17:50:18.791003: step: 56/530, loss: 0.0037384810857474804 2023-01-22 17:50:19.902464: step: 60/530, loss: 0.01926356367766857 2023-01-22 17:50:20.996137: step: 64/530, loss: 0.025363925844430923 2023-01-22 17:50:22.083273: step: 68/530, loss: 0.004237812478095293 2023-01-22 17:50:23.168513: step: 72/530, loss: 0.0004058255290146917 2023-01-22 17:50:24.256170: step: 76/530, loss: 0.017811616882681847 2023-01-22 17:50:25.351016: step: 80/530, loss: 0.004367070738226175 2023-01-22 17:50:26.452481: step: 84/530, loss: 0.031310077756643295 2023-01-22 17:50:27.562976: step: 88/530, loss: 0.003796903882175684 2023-01-22 17:50:28.637661: step: 92/530, loss: 0.0005739496555179358 2023-01-22 17:50:29.717128: step: 96/530, loss: 0.004304783884435892 2023-01-22 17:50:30.806748: step: 100/530, loss: 0.004899375140666962 2023-01-22 17:50:31.917687: step: 104/530, loss: 0.008823595941066742 2023-01-22 17:50:33.006054: step: 108/530, loss: 0.0031449312809854746 2023-01-22 17:50:34.107826: step: 112/530, loss: 0.02087133377790451 2023-01-22 17:50:35.197291: step: 116/530, loss: 0.0010118724312633276 2023-01-22 17:50:36.301832: step: 120/530, loss: 0.030991574749350548 2023-01-22 17:50:37.386988: step: 124/530, loss: 0.002826171461492777 2023-01-22 17:50:38.458041: step: 128/530, loss: 0.03895251825451851 2023-01-22 17:50:39.549716: step: 132/530, loss: 0.04373853653669357 2023-01-22 17:50:40.632341: step: 136/530, loss: 0.006357408128678799 2023-01-22 17:50:41.714208: step: 140/530, loss: 0.011653343215584755 2023-01-22 17:50:42.796070: step: 144/530, loss: 0.004880918189883232 2023-01-22 17:50:43.878541: step: 148/530, loss: 0.00032929336884990335 2023-01-22 17:50:44.961158: step: 152/530, loss: 0.0033075911924242973 2023-01-22 17:50:46.055096: step: 156/530, loss: 0.002118311822414398 2023-01-22 17:50:47.153261: step: 160/530, loss: 0.008454743772745132 2023-01-22 17:50:48.240818: step: 164/530, loss: 0.0018689573043957353 2023-01-22 17:50:49.348580: step: 168/530, loss: 0.0064310599118471146 2023-01-22 17:50:50.434221: step: 172/530, loss: 0.004264505580067635 2023-01-22 17:50:51.546880: step: 176/530, loss: 0.002996481489390135 2023-01-22 17:50:52.625065: step: 180/530, loss: 0.010713724419474602 2023-01-22 17:50:53.710408: step: 184/530, loss: 0.04462990537285805 2023-01-22 17:50:54.815169: step: 188/530, loss: 0.0010316789848729968 2023-01-22 17:50:55.922390: step: 192/530, loss: 0.007205520290881395 2023-01-22 17:50:57.004889: step: 196/530, loss: 0.017558736726641655 2023-01-22 17:50:58.096619: step: 200/530, loss: 0.005804868880659342 2023-01-22 17:50:59.180034: step: 204/530, loss: 0.004413038957864046 2023-01-22 17:51:00.271532: step: 208/530, loss: 0.00911199115216732 2023-01-22 17:51:01.362072: step: 212/530, loss: 0.0032672162633389235 2023-01-22 17:51:02.482522: step: 216/530, loss: 0.00288008782081306 2023-01-22 17:51:03.599667: step: 220/530, loss: 0.0027356515638530254 2023-01-22 17:51:04.695998: step: 224/530, loss: 0.01759803667664528 2023-01-22 17:51:05.793383: step: 228/530, loss: 0.014631424099206924 2023-01-22 17:51:06.884798: step: 232/530, loss: 0.001528739696368575 2023-01-22 17:51:08.001367: step: 236/530, loss: 0.021075492724776268 2023-01-22 17:51:09.103734: step: 240/530, loss: 0.014439521357417107 2023-01-22 17:51:10.193484: step: 244/530, loss: 0.005400847643613815 2023-01-22 17:51:11.283438: step: 248/530, loss: 0.0009490182274021208 2023-01-22 17:51:12.406439: step: 252/530, loss: 0.007926997728645802 2023-01-22 17:51:13.512299: step: 256/530, loss: 0.0022545952815562487 2023-01-22 17:51:14.610602: step: 260/530, loss: 0.0029541002586483955 2023-01-22 17:51:15.713033: step: 264/530, loss: 0.008275289088487625 2023-01-22 17:51:16.803205: step: 268/530, loss: 0.0017798682674765587 2023-01-22 17:51:17.896986: step: 272/530, loss: 0.00442288164049387 2023-01-22 17:51:18.991072: step: 276/530, loss: 0.04807819053530693 2023-01-22 17:51:20.099289: step: 280/530, loss: 0.0024885369930416346 2023-01-22 17:51:21.209595: step: 284/530, loss: 0.0008520008996129036 2023-01-22 17:51:22.305193: step: 288/530, loss: 0.013537491671741009 2023-01-22 17:51:23.394863: step: 292/530, loss: 0.0036641217302531004 2023-01-22 17:51:24.481980: step: 296/530, loss: 0.07835936546325684 2023-01-22 17:51:25.592854: step: 300/530, loss: 0.006127417553216219 2023-01-22 17:51:26.712685: step: 304/530, loss: 0.014236005954444408 2023-01-22 17:51:27.802263: step: 308/530, loss: 0.001819130266085267 2023-01-22 17:51:28.887043: step: 312/530, loss: 0.006281946785748005 2023-01-22 17:51:30.030061: step: 316/530, loss: 0.0028561612125486135 2023-01-22 17:51:31.152463: step: 320/530, loss: 0.06220261752605438 2023-01-22 17:51:32.241876: step: 324/530, loss: 0.018125133588910103 2023-01-22 17:51:33.327802: step: 328/530, loss: 0.014507114887237549 2023-01-22 17:51:34.436340: step: 332/530, loss: 0.006403418257832527 2023-01-22 17:51:35.552288: step: 336/530, loss: 0.0008241086034104228 2023-01-22 17:51:36.641668: step: 340/530, loss: 0.012522955425083637 2023-01-22 17:51:37.735339: step: 344/530, loss: 0.028947046026587486 2023-01-22 17:51:38.831932: step: 348/530, loss: 0.0012344359420239925 2023-01-22 17:51:39.919709: step: 352/530, loss: 0.008961455896496773 2023-01-22 17:51:41.013990: step: 356/530, loss: 0.005826309788972139 2023-01-22 17:51:42.131263: step: 360/530, loss: 0.0023722576443105936 2023-01-22 17:51:43.240708: step: 364/530, loss: 0.001849903492256999 2023-01-22 17:51:44.336799: step: 368/530, loss: 0.010201117023825645 2023-01-22 17:51:45.424799: step: 372/530, loss: 0.007875319570302963 2023-01-22 17:51:46.525531: step: 376/530, loss: 0.014172296971082687 2023-01-22 17:51:47.600545: step: 380/530, loss: 0.009425021708011627 2023-01-22 17:51:48.698780: step: 384/530, loss: 0.004893010947853327 2023-01-22 17:51:49.778433: step: 388/530, loss: 0.0035306529607623816 2023-01-22 17:51:50.856330: step: 392/530, loss: 0.00699588842689991 2023-01-22 17:51:51.966290: step: 396/530, loss: 0.026883775368332863 2023-01-22 17:51:53.044921: step: 400/530, loss: 0.0 2023-01-22 17:51:54.139047: step: 404/530, loss: 0.003555327421054244 2023-01-22 17:51:55.245328: step: 408/530, loss: 0.001621041912585497 2023-01-22 17:51:56.356860: step: 412/530, loss: 0.0054182508029043674 2023-01-22 17:51:57.439603: step: 416/530, loss: 0.013784663751721382 2023-01-22 17:51:58.521728: step: 420/530, loss: 0.04009197652339935 2023-01-22 17:51:59.616561: step: 424/530, loss: 0.007577024400234222 2023-01-22 17:52:00.705998: step: 428/530, loss: 0.006525625940412283 2023-01-22 17:52:01.801077: step: 432/530, loss: 0.018196502700448036 2023-01-22 17:52:02.894941: step: 436/530, loss: 0.0001607575686648488 2023-01-22 17:52:04.017908: step: 440/530, loss: 0.002720220945775509 2023-01-22 17:52:05.126217: step: 444/530, loss: 0.014555196277797222 2023-01-22 17:52:06.198883: step: 448/530, loss: 0.0005303258076310158 2023-01-22 17:52:07.291324: step: 452/530, loss: 0.005635303445160389 2023-01-22 17:52:08.386694: step: 456/530, loss: 0.0011091685155406594 2023-01-22 17:52:09.489390: step: 460/530, loss: 0.006827346049249172 2023-01-22 17:52:10.601280: step: 464/530, loss: 0.008032244630157948 2023-01-22 17:52:11.703606: step: 468/530, loss: 0.006095521152019501 2023-01-22 17:52:12.808850: step: 472/530, loss: 0.028219925239682198 2023-01-22 17:52:13.882583: step: 476/530, loss: 0.002821669215336442 2023-01-22 17:52:15.015215: step: 480/530, loss: 0.0032214473467320204 2023-01-22 17:52:16.124528: step: 484/530, loss: 0.0027135361451655626 2023-01-22 17:52:17.235042: step: 488/530, loss: 0.010229124687612057 2023-01-22 17:52:18.352137: step: 492/530, loss: 0.012760784476995468 2023-01-22 17:52:19.445166: step: 496/530, loss: 0.01200017798691988 2023-01-22 17:52:20.526240: step: 500/530, loss: 0.00775990542024374 2023-01-22 17:52:21.624127: step: 504/530, loss: 0.004292254336178303 2023-01-22 17:52:22.734236: step: 508/530, loss: 0.005923712160438299 2023-01-22 17:52:23.862188: step: 512/530, loss: 0.04941634461283684 2023-01-22 17:52:24.956030: step: 516/530, loss: 0.06716771423816681 2023-01-22 17:52:26.056987: step: 520/530, loss: 0.005379937589168549 2023-01-22 17:52:27.143547: step: 524/530, loss: 0.002120907884091139 2023-01-22 17:52:28.244297: step: 528/530, loss: 0.009625289589166641 2023-01-22 17:52:29.317439: step: 532/530, loss: 0.0009129293612204492 2023-01-22 17:52:30.415630: step: 536/530, loss: 0.010262400843203068 2023-01-22 17:52:31.517043: step: 540/530, loss: 0.007930413819849491 2023-01-22 17:52:32.602927: step: 544/530, loss: 0.004497353918850422 2023-01-22 17:52:33.698267: step: 548/530, loss: 0.004900988657027483 2023-01-22 17:52:34.795341: step: 552/530, loss: 0.002976667834445834 2023-01-22 17:52:35.888946: step: 556/530, loss: 0.005632808431982994 2023-01-22 17:52:36.974071: step: 560/530, loss: 0.004273197613656521 2023-01-22 17:52:38.080144: step: 564/530, loss: 0.005485229194164276 2023-01-22 17:52:39.192541: step: 568/530, loss: 0.005553442519158125 2023-01-22 17:52:40.291549: step: 572/530, loss: 0.006116292905062437 2023-01-22 17:52:41.386713: step: 576/530, loss: 0.019503524526953697 2023-01-22 17:52:42.485690: step: 580/530, loss: 0.0014874463668093085 2023-01-22 17:52:43.609446: step: 584/530, loss: 0.0029542213305830956 2023-01-22 17:52:44.685634: step: 588/530, loss: 0.008017477579414845 2023-01-22 17:52:45.777926: step: 592/530, loss: 0.01405017077922821 2023-01-22 17:52:46.858955: step: 596/530, loss: 0.009267565794289112 2023-01-22 17:52:47.950384: step: 600/530, loss: 0.005587130319327116 2023-01-22 17:52:49.047407: step: 604/530, loss: 0.005893026012927294 2023-01-22 17:52:50.127497: step: 608/530, loss: 0.05462037771940231 2023-01-22 17:52:51.196357: step: 612/530, loss: 0.014503302052617073 2023-01-22 17:52:52.284794: step: 616/530, loss: 0.0021572366822510958 2023-01-22 17:52:53.385719: step: 620/530, loss: 0.030603861436247826 2023-01-22 17:52:54.490484: step: 624/530, loss: 0.025606010109186172 2023-01-22 17:52:55.573515: step: 628/530, loss: 0.012202084064483643 2023-01-22 17:52:56.664007: step: 632/530, loss: 0.006320464424788952 2023-01-22 17:52:57.764578: step: 636/530, loss: 0.01756983809173107 2023-01-22 17:52:58.856331: step: 640/530, loss: 0.013302707113325596 2023-01-22 17:52:59.926400: step: 644/530, loss: 0.0051459018141031265 2023-01-22 17:53:01.025604: step: 648/530, loss: 0.018608955666422844 2023-01-22 17:53:02.153496: step: 652/530, loss: 0.051968496292829514 2023-01-22 17:53:03.254997: step: 656/530, loss: 0.002816385356709361 2023-01-22 17:53:04.332824: step: 660/530, loss: 0.0011777845211327076 2023-01-22 17:53:05.423616: step: 664/530, loss: 0.05226266756653786 2023-01-22 17:53:06.498030: step: 668/530, loss: 0.0022365900222212076 2023-01-22 17:53:07.560896: step: 672/530, loss: 0.0017457716166973114 2023-01-22 17:53:08.656063: step: 676/530, loss: 0.004118798766285181 2023-01-22 17:53:09.766267: step: 680/530, loss: 0.007175061386078596 2023-01-22 17:53:10.864743: step: 684/530, loss: 0.0065866210497915745 2023-01-22 17:53:11.957588: step: 688/530, loss: 0.0046526906080543995 2023-01-22 17:53:13.063105: step: 692/530, loss: 0.013096659444272518 2023-01-22 17:53:14.143756: step: 696/530, loss: 0.0021525996271520853 2023-01-22 17:53:15.240351: step: 700/530, loss: 0.010530092753469944 2023-01-22 17:53:16.325902: step: 704/530, loss: 0.01911844126880169 2023-01-22 17:53:17.400571: step: 708/530, loss: 0.005516392178833485 2023-01-22 17:53:18.521984: step: 712/530, loss: 0.0376371368765831 2023-01-22 17:53:19.595681: step: 716/530, loss: 0.008230074308812618 2023-01-22 17:53:20.679212: step: 720/530, loss: 0.0011314211878925562 2023-01-22 17:53:21.781766: step: 724/530, loss: 0.005857103504240513 2023-01-22 17:53:22.861483: step: 728/530, loss: 0.006830296479165554 2023-01-22 17:53:23.950566: step: 732/530, loss: 0.037676043808460236 2023-01-22 17:53:25.060369: step: 736/530, loss: 0.00492482166737318 2023-01-22 17:53:26.171177: step: 740/530, loss: 0.006314415019005537 2023-01-22 17:53:27.245284: step: 744/530, loss: 0.0011559833073988557 2023-01-22 17:53:28.332813: step: 748/530, loss: 0.019396888092160225 2023-01-22 17:53:29.403554: step: 752/530, loss: 0.0035427967086434364 2023-01-22 17:53:30.486963: step: 756/530, loss: 0.004653621930629015 2023-01-22 17:53:31.560662: step: 760/530, loss: 0.04286370053887367 2023-01-22 17:53:32.654176: step: 764/530, loss: 0.004473235923796892 2023-01-22 17:53:33.752817: step: 768/530, loss: 0.0014295750297605991 2023-01-22 17:53:34.852189: step: 772/530, loss: 0.009321562945842743 2023-01-22 17:53:35.942229: step: 776/530, loss: 0.001998191000893712 2023-01-22 17:53:37.030131: step: 780/530, loss: 0.010920494794845581 2023-01-22 17:53:38.134756: step: 784/530, loss: 0.005064839031547308 2023-01-22 17:53:39.183357: step: 788/530, loss: 0.0026471298187971115 2023-01-22 17:53:40.262373: step: 792/530, loss: 0.007634473033249378 2023-01-22 17:53:41.354321: step: 796/530, loss: 0.0054195537231862545 2023-01-22 17:53:42.432209: step: 800/530, loss: 2.5632723918533884e-05 2023-01-22 17:53:43.504336: step: 804/530, loss: 0.0015481067821383476 2023-01-22 17:53:44.582718: step: 808/530, loss: 0.0013678346294909716 2023-01-22 17:53:45.648222: step: 812/530, loss: 3.655743785202503e-05 2023-01-22 17:53:46.741530: step: 816/530, loss: 0.0007711700745858252 2023-01-22 17:53:47.852186: step: 820/530, loss: 0.002734269481152296 2023-01-22 17:53:48.956154: step: 824/530, loss: 0.007342600263655186 2023-01-22 17:53:50.040976: step: 828/530, loss: 0.008949954062700272 2023-01-22 17:53:51.122597: step: 832/530, loss: 0.01913045346736908 2023-01-22 17:53:52.208254: step: 836/530, loss: 0.0058847409673035145 2023-01-22 17:53:53.292617: step: 840/530, loss: 0.0016242398414760828 2023-01-22 17:53:54.389043: step: 844/530, loss: 0.0 2023-01-22 17:53:55.461438: step: 848/530, loss: 0.003999742213636637 2023-01-22 17:53:56.553651: step: 852/530, loss: 0.010109375230967999 2023-01-22 17:53:57.640756: step: 856/530, loss: 0.00460029998794198 2023-01-22 17:53:58.746489: step: 860/530, loss: 0.0004871089186053723 2023-01-22 17:53:59.868267: step: 864/530, loss: 0.009708979167044163 2023-01-22 17:54:00.968252: step: 868/530, loss: 0.018177898600697517 2023-01-22 17:54:02.041692: step: 872/530, loss: 0.014271182008087635 2023-01-22 17:54:03.113615: step: 876/530, loss: 0.016332503408193588 2023-01-22 17:54:04.191693: step: 880/530, loss: 0.028696853667497635 2023-01-22 17:54:05.267528: step: 884/530, loss: 0.0019225645810365677 2023-01-22 17:54:06.345397: step: 888/530, loss: 0.006583839189261198 2023-01-22 17:54:07.434474: step: 892/530, loss: 0.01813540793955326 2023-01-22 17:54:08.539262: step: 896/530, loss: 0.002659044461324811 2023-01-22 17:54:09.647118: step: 900/530, loss: 0.007973596453666687 2023-01-22 17:54:10.722445: step: 904/530, loss: 0.000344327709171921 2023-01-22 17:54:11.825350: step: 908/530, loss: 0.0005181411979719996 2023-01-22 17:54:12.933772: step: 912/530, loss: 0.006515146233141422 2023-01-22 17:54:14.040926: step: 916/530, loss: 0.04089716821908951 2023-01-22 17:54:15.128661: step: 920/530, loss: 0.012362835928797722 2023-01-22 17:54:16.197410: step: 924/530, loss: 0.0032248373609036207 2023-01-22 17:54:17.289748: step: 928/530, loss: 0.0052716550417244434 2023-01-22 17:54:18.400310: step: 932/530, loss: 0.008960737846791744 2023-01-22 17:54:19.486731: step: 936/530, loss: 0.007722099777311087 2023-01-22 17:54:20.575552: step: 940/530, loss: 0.005386774893850088 2023-01-22 17:54:21.626953: step: 944/530, loss: 0.02466478943824768 2023-01-22 17:54:22.728508: step: 948/530, loss: 0.000699700671248138 2023-01-22 17:54:23.799620: step: 952/530, loss: 0.010090579278767109 2023-01-22 17:54:24.894960: step: 956/530, loss: 0.032206565141677856 2023-01-22 17:54:25.979218: step: 960/530, loss: 0.004933027550578117 2023-01-22 17:54:27.058942: step: 964/530, loss: 0.005204321350902319 2023-01-22 17:54:28.143812: step: 968/530, loss: 0.007158435881137848 2023-01-22 17:54:29.233892: step: 972/530, loss: 0.0004781386232934892 2023-01-22 17:54:30.315142: step: 976/530, loss: 0.007539019919931889 2023-01-22 17:54:31.421617: step: 980/530, loss: 0.028663285076618195 2023-01-22 17:54:32.509953: step: 984/530, loss: 0.0062734270468354225 2023-01-22 17:54:33.595874: step: 988/530, loss: 0.003907158505171537 2023-01-22 17:54:34.675232: step: 992/530, loss: 0.009708663448691368 2023-01-22 17:54:35.746592: step: 996/530, loss: 0.0015299940714612603 2023-01-22 17:54:36.846850: step: 1000/530, loss: 0.027635866776108742 2023-01-22 17:54:37.943869: step: 1004/530, loss: 0.019229024648666382 2023-01-22 17:54:39.052614: step: 1008/530, loss: 0.0019254639046266675 2023-01-22 17:54:40.145552: step: 1012/530, loss: 0.006283264607191086 2023-01-22 17:54:41.238647: step: 1016/530, loss: 0.010211851447820663 2023-01-22 17:54:42.307726: step: 1020/530, loss: 0.02226889505982399 2023-01-22 17:54:43.416519: step: 1024/530, loss: 0.011547621339559555 2023-01-22 17:54:44.506649: step: 1028/530, loss: 0.028978381305933 2023-01-22 17:54:45.605576: step: 1032/530, loss: 0.009371335618197918 2023-01-22 17:54:46.678408: step: 1036/530, loss: 0.004516514949500561 2023-01-22 17:54:47.765200: step: 1040/530, loss: 0.004802541807293892 2023-01-22 17:54:48.856719: step: 1044/530, loss: 0.004046474117785692 2023-01-22 17:54:49.938627: step: 1048/530, loss: 0.01412553247064352 2023-01-22 17:54:51.035197: step: 1052/530, loss: 0.031771283596754074 2023-01-22 17:54:52.108471: step: 1056/530, loss: 0.016401346772909164 2023-01-22 17:54:53.195444: step: 1060/530, loss: 0.005149469245225191 2023-01-22 17:54:54.300329: step: 1064/530, loss: 0.0051411353051662445 2023-01-22 17:54:55.414852: step: 1068/530, loss: 0.006421458441764116 2023-01-22 17:54:56.522082: step: 1072/530, loss: 0.005479373969137669 2023-01-22 17:54:57.627124: step: 1076/530, loss: 0.01687074452638626 2023-01-22 17:54:58.703881: step: 1080/530, loss: 0.01837819442152977 2023-01-22 17:54:59.789885: step: 1084/530, loss: 0.006419012788683176 2023-01-22 17:55:00.900152: step: 1088/530, loss: 0.21443110704421997 2023-01-22 17:55:02.003997: step: 1092/530, loss: 0.00515205692499876 2023-01-22 17:55:03.078518: step: 1096/530, loss: 0.014464744366705418 2023-01-22 17:55:04.179025: step: 1100/530, loss: 0.010988007299602032 2023-01-22 17:55:05.268100: step: 1104/530, loss: 0.012415298260748386 2023-01-22 17:55:06.347738: step: 1108/530, loss: 0.006238764151930809 2023-01-22 17:55:07.451527: step: 1112/530, loss: 0.006947832182049751 2023-01-22 17:55:08.521749: step: 1116/530, loss: 0.03296361863613129 2023-01-22 17:55:09.640674: step: 1120/530, loss: 0.04336675629019737 2023-01-22 17:55:10.699567: step: 1124/530, loss: 0.005384029820561409 2023-01-22 17:55:11.820678: step: 1128/530, loss: 0.001848328742198646 2023-01-22 17:55:12.911854: step: 1132/530, loss: 0.005821629893034697 2023-01-22 17:55:14.002340: step: 1136/530, loss: 0.0011691212421283126 2023-01-22 17:55:15.084049: step: 1140/530, loss: 0.0023401067592203617 2023-01-22 17:55:16.172511: step: 1144/530, loss: 0.011342565529048443 2023-01-22 17:55:17.294151: step: 1148/530, loss: 0.03706418722867966 2023-01-22 17:55:18.370322: step: 1152/530, loss: 0.008639579638838768 2023-01-22 17:55:19.447116: step: 1156/530, loss: 0.00441003916785121 2023-01-22 17:55:20.529715: step: 1160/530, loss: 0.015135018154978752 2023-01-22 17:55:21.638649: step: 1164/530, loss: 0.003957340959459543 2023-01-22 17:55:22.704861: step: 1168/530, loss: 0.010271869599819183 2023-01-22 17:55:23.808561: step: 1172/530, loss: 0.007644107099622488 2023-01-22 17:55:24.891943: step: 1176/530, loss: 0.04006931558251381 2023-01-22 17:55:25.986186: step: 1180/530, loss: 0.02148464135825634 2023-01-22 17:55:27.064225: step: 1184/530, loss: 0.006408920977264643 2023-01-22 17:55:28.159797: step: 1188/530, loss: 0.00384511798620224 2023-01-22 17:55:29.267982: step: 1192/530, loss: 0.03347256779670715 2023-01-22 17:55:30.364612: step: 1196/530, loss: 0.005603414494544268 2023-01-22 17:55:31.453224: step: 1200/530, loss: 0.007562906481325626 2023-01-22 17:55:32.556537: step: 1204/530, loss: 0.0015090858796611428 2023-01-22 17:55:33.657002: step: 1208/530, loss: 0.017365990206599236 2023-01-22 17:55:34.755745: step: 1212/530, loss: 0.008800257928669453 2023-01-22 17:55:35.842305: step: 1216/530, loss: 0.005413127597421408 2023-01-22 17:55:36.946160: step: 1220/530, loss: 0.0047996509820222855 2023-01-22 17:55:38.021235: step: 1224/530, loss: 0.022756759077310562 2023-01-22 17:55:39.091093: step: 1228/530, loss: 0.006855475716292858 2023-01-22 17:55:40.155833: step: 1232/530, loss: 0.020436810329556465 2023-01-22 17:55:41.242676: step: 1236/530, loss: 0.04669833183288574 2023-01-22 17:55:42.342259: step: 1240/530, loss: 0.011487391777336597 2023-01-22 17:55:43.446927: step: 1244/530, loss: 0.01739269308745861 2023-01-22 17:55:44.517256: step: 1248/530, loss: 0.031075118109583855 2023-01-22 17:55:45.596678: step: 1252/530, loss: 0.010184599086642265 2023-01-22 17:55:46.686476: step: 1256/530, loss: 0.007033254485577345 2023-01-22 17:55:47.783429: step: 1260/530, loss: 0.005699960980564356 2023-01-22 17:55:48.878265: step: 1264/530, loss: 0.007377345114946365 2023-01-22 17:55:49.988839: step: 1268/530, loss: 0.01987394690513611 2023-01-22 17:55:51.085627: step: 1272/530, loss: 0.0006842540460638702 2023-01-22 17:55:52.169830: step: 1276/530, loss: 0.07761415094137192 2023-01-22 17:55:53.257332: step: 1280/530, loss: 0.0015428510960191488 2023-01-22 17:55:54.348565: step: 1284/530, loss: 0.002973944880068302 2023-01-22 17:55:55.476970: step: 1288/530, loss: 0.015504645183682442 2023-01-22 17:55:56.593780: step: 1292/530, loss: 0.0063639418222010136 2023-01-22 17:55:57.686316: step: 1296/530, loss: 0.008862471207976341 2023-01-22 17:55:58.798220: step: 1300/530, loss: 0.0045169140212237835 2023-01-22 17:55:59.882332: step: 1304/530, loss: 0.004776623100042343 2023-01-22 17:56:00.970247: step: 1308/530, loss: 0.006416270975023508 2023-01-22 17:56:02.065291: step: 1312/530, loss: 0.027517270296812057 2023-01-22 17:56:03.192720: step: 1316/530, loss: 0.013181486167013645 2023-01-22 17:56:04.266253: step: 1320/530, loss: 0.012903379276394844 2023-01-22 17:56:05.354580: step: 1324/530, loss: 0.0036061087157577276 2023-01-22 17:56:06.427488: step: 1328/530, loss: 0.012627535499632359 2023-01-22 17:56:07.526869: step: 1332/530, loss: 0.00782503467053175 2023-01-22 17:56:08.605176: step: 1336/530, loss: 0.020762721076607704 2023-01-22 17:56:09.695357: step: 1340/530, loss: 0.03078097105026245 2023-01-22 17:56:10.771929: step: 1344/530, loss: 0.01978605054318905 2023-01-22 17:56:11.885859: step: 1348/530, loss: 0.024528084322810173 2023-01-22 17:56:12.978354: step: 1352/530, loss: 0.0026921741664409637 2023-01-22 17:56:14.041080: step: 1356/530, loss: 0.008660894818603992 2023-01-22 17:56:15.125777: step: 1360/530, loss: 0.009936562739312649 2023-01-22 17:56:16.206603: step: 1364/530, loss: 0.009195527993142605 2023-01-22 17:56:17.312580: step: 1368/530, loss: 0.005268219392746687 2023-01-22 17:56:18.391906: step: 1372/530, loss: 0.00024246703833341599 2023-01-22 17:56:19.467080: step: 1376/530, loss: 0.008973626419901848 2023-01-22 17:56:20.542820: step: 1380/530, loss: 0.0010981213999912143 2023-01-22 17:56:21.635432: step: 1384/530, loss: 0.0008329460397362709 2023-01-22 17:56:22.711106: step: 1388/530, loss: 0.013117737136781216 2023-01-22 17:56:23.792107: step: 1392/530, loss: 0.0015662973746657372 2023-01-22 17:56:24.908157: step: 1396/530, loss: 0.0262934397906065 2023-01-22 17:56:25.977343: step: 1400/530, loss: 0.0017349009867757559 2023-01-22 17:56:27.104190: step: 1404/530, loss: 0.043029069900512695 2023-01-22 17:56:28.200485: step: 1408/530, loss: 0.02065475657582283 2023-01-22 17:56:29.298588: step: 1412/530, loss: 0.010066530667245388 2023-01-22 17:56:30.397315: step: 1416/530, loss: 0.0075648087076842785 2023-01-22 17:56:31.466840: step: 1420/530, loss: 0.006466331426054239 2023-01-22 17:56:32.561336: step: 1424/530, loss: 0.010740979574620724 2023-01-22 17:56:33.660188: step: 1428/530, loss: 0.008851229213178158 2023-01-22 17:56:34.743845: step: 1432/530, loss: 0.004348272457718849 2023-01-22 17:56:35.864599: step: 1436/530, loss: 0.009712323546409607 2023-01-22 17:56:36.942434: step: 1440/530, loss: 0.00931523647159338 2023-01-22 17:56:38.029661: step: 1444/530, loss: 0.008745982311666012 2023-01-22 17:56:39.110651: step: 1448/530, loss: 0.004645561799407005 2023-01-22 17:56:40.177604: step: 1452/530, loss: 0.006835793145000935 2023-01-22 17:56:41.283182: step: 1456/530, loss: 0.005716282874345779 2023-01-22 17:56:42.396769: step: 1460/530, loss: 0.002697772579267621 2023-01-22 17:56:43.491283: step: 1464/530, loss: 0.017428727820515633 2023-01-22 17:56:44.607468: step: 1468/530, loss: 0.00808794517070055 2023-01-22 17:56:45.715938: step: 1472/530, loss: 0.004085040185600519 2023-01-22 17:56:46.812162: step: 1476/530, loss: 0.007563811726868153 2023-01-22 17:56:47.882247: step: 1480/530, loss: 0.015021136961877346 2023-01-22 17:56:48.963152: step: 1484/530, loss: 0.03507441654801369 2023-01-22 17:56:50.059277: step: 1488/530, loss: 0.022063041105866432 2023-01-22 17:56:51.158476: step: 1492/530, loss: 0.0016781722661107779 2023-01-22 17:56:52.244146: step: 1496/530, loss: 0.0037427227944135666 2023-01-22 17:56:53.330556: step: 1500/530, loss: 0.0059233796782791615 2023-01-22 17:56:54.408506: step: 1504/530, loss: 0.001936563989147544 2023-01-22 17:56:55.509036: step: 1508/530, loss: 0.005255910102277994 2023-01-22 17:56:56.604827: step: 1512/530, loss: 0.05116692930459976 2023-01-22 17:56:57.687876: step: 1516/530, loss: 0.002298779087141156 2023-01-22 17:56:58.774300: step: 1520/530, loss: 0.005176724400371313 2023-01-22 17:56:59.859133: step: 1524/530, loss: 0.00435676658526063 2023-01-22 17:57:00.948616: step: 1528/530, loss: 0.00561439897865057 2023-01-22 17:57:02.050985: step: 1532/530, loss: 0.027845002710819244 2023-01-22 17:57:03.138078: step: 1536/530, loss: 0.01168154552578926 2023-01-22 17:57:04.228990: step: 1540/530, loss: 0.0070859710685908794 2023-01-22 17:57:05.327704: step: 1544/530, loss: 0.008946003392338753 2023-01-22 17:57:06.376357: step: 1548/530, loss: 0.016834719106554985 2023-01-22 17:57:07.451039: step: 1552/530, loss: 0.009201685898005962 2023-01-22 17:57:08.576177: step: 1556/530, loss: 0.0068786353804171085 2023-01-22 17:57:09.640572: step: 1560/530, loss: 0.0142699358984828 2023-01-22 17:57:10.736933: step: 1564/530, loss: 0.008466634899377823 2023-01-22 17:57:11.865637: step: 1568/530, loss: 0.0026678431313484907 2023-01-22 17:57:12.955170: step: 1572/530, loss: 0.0048872740007936954 2023-01-22 17:57:14.059965: step: 1576/530, loss: 0.008471204899251461 2023-01-22 17:57:15.153567: step: 1580/530, loss: 0.00534965842962265 2023-01-22 17:57:16.274330: step: 1584/530, loss: 0.025050774216651917 2023-01-22 17:57:17.360958: step: 1588/530, loss: 0.0031647684518247843 2023-01-22 17:57:18.444190: step: 1592/530, loss: 0.006447574123740196 2023-01-22 17:57:19.535735: step: 1596/530, loss: 0.019744012504816055 2023-01-22 17:57:20.630171: step: 1600/530, loss: 0.012958145700395107 2023-01-22 17:57:21.733449: step: 1604/530, loss: 0.008241388015449047 2023-01-22 17:57:22.814637: step: 1608/530, loss: 0.003305027959868312 2023-01-22 17:57:23.899684: step: 1612/530, loss: 0.01975034549832344 2023-01-22 17:57:25.011860: step: 1616/530, loss: 0.014768530614674091 2023-01-22 17:57:26.067074: step: 1620/530, loss: 0.03643510118126869 2023-01-22 17:57:27.145440: step: 1624/530, loss: 0.0020543818827718496 2023-01-22 17:57:28.231491: step: 1628/530, loss: 0.003917388617992401 2023-01-22 17:57:29.320958: step: 1632/530, loss: 8.823875396046788e-05 2023-01-22 17:57:30.412952: step: 1636/530, loss: 0.003380486276000738 2023-01-22 17:57:31.483600: step: 1640/530, loss: 0.0044584074057638645 2023-01-22 17:57:32.581684: step: 1644/530, loss: 0.036464858800172806 2023-01-22 17:57:33.672493: step: 1648/530, loss: 0.004702022764831781 2023-01-22 17:57:34.795197: step: 1652/530, loss: 0.017135631293058395 2023-01-22 17:57:35.888745: step: 1656/530, loss: 0.0071953521110117435 2023-01-22 17:57:36.992830: step: 1660/530, loss: 0.00426038634032011 2023-01-22 17:57:38.092184: step: 1664/530, loss: 0.007563033606857061 2023-01-22 17:57:39.188265: step: 1668/530, loss: 0.0027075540274381638 2023-01-22 17:57:40.283202: step: 1672/530, loss: 0.015235417522490025 2023-01-22 17:57:41.378106: step: 1676/530, loss: 0.1320732980966568 2023-01-22 17:57:42.470538: step: 1680/530, loss: 0.003960240166634321 2023-01-22 17:57:43.574945: step: 1684/530, loss: 0.0065732491202652454 2023-01-22 17:57:44.675863: step: 1688/530, loss: 0.05801035463809967 2023-01-22 17:57:45.783362: step: 1692/530, loss: 0.0005680571775883436 2023-01-22 17:57:46.877506: step: 1696/530, loss: 0.00609312579035759 2023-01-22 17:57:47.976353: step: 1700/530, loss: 0.00030032210634090006 2023-01-22 17:57:49.080477: step: 1704/530, loss: 0.007867347449064255 2023-01-22 17:57:50.161689: step: 1708/530, loss: 0.015998782590031624 2023-01-22 17:57:51.265279: step: 1712/530, loss: 0.011615244671702385 2023-01-22 17:57:52.377850: step: 1716/530, loss: 0.027224913239479065 2023-01-22 17:57:53.473536: step: 1720/530, loss: 0.007757535204291344 2023-01-22 17:57:54.567385: step: 1724/530, loss: 0.005203958600759506 2023-01-22 17:57:55.661174: step: 1728/530, loss: 0.007733961101621389 2023-01-22 17:57:56.749002: step: 1732/530, loss: 0.0973784476518631 2023-01-22 17:57:57.844544: step: 1736/530, loss: 0.007953282445669174 2023-01-22 17:57:58.942545: step: 1740/530, loss: 0.0162724070250988 2023-01-22 17:58:00.052316: step: 1744/530, loss: 0.006409160792827606 2023-01-22 17:58:01.126558: step: 1748/530, loss: 0.0072939214296638966 2023-01-22 17:58:02.220146: step: 1752/530, loss: 0.006528573110699654 2023-01-22 17:58:03.314494: step: 1756/530, loss: 0.0005678427987731993 2023-01-22 17:58:04.401334: step: 1760/530, loss: 0.0056610689498484135 2023-01-22 17:58:05.479997: step: 1764/530, loss: 0.03463749587535858 2023-01-22 17:58:06.560837: step: 1768/530, loss: 0.001118711894378066 2023-01-22 17:58:07.677523: step: 1772/530, loss: 0.008784106932580471 2023-01-22 17:58:08.763433: step: 1776/530, loss: 0.00478857709094882 2023-01-22 17:58:09.844253: step: 1780/530, loss: 0.00412032101303339 2023-01-22 17:58:10.940010: step: 1784/530, loss: 0.006077309604734182 2023-01-22 17:58:12.041813: step: 1788/530, loss: 0.007692502345889807 2023-01-22 17:58:13.136028: step: 1792/530, loss: 0.005792549811303616 2023-01-22 17:58:14.223442: step: 1796/530, loss: 0.0033693709410727024 2023-01-22 17:58:15.309459: step: 1800/530, loss: 0.0012090852251276374 2023-01-22 17:58:16.400208: step: 1804/530, loss: 0.020762303844094276 2023-01-22 17:58:17.495217: step: 1808/530, loss: 0.00416500074788928 2023-01-22 17:58:18.607727: step: 1812/530, loss: 0.02418254129588604 2023-01-22 17:58:19.691583: step: 1816/530, loss: 0.012921021319925785 2023-01-22 17:58:20.789867: step: 1820/530, loss: 0.004524185787886381 2023-01-22 17:58:21.892250: step: 1824/530, loss: 0.003047233447432518 2023-01-22 17:58:22.993967: step: 1828/530, loss: 0.013662545010447502 2023-01-22 17:58:24.072013: step: 1832/530, loss: 0.0187588632106781 2023-01-22 17:58:25.175571: step: 1836/530, loss: 0.005499811843037605 2023-01-22 17:58:26.290632: step: 1840/530, loss: 0.02362939529120922 2023-01-22 17:58:27.384860: step: 1844/530, loss: 0.004111357033252716 2023-01-22 17:58:28.480825: step: 1848/530, loss: 0.010315585881471634 2023-01-22 17:58:29.578754: step: 1852/530, loss: 0.0072876568883657455 2023-01-22 17:58:30.661065: step: 1856/530, loss: 0.010600189678370953 2023-01-22 17:58:31.760240: step: 1860/530, loss: 0.01006628479808569 2023-01-22 17:58:32.848797: step: 1864/530, loss: 0.004517877474427223 2023-01-22 17:58:33.937750: step: 1868/530, loss: 0.010671298950910568 2023-01-22 17:58:34.995016: step: 1872/530, loss: 0.0008903589914552867 2023-01-22 17:58:36.075862: step: 1876/530, loss: 0.06083684042096138 2023-01-22 17:58:37.164174: step: 1880/530, loss: 0.037631455808877945 2023-01-22 17:58:38.243567: step: 1884/530, loss: 0.0668218582868576 2023-01-22 17:58:39.318229: step: 1888/530, loss: 0.026623815298080444 2023-01-22 17:58:40.417071: step: 1892/530, loss: 0.033049069344997406 2023-01-22 17:58:41.486576: step: 1896/530, loss: 0.01622823253273964 2023-01-22 17:58:42.577136: step: 1900/530, loss: 0.0043643200770020485 2023-01-22 17:58:43.675075: step: 1904/530, loss: 0.009135270491242409 2023-01-22 17:58:44.747557: step: 1908/530, loss: 0.01555678527802229 2023-01-22 17:58:45.865169: step: 1912/530, loss: 0.010884417220950127 2023-01-22 17:58:46.955035: step: 1916/530, loss: 0.011741231195628643 2023-01-22 17:58:48.051379: step: 1920/530, loss: 0.006384402513504028 2023-01-22 17:58:49.122180: step: 1924/530, loss: 0.023064740002155304 2023-01-22 17:58:50.199777: step: 1928/530, loss: 0.007335499860346317 2023-01-22 17:58:51.315623: step: 1932/530, loss: 0.002174460794776678 2023-01-22 17:58:52.409574: step: 1936/530, loss: 0.0009123747004196048 2023-01-22 17:58:53.504634: step: 1940/530, loss: 0.03267615661025047 2023-01-22 17:58:54.589150: step: 1944/530, loss: 0.01721155270934105 2023-01-22 17:58:55.666515: step: 1948/530, loss: 0.00958101637661457 2023-01-22 17:58:56.767913: step: 1952/530, loss: 0.00603700103238225 2023-01-22 17:58:57.864763: step: 1956/530, loss: 0.002537440275773406 2023-01-22 17:58:58.941687: step: 1960/530, loss: 0.0025301428977400064 2023-01-22 17:59:00.039017: step: 1964/530, loss: 0.012461566366255283 2023-01-22 17:59:01.126138: step: 1968/530, loss: 0.023656077682971954 2023-01-22 17:59:02.218506: step: 1972/530, loss: 0.007463125512003899 2023-01-22 17:59:03.297365: step: 1976/530, loss: 0.003984319977462292 2023-01-22 17:59:04.390906: step: 1980/530, loss: 0.018382729962468147 2023-01-22 17:59:05.491332: step: 1984/530, loss: 0.0034127768594771624 2023-01-22 17:59:06.592066: step: 1988/530, loss: 0.01551706250756979 2023-01-22 17:59:07.699721: step: 1992/530, loss: 0.020493097603321075 2023-01-22 17:59:08.778970: step: 1996/530, loss: 0.05537712201476097 2023-01-22 17:59:09.859915: step: 2000/530, loss: 0.004812260624021292 2023-01-22 17:59:10.956700: step: 2004/530, loss: 0.004523058421909809 2023-01-22 17:59:12.052531: step: 2008/530, loss: 0.009608150459825993 2023-01-22 17:59:13.146060: step: 2012/530, loss: 0.004829746205359697 2023-01-22 17:59:14.246247: step: 2016/530, loss: 0.004766157828271389 2023-01-22 17:59:15.341928: step: 2020/530, loss: 0.006347528658807278 2023-01-22 17:59:16.421831: step: 2024/530, loss: 0.022239279001951218 2023-01-22 17:59:17.496722: step: 2028/530, loss: 0.0022849151864647865 2023-01-22 17:59:18.587019: step: 2032/530, loss: 0.01862087845802307 2023-01-22 17:59:19.666506: step: 2036/530, loss: 0.006219734437763691 2023-01-22 17:59:20.770740: step: 2040/530, loss: 0.006357923150062561 2023-01-22 17:59:21.872576: step: 2044/530, loss: 0.004786049947142601 2023-01-22 17:59:22.963930: step: 2048/530, loss: 0.003965491894632578 2023-01-22 17:59:24.038845: step: 2052/530, loss: 0.007487200200557709 2023-01-22 17:59:25.126283: step: 2056/530, loss: 0.014578355476260185 2023-01-22 17:59:26.214991: step: 2060/530, loss: 0.0032622357830405235 2023-01-22 17:59:27.313558: step: 2064/530, loss: 0.008332009427249432 2023-01-22 17:59:28.418675: step: 2068/530, loss: 0.01456921361386776 2023-01-22 17:59:29.512784: step: 2072/530, loss: 0.008971704170107841 2023-01-22 17:59:30.601428: step: 2076/530, loss: 0.008645850233733654 2023-01-22 17:59:31.700818: step: 2080/530, loss: 0.012069402262568474 2023-01-22 17:59:32.796622: step: 2084/530, loss: 0.002603366272523999 2023-01-22 17:59:33.878953: step: 2088/530, loss: 0.0016511273570358753 2023-01-22 17:59:34.983397: step: 2092/530, loss: 0.011426740325987339 2023-01-22 17:59:36.068669: step: 2096/530, loss: 0.0041406708769500256 2023-01-22 17:59:37.138614: step: 2100/530, loss: 0.005497670266777277 2023-01-22 17:59:38.233989: step: 2104/530, loss: 0.0884915366768837 2023-01-22 17:59:39.330618: step: 2108/530, loss: 0.0007639945833943784 2023-01-22 17:59:40.414574: step: 2112/530, loss: 0.012787983752787113 2023-01-22 17:59:41.530822: step: 2116/530, loss: 0.00024670781567692757 2023-01-22 17:59:42.616994: step: 2120/530, loss: 0.02791227400302887 ================================================== Loss: 0.012 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33718307593307595, 'r': 0.3550979262672811, 'f1': 0.3459087008185899}, 'combined': 0.2548800953400136, 'stategy': 1, 'epoch': 4} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33073405461480215, 'r': 0.2885335669339817, 'f1': 0.30819591777100425}, 'combined': 0.19140588577357107, 'stategy': 1, 'epoch': 4} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33917510550090635, 'r': 0.3256595889629196, 'f1': 0.3322799678285743}, 'combined': 0.24483787103158103, 'stategy': 1, 'epoch': 4} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3437305177287306, 'r': 0.29758308395666017, 'f1': 0.31899646989216585}, 'combined': 0.19811359709092408, 'stategy': 1, 'epoch': 4} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 4} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 4} New best korean model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34039493836931506, 'r': 0.331352188583413, 'f1': 0.33581269881434356}, 'combined': 0.24744093596846367, 'stategy': 1, 'epoch': 3} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3460110194391069, 'r': 0.2995574176190491, 'f1': 0.3211128720085679}, 'combined': 0.19942799419479482, 'stategy': 1, 'epoch': 3} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 3} ****************************** Epoch: 5 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 18:02:23.596357: step: 4/530, loss: 0.009927969425916672 2023-01-22 18:02:24.678838: step: 8/530, loss: 0.005128829274326563 2023-01-22 18:02:25.762905: step: 12/530, loss: 0.04475068673491478 2023-01-22 18:02:26.870918: step: 16/530, loss: 0.009328820742666721 2023-01-22 18:02:27.936831: step: 20/530, loss: 0.00403439300134778 2023-01-22 18:02:29.012668: step: 24/530, loss: 0.01125125028192997 2023-01-22 18:02:30.111642: step: 28/530, loss: 0.0048458450473845005 2023-01-22 18:02:31.198964: step: 32/530, loss: 0.013264902867376804 2023-01-22 18:02:32.309179: step: 36/530, loss: 0.018973875790834427 2023-01-22 18:02:33.403733: step: 40/530, loss: 0.016321133822202682 2023-01-22 18:02:34.495854: step: 44/530, loss: 0.010839315131306648 2023-01-22 18:02:35.577898: step: 48/530, loss: 0.006358737591654062 2023-01-22 18:02:36.643954: step: 52/530, loss: 0.008591302670538425 2023-01-22 18:02:37.742046: step: 56/530, loss: 0.0012758837547153234 2023-01-22 18:02:38.824838: step: 60/530, loss: 0.004210789687931538 2023-01-22 18:02:39.934494: step: 64/530, loss: 0.011850784532725811 2023-01-22 18:02:41.032479: step: 68/530, loss: 0.00352488667704165 2023-01-22 18:02:42.133448: step: 72/530, loss: 0.0006779723917134106 2023-01-22 18:02:43.235461: step: 76/530, loss: 0.019818367436528206 2023-01-22 18:02:44.304606: step: 80/530, loss: 0.002778246533125639 2023-01-22 18:02:45.412345: step: 84/530, loss: 0.01132697518914938 2023-01-22 18:02:46.516340: step: 88/530, loss: 0.02920081838965416 2023-01-22 18:02:47.656464: step: 92/530, loss: 0.06911709159612656 2023-01-22 18:02:48.772339: step: 96/530, loss: 0.006899694446474314 2023-01-22 18:02:49.861564: step: 100/530, loss: 0.01456447783857584 2023-01-22 18:02:50.952483: step: 104/530, loss: 0.006375570315867662 2023-01-22 18:02:52.053295: step: 108/530, loss: 0.0024532810784876347 2023-01-22 18:02:53.159079: step: 112/530, loss: 0.0017753717256709933 2023-01-22 18:02:54.249702: step: 116/530, loss: 0.011672258377075195 2023-01-22 18:02:55.375770: step: 120/530, loss: 0.00401636678725481 2023-01-22 18:02:56.511524: step: 124/530, loss: 0.01942227967083454 2023-01-22 18:02:57.603489: step: 128/530, loss: 0.005506512243300676 2023-01-22 18:02:58.712917: step: 132/530, loss: 0.0021414831280708313 2023-01-22 18:02:59.798243: step: 136/530, loss: 0.005920359864830971 2023-01-22 18:03:00.903010: step: 140/530, loss: 0.003510456532239914 2023-01-22 18:03:01.975270: step: 144/530, loss: 0.002353669609874487 2023-01-22 18:03:03.075413: step: 148/530, loss: 0.010640815831720829 2023-01-22 18:03:04.175622: step: 152/530, loss: 0.03576274216175079 2023-01-22 18:03:05.254127: step: 156/530, loss: 0.008341441862285137 2023-01-22 18:03:06.352823: step: 160/530, loss: 0.003986270632594824 2023-01-22 18:03:07.431339: step: 164/530, loss: 0.001406124560162425 2023-01-22 18:03:08.517309: step: 168/530, loss: 0.009706404060125351 2023-01-22 18:03:09.599369: step: 172/530, loss: 0.004061954095959663 2023-01-22 18:03:10.699866: step: 176/530, loss: 0.005667248275130987 2023-01-22 18:03:11.826088: step: 180/530, loss: 0.005562384147197008 2023-01-22 18:03:12.943020: step: 184/530, loss: 0.008082667365670204 2023-01-22 18:03:14.031910: step: 188/530, loss: 0.007437993306666613 2023-01-22 18:03:15.096801: step: 192/530, loss: 0.004453169647604227 2023-01-22 18:03:16.186738: step: 196/530, loss: 5.284436701913364e-05 2023-01-22 18:03:17.300930: step: 200/530, loss: 0.03970012813806534 2023-01-22 18:03:18.413408: step: 204/530, loss: 0.0004708790220320225 2023-01-22 18:03:19.492035: step: 208/530, loss: 0.01243553962558508 2023-01-22 18:03:20.584873: step: 212/530, loss: 0.014587502926588058 2023-01-22 18:03:21.664582: step: 216/530, loss: 0.00047801644541323185 2023-01-22 18:03:22.741171: step: 220/530, loss: 0.01798751763999462 2023-01-22 18:03:23.828213: step: 224/530, loss: 0.002520455978810787 2023-01-22 18:03:24.927347: step: 228/530, loss: 0.006364905741065741 2023-01-22 18:03:26.010127: step: 232/530, loss: 0.028661977499723434 2023-01-22 18:03:27.116522: step: 236/530, loss: 0.004739727824926376 2023-01-22 18:03:28.211337: step: 240/530, loss: 0.0007106245029717684 2023-01-22 18:03:29.309979: step: 244/530, loss: 0.0038836118765175343 2023-01-22 18:03:30.390646: step: 248/530, loss: 0.0033591161482036114 2023-01-22 18:03:31.471257: step: 252/530, loss: 0.01268624048680067 2023-01-22 18:03:32.560600: step: 256/530, loss: 0.0034052045084536076 2023-01-22 18:03:33.650437: step: 260/530, loss: 0.004034136421978474 2023-01-22 18:03:34.748169: step: 264/530, loss: 0.004076881799846888 2023-01-22 18:03:35.831361: step: 268/530, loss: 0.0006219844799488783 2023-01-22 18:03:36.913353: step: 272/530, loss: 0.0031220486853271723 2023-01-22 18:03:38.027198: step: 276/530, loss: 0.00915757566690445 2023-01-22 18:03:39.122402: step: 280/530, loss: 0.0012872337829321623 2023-01-22 18:03:40.218482: step: 284/530, loss: 0.002386258915066719 2023-01-22 18:03:41.314040: step: 288/530, loss: 0.004436228424310684 2023-01-22 18:03:42.409221: step: 292/530, loss: 0.006758742965757847 2023-01-22 18:03:43.506419: step: 296/530, loss: 0.007563683204352856 2023-01-22 18:03:44.624605: step: 300/530, loss: 0.005827596411108971 2023-01-22 18:03:45.720316: step: 304/530, loss: 0.0043299635872244835 2023-01-22 18:03:46.830192: step: 308/530, loss: 0.00750034861266613 2023-01-22 18:03:47.923002: step: 312/530, loss: 0.005572655238211155 2023-01-22 18:03:49.021574: step: 316/530, loss: 0.003433826146647334 2023-01-22 18:03:50.102661: step: 320/530, loss: 0.00217996072024107 2023-01-22 18:03:51.201717: step: 324/530, loss: 0.012475233525037766 2023-01-22 18:03:52.292572: step: 328/530, loss: 0.0126360934227705 2023-01-22 18:03:53.408241: step: 332/530, loss: 0.006459742784500122 2023-01-22 18:03:54.505235: step: 336/530, loss: 0.006656565237790346 2023-01-22 18:03:55.592959: step: 340/530, loss: 0.01680254004895687 2023-01-22 18:03:56.670102: step: 344/530, loss: 0.003458525286987424 2023-01-22 18:03:57.769764: step: 348/530, loss: 0.007182309869676828 2023-01-22 18:03:58.879736: step: 352/530, loss: 0.0039078895933926105 2023-01-22 18:03:59.955956: step: 356/530, loss: 0.0017451149178668857 2023-01-22 18:04:01.019871: step: 360/530, loss: 3.626816032920033e-05 2023-01-22 18:04:02.117813: step: 364/530, loss: 0.005791897885501385 2023-01-22 18:04:03.211311: step: 368/530, loss: 0.005260811187326908 2023-01-22 18:04:04.291674: step: 372/530, loss: 0.0026299997698515654 2023-01-22 18:04:05.396152: step: 376/530, loss: 0.029537083581089973 2023-01-22 18:04:06.504200: step: 380/530, loss: 0.02752068266272545 2023-01-22 18:04:07.582229: step: 384/530, loss: 0.005755385383963585 2023-01-22 18:04:08.681359: step: 388/530, loss: 0.005558202508836985 2023-01-22 18:04:09.766011: step: 392/530, loss: 0.047580499202013016 2023-01-22 18:04:10.850686: step: 396/530, loss: 0.035065244883298874 2023-01-22 18:04:11.957415: step: 400/530, loss: 0.0002280263288412243 2023-01-22 18:04:13.050642: step: 404/530, loss: 0.0006840199930593371 2023-01-22 18:04:14.123007: step: 408/530, loss: 0.0070375413633883 2023-01-22 18:04:15.193042: step: 412/530, loss: 0.013827987015247345 2023-01-22 18:04:16.285260: step: 416/530, loss: 0.008810057304799557 2023-01-22 18:04:17.382104: step: 420/530, loss: 0.0017100953264161944 2023-01-22 18:04:18.489780: step: 424/530, loss: 0.005180246662348509 2023-01-22 18:04:19.594680: step: 428/530, loss: 0.02431401051580906 2023-01-22 18:04:20.669110: step: 432/530, loss: 0.01683223247528076 2023-01-22 18:04:21.776295: step: 436/530, loss: 0.030931025743484497 2023-01-22 18:04:22.899173: step: 440/530, loss: 0.00038184644654393196 2023-01-22 18:04:24.019747: step: 444/530, loss: 0.003955648746341467 2023-01-22 18:04:25.113280: step: 448/530, loss: 0.03574395924806595 2023-01-22 18:04:26.192002: step: 452/530, loss: 0.007264542859047651 2023-01-22 18:04:27.316718: step: 456/530, loss: 0.015016872435808182 2023-01-22 18:04:28.421934: step: 460/530, loss: 0.0055486224591732025 2023-01-22 18:04:29.503125: step: 464/530, loss: 0.007629780564457178 2023-01-22 18:04:30.600002: step: 468/530, loss: 0.005283321253955364 2023-01-22 18:04:31.681466: step: 472/530, loss: 0.0037030719686299562 2023-01-22 18:04:32.779085: step: 476/530, loss: 0.009584475308656693 2023-01-22 18:04:33.873483: step: 480/530, loss: 0.10841675102710724 2023-01-22 18:04:34.970119: step: 484/530, loss: 0.007172941230237484 2023-01-22 18:04:36.079338: step: 488/530, loss: 0.007054260466247797 2023-01-22 18:04:37.156459: step: 492/530, loss: 0.0069967638701200485 2023-01-22 18:04:38.245171: step: 496/530, loss: 0.007977736182510853 2023-01-22 18:04:39.322648: step: 500/530, loss: 0.005747297313064337 2023-01-22 18:04:40.418653: step: 504/530, loss: 0.014383424073457718 2023-01-22 18:04:41.493992: step: 508/530, loss: 0.006413948722183704 2023-01-22 18:04:42.605596: step: 512/530, loss: 0.021535467356443405 2023-01-22 18:04:43.700025: step: 516/530, loss: 0.013873053714632988 2023-01-22 18:04:44.793657: step: 520/530, loss: 0.0021121506579220295 2023-01-22 18:04:45.892893: step: 524/530, loss: 0.007193238474428654 2023-01-22 18:04:46.993346: step: 528/530, loss: 0.005421261768788099 2023-01-22 18:04:48.080234: step: 532/530, loss: 0.02269272319972515 2023-01-22 18:04:49.183532: step: 536/530, loss: 0.020114630460739136 2023-01-22 18:04:50.279394: step: 540/530, loss: 0.028823966160416603 2023-01-22 18:04:51.350426: step: 544/530, loss: 0.005062198266386986 2023-01-22 18:04:52.471598: step: 548/530, loss: 0.004133230075240135 2023-01-22 18:04:53.580401: step: 552/530, loss: 0.004652720410376787 2023-01-22 18:04:54.685964: step: 556/530, loss: 0.0068655614741146564 2023-01-22 18:04:55.788604: step: 560/530, loss: 0.01430361345410347 2023-01-22 18:04:56.887500: step: 564/530, loss: 0.005681750364601612 2023-01-22 18:04:57.962945: step: 568/530, loss: 0.0023478225339204073 2023-01-22 18:04:59.066330: step: 572/530, loss: 0.0022609184961766005 2023-01-22 18:05:00.179845: step: 576/530, loss: 0.006015228573232889 2023-01-22 18:05:01.270689: step: 580/530, loss: 0.004941890016198158 2023-01-22 18:05:02.355110: step: 584/530, loss: 0.017170375213027 2023-01-22 18:05:03.476898: step: 588/530, loss: 0.02504393830895424 2023-01-22 18:05:04.564980: step: 592/530, loss: 0.012134358286857605 2023-01-22 18:05:05.662776: step: 596/530, loss: 0.031021377071738243 2023-01-22 18:05:06.738477: step: 600/530, loss: 0.0015711723826825619 2023-01-22 18:05:07.800409: step: 604/530, loss: 0.0014493025373667479 2023-01-22 18:05:08.910563: step: 608/530, loss: 0.020252171903848648 2023-01-22 18:05:10.015145: step: 612/530, loss: 0.0039865863509476185 2023-01-22 18:05:11.096930: step: 616/530, loss: 0.016128981485962868 2023-01-22 18:05:12.165052: step: 620/530, loss: 0.038906656205654144 2023-01-22 18:05:13.287645: step: 624/530, loss: 0.010242643766105175 2023-01-22 18:05:14.354038: step: 628/530, loss: 0.010289092548191547 2023-01-22 18:05:15.438927: step: 632/530, loss: 0.0020376669708639383 2023-01-22 18:05:16.510702: step: 636/530, loss: 0.04130535572767258 2023-01-22 18:05:17.592281: step: 640/530, loss: 0.008746541105210781 2023-01-22 18:05:18.695647: step: 644/530, loss: 0.009842237457633018 2023-01-22 18:05:19.798762: step: 648/530, loss: 0.022690266370773315 2023-01-22 18:05:20.884302: step: 652/530, loss: 0.017371635884046555 2023-01-22 18:05:21.981722: step: 656/530, loss: 0.004394746385514736 2023-01-22 18:05:23.065923: step: 660/530, loss: 0.005064487922936678 2023-01-22 18:05:24.146510: step: 664/530, loss: 0.0037051455583423376 2023-01-22 18:05:25.221143: step: 668/530, loss: 0.0002648273075465113 2023-01-22 18:05:26.307309: step: 672/530, loss: 0.0028208144940435886 2023-01-22 18:05:27.413883: step: 676/530, loss: 0.01486341655254364 2023-01-22 18:05:28.506097: step: 680/530, loss: 0.013482906855642796 2023-01-22 18:05:29.585626: step: 684/530, loss: 0.0019089989364147186 2023-01-22 18:05:30.672827: step: 688/530, loss: 0.025296710431575775 2023-01-22 18:05:31.770413: step: 692/530, loss: 0.0018094453262165189 2023-01-22 18:05:32.883225: step: 696/530, loss: 0.005951243452727795 2023-01-22 18:05:33.960048: step: 700/530, loss: 0.002945193089544773 2023-01-22 18:05:35.066994: step: 704/530, loss: 0.004906233865767717 2023-01-22 18:05:36.150980: step: 708/530, loss: 0.0020124120637774467 2023-01-22 18:05:37.230737: step: 712/530, loss: 0.004250792786478996 2023-01-22 18:05:38.352266: step: 716/530, loss: 0.06334321945905685 2023-01-22 18:05:39.449456: step: 720/530, loss: 0.012508920393884182 2023-01-22 18:05:40.531301: step: 724/530, loss: 0.0014923866838216782 2023-01-22 18:05:41.641703: step: 728/530, loss: 0.00275184097699821 2023-01-22 18:05:42.740206: step: 732/530, loss: 0.008599773980677128 2023-01-22 18:05:43.864647: step: 736/530, loss: 0.0076149520464241505 2023-01-22 18:05:44.964982: step: 740/530, loss: 0.02288990281522274 2023-01-22 18:05:46.061680: step: 744/530, loss: 0.006646342575550079 2023-01-22 18:05:47.156609: step: 748/530, loss: 0.0033843473065644503 2023-01-22 18:05:48.239605: step: 752/530, loss: 0.0006627660477533937 2023-01-22 18:05:49.335064: step: 756/530, loss: 0.003157450584694743 2023-01-22 18:05:50.429725: step: 760/530, loss: 0.028473051264882088 2023-01-22 18:05:51.539057: step: 764/530, loss: 0.004545000847429037 2023-01-22 18:05:52.641370: step: 768/530, loss: 0.0012491007801145315 2023-01-22 18:05:53.728450: step: 772/530, loss: 0.005975918844342232 2023-01-22 18:05:54.830725: step: 776/530, loss: 0.03943159058690071 2023-01-22 18:05:55.967320: step: 780/530, loss: 0.01770174689590931 2023-01-22 18:05:57.065352: step: 784/530, loss: 0.008249512873589993 2023-01-22 18:05:58.147138: step: 788/530, loss: 0.011769704520702362 2023-01-22 18:05:59.232054: step: 792/530, loss: 0.008093920536339283 2023-01-22 18:06:00.321874: step: 796/530, loss: 0.009733738377690315 2023-01-22 18:06:01.423734: step: 800/530, loss: 0.0033110210206359625 2023-01-22 18:06:02.517857: step: 804/530, loss: 0.006189823616296053 2023-01-22 18:06:03.635397: step: 808/530, loss: 0.018803108483552933 2023-01-22 18:06:04.722213: step: 812/530, loss: 0.05368834733963013 2023-01-22 18:06:05.814264: step: 816/530, loss: 0.014654400758445263 2023-01-22 18:06:06.902292: step: 820/530, loss: 0.015123249962925911 2023-01-22 18:06:08.019336: step: 824/530, loss: 0.02406453527510166 2023-01-22 18:06:09.109763: step: 828/530, loss: 0.0017264683265239 2023-01-22 18:06:10.223741: step: 832/530, loss: 0.006244051735848188 2023-01-22 18:06:11.297982: step: 836/530, loss: 0.0006846334435977042 2023-01-22 18:06:12.380893: step: 840/530, loss: 0.013209469616413116 2023-01-22 18:06:13.497610: step: 844/530, loss: 0.004798524081707001 2023-01-22 18:06:14.579288: step: 848/530, loss: 0.016030339524149895 2023-01-22 18:06:15.665387: step: 852/530, loss: 0.0027581085450947285 2023-01-22 18:06:16.765979: step: 856/530, loss: 0.0014344928786158562 2023-01-22 18:06:17.851426: step: 860/530, loss: 0.01735539920628071 2023-01-22 18:06:18.958212: step: 864/530, loss: 0.006705708801746368 2023-01-22 18:06:20.051219: step: 868/530, loss: 0.01609933376312256 2023-01-22 18:06:21.136814: step: 872/530, loss: 0.034301504492759705 2023-01-22 18:06:22.217242: step: 876/530, loss: 0.005869516171514988 2023-01-22 18:06:23.293231: step: 880/530, loss: 0.008199592120945454 2023-01-22 18:06:24.381291: step: 884/530, loss: 0.003910835832357407 2023-01-22 18:06:25.494969: step: 888/530, loss: 0.02594786509871483 2023-01-22 18:06:26.596313: step: 892/530, loss: 0.0013578069629147649 2023-01-22 18:06:27.675861: step: 896/530, loss: 0.006081853527575731 2023-01-22 18:06:28.779593: step: 900/530, loss: 0.004724468570202589 2023-01-22 18:06:29.834245: step: 904/530, loss: 0.005373109132051468 2023-01-22 18:06:30.927549: step: 908/530, loss: 0.011944221332669258 2023-01-22 18:06:32.038597: step: 912/530, loss: 0.015439932234585285 2023-01-22 18:06:33.133758: step: 916/530, loss: 0.004212393891066313 2023-01-22 18:06:34.207768: step: 920/530, loss: 0.005986310075968504 2023-01-22 18:06:35.320171: step: 924/530, loss: 0.017463088035583496 2023-01-22 18:06:36.446935: step: 928/530, loss: 0.010621001943945885 2023-01-22 18:06:37.514933: step: 932/530, loss: 0.0020706690847873688 2023-01-22 18:06:38.644017: step: 936/530, loss: 0.017201585695147514 2023-01-22 18:06:39.742023: step: 940/530, loss: 0.0015285331755876541 2023-01-22 18:06:40.830121: step: 944/530, loss: 0.004085628781467676 2023-01-22 18:06:41.901861: step: 948/530, loss: 0.0055943639017641544 2023-01-22 18:06:43.024601: step: 952/530, loss: 0.0012125269277021289 2023-01-22 18:06:44.127572: step: 956/530, loss: 0.03324398770928383 2023-01-22 18:06:45.207661: step: 960/530, loss: 0.036107923835515976 2023-01-22 18:06:46.278897: step: 964/530, loss: 0.010087436996400356 2023-01-22 18:06:47.398026: step: 968/530, loss: 0.021248996257781982 2023-01-22 18:06:48.528908: step: 972/530, loss: 0.010942698456346989 2023-01-22 18:06:49.634462: step: 976/530, loss: 0.009958078153431416 2023-01-22 18:06:50.733018: step: 980/530, loss: 0.008440959267318249 2023-01-22 18:06:51.830848: step: 984/530, loss: 0.0015444383025169373 2023-01-22 18:06:52.927687: step: 988/530, loss: 0.011825080029666424 2023-01-22 18:06:54.014392: step: 992/530, loss: 0.042501576244831085 2023-01-22 18:06:55.110226: step: 996/530, loss: 0.022968651726841927 2023-01-22 18:06:56.198191: step: 1000/530, loss: 0.00941373035311699 2023-01-22 18:06:57.320815: step: 1004/530, loss: 0.003551363479346037 2023-01-22 18:06:58.398447: step: 1008/530, loss: 0.0031270224135369062 2023-01-22 18:06:59.479201: step: 1012/530, loss: 0.0016350416699424386 2023-01-22 18:07:00.592010: step: 1016/530, loss: 0.014712892472743988 2023-01-22 18:07:01.665166: step: 1020/530, loss: 0.006596389692276716 2023-01-22 18:07:02.744131: step: 1024/530, loss: 0.012117584235966206 2023-01-22 18:07:03.837041: step: 1028/530, loss: 0.004741362761706114 2023-01-22 18:07:04.927424: step: 1032/530, loss: 0.00014142485451884568 2023-01-22 18:07:06.032165: step: 1036/530, loss: 0.005007429048418999 2023-01-22 18:07:07.123891: step: 1040/530, loss: 0.02516634203493595 2023-01-22 18:07:08.226276: step: 1044/530, loss: 0.016056302934885025 2023-01-22 18:07:09.309495: step: 1048/530, loss: 0.003571026958525181 2023-01-22 18:07:10.410397: step: 1052/530, loss: 0.005324543919414282 2023-01-22 18:07:11.514650: step: 1056/530, loss: 0.009494753554463387 2023-01-22 18:07:12.622956: step: 1060/530, loss: 0.007454304024577141 2023-01-22 18:07:13.739783: step: 1064/530, loss: 0.003984508570283651 2023-01-22 18:07:14.837966: step: 1068/530, loss: 0.007783366832882166 2023-01-22 18:07:15.932249: step: 1072/530, loss: 0.0051447865553200245 2023-01-22 18:07:17.034481: step: 1076/530, loss: 0.024477636441588402 2023-01-22 18:07:18.140021: step: 1080/530, loss: 0.027586881071329117 2023-01-22 18:07:19.232195: step: 1084/530, loss: 0.0050377678126096725 2023-01-22 18:07:20.330344: step: 1088/530, loss: 0.0016665261937305331 2023-01-22 18:07:21.401192: step: 1092/530, loss: 0.022634021937847137 2023-01-22 18:07:22.497439: step: 1096/530, loss: 0.008211866952478886 2023-01-22 18:07:23.562742: step: 1100/530, loss: 0.007138671353459358 2023-01-22 18:07:24.652303: step: 1104/530, loss: 0.03303040564060211 2023-01-22 18:07:25.778488: step: 1108/530, loss: 0.006315619219094515 2023-01-22 18:07:26.849701: step: 1112/530, loss: 0.006362857297062874 2023-01-22 18:07:27.948096: step: 1116/530, loss: 0.003907065838575363 2023-01-22 18:07:29.055491: step: 1120/530, loss: 0.00701772328466177 2023-01-22 18:07:30.138594: step: 1124/530, loss: 0.0060411663725972176 2023-01-22 18:07:31.245514: step: 1128/530, loss: 0.0063125137239694595 2023-01-22 18:07:32.337216: step: 1132/530, loss: 0.0009099377784878016 2023-01-22 18:07:33.429619: step: 1136/530, loss: 0.00436819763854146 2023-01-22 18:07:34.530476: step: 1140/530, loss: 0.006643245927989483 2023-01-22 18:07:35.631196: step: 1144/530, loss: 0.05079443007707596 2023-01-22 18:07:36.733377: step: 1148/530, loss: 0.004961497150361538 2023-01-22 18:07:37.835374: step: 1152/530, loss: 0.004648693837225437 2023-01-22 18:07:38.922207: step: 1156/530, loss: 0.009455114603042603 2023-01-22 18:07:40.004276: step: 1160/530, loss: 0.003025786718353629 2023-01-22 18:07:41.087844: step: 1164/530, loss: 0.002651132410392165 2023-01-22 18:07:42.166035: step: 1168/530, loss: 0.006034562364220619 2023-01-22 18:07:43.267111: step: 1172/530, loss: 0.055347051471471786 2023-01-22 18:07:44.372253: step: 1176/530, loss: 0.04707120358943939 2023-01-22 18:07:45.429474: step: 1180/530, loss: 0.00532685499638319 2023-01-22 18:07:46.510145: step: 1184/530, loss: 0.03385983780026436 2023-01-22 18:07:47.604099: step: 1188/530, loss: 0.006398843601346016 2023-01-22 18:07:48.704254: step: 1192/530, loss: 0.004570150747895241 2023-01-22 18:07:49.799913: step: 1196/530, loss: 0.0069955140352249146 2023-01-22 18:07:50.868512: step: 1200/530, loss: 0.016269484534859657 2023-01-22 18:07:51.936619: step: 1204/530, loss: 0.008860309608280659 2023-01-22 18:07:53.027886: step: 1208/530, loss: 0.001976356143131852 2023-01-22 18:07:54.120262: step: 1212/530, loss: 0.0010373091790825129 2023-01-22 18:07:55.220350: step: 1216/530, loss: 0.005320926196873188 2023-01-22 18:07:56.314898: step: 1220/530, loss: 0.02453349344432354 2023-01-22 18:07:57.384311: step: 1224/530, loss: 0.02141612395644188 2023-01-22 18:07:58.466339: step: 1228/530, loss: 0.0006792772328481078 2023-01-22 18:07:59.576738: step: 1232/530, loss: 0.004519452340900898 2023-01-22 18:08:00.658273: step: 1236/530, loss: 0.03056146204471588 2023-01-22 18:08:01.734361: step: 1240/530, loss: 0.004883999936282635 2023-01-22 18:08:02.839337: step: 1244/530, loss: 0.005924487952142954 2023-01-22 18:08:03.948351: step: 1248/530, loss: 0.02378247119486332 2023-01-22 18:08:05.034372: step: 1252/530, loss: 0.01055564358830452 2023-01-22 18:08:06.119985: step: 1256/530, loss: 0.007359538692981005 2023-01-22 18:08:07.206314: step: 1260/530, loss: 0.008896327577531338 2023-01-22 18:08:08.329617: step: 1264/530, loss: 0.0075872051529586315 2023-01-22 18:08:09.418126: step: 1268/530, loss: 0.004266760777682066 2023-01-22 18:08:10.523951: step: 1272/530, loss: 0.038588110357522964 2023-01-22 18:08:11.615254: step: 1276/530, loss: 0.008576435036957264 2023-01-22 18:08:12.708069: step: 1280/530, loss: 0.028927817940711975 2023-01-22 18:08:13.825912: step: 1284/530, loss: 0.0011064070276916027 2023-01-22 18:08:14.911023: step: 1288/530, loss: 0.024422533810138702 2023-01-22 18:08:16.000690: step: 1292/530, loss: 0.04459747299551964 2023-01-22 18:08:17.072526: step: 1296/530, loss: 0.00013573789328802377 2023-01-22 18:08:18.151945: step: 1300/530, loss: 0.03848407417535782 2023-01-22 18:08:19.272213: step: 1304/530, loss: 0.01567724347114563 2023-01-22 18:08:20.396076: step: 1308/530, loss: 0.07717403769493103 2023-01-22 18:08:21.480264: step: 1312/530, loss: 0.0018159148748964071 2023-01-22 18:08:22.580268: step: 1316/530, loss: 0.031898293644189835 2023-01-22 18:08:23.671547: step: 1320/530, loss: 0.0041343942284584045 2023-01-22 18:08:24.774955: step: 1324/530, loss: 0.0022816993296146393 2023-01-22 18:08:25.867079: step: 1328/530, loss: 0.0031828333158046007 2023-01-22 18:08:26.942277: step: 1332/530, loss: 0.00687678437680006 2023-01-22 18:08:28.023573: step: 1336/530, loss: 0.005433598533272743 2023-01-22 18:08:29.104807: step: 1340/530, loss: 0.00604582391679287 2023-01-22 18:08:30.196601: step: 1344/530, loss: 0.0007604804704897106 2023-01-22 18:08:31.347110: step: 1348/530, loss: 0.042319100350141525 2023-01-22 18:08:32.425167: step: 1352/530, loss: 0.0055596185848116875 2023-01-22 18:08:33.508577: step: 1356/530, loss: 0.006614349782466888 2023-01-22 18:08:34.606768: step: 1360/530, loss: 0.002728455699980259 2023-01-22 18:08:35.684082: step: 1364/530, loss: 0.0019447727827355266 2023-01-22 18:08:36.767797: step: 1368/530, loss: 0.03412714973092079 2023-01-22 18:08:37.857017: step: 1372/530, loss: 0.008057081140577793 2023-01-22 18:08:38.944020: step: 1376/530, loss: 0.009723569266498089 2023-01-22 18:08:40.011568: step: 1380/530, loss: 0.0020942145492881536 2023-01-22 18:08:41.096717: step: 1384/530, loss: 0.037779707461595535 2023-01-22 18:08:42.192708: step: 1388/530, loss: 0.004162820987403393 2023-01-22 18:08:43.307341: step: 1392/530, loss: 0.0030314435716718435 2023-01-22 18:08:44.406770: step: 1396/530, loss: 0.008005054667592049 2023-01-22 18:08:45.492519: step: 1400/530, loss: 0.015445479191839695 2023-01-22 18:08:46.585843: step: 1404/530, loss: 0.0054588885977864265 2023-01-22 18:08:47.680498: step: 1408/530, loss: 0.0009541259496472776 2023-01-22 18:08:48.769319: step: 1412/530, loss: 3.309938983875327e-05 2023-01-22 18:08:49.888134: step: 1416/530, loss: 0.0037648354191333055 2023-01-22 18:08:50.994381: step: 1420/530, loss: 0.009427951648831367 2023-01-22 18:08:52.096133: step: 1424/530, loss: 0.00912496168166399 2023-01-22 18:08:53.164836: step: 1428/530, loss: 0.0034798718988895416 2023-01-22 18:08:54.258272: step: 1432/530, loss: 0.0017370186978951097 2023-01-22 18:08:55.346814: step: 1436/530, loss: 0.00719187268987298 2023-01-22 18:08:56.434485: step: 1440/530, loss: 0.012083577923476696 2023-01-22 18:08:57.517551: step: 1444/530, loss: 0.029020706191658974 2023-01-22 18:08:58.626546: step: 1448/530, loss: 0.019146781414747238 2023-01-22 18:08:59.727142: step: 1452/530, loss: 0.004539281129837036 2023-01-22 18:09:00.809006: step: 1456/530, loss: 0.0032251356169581413 2023-01-22 18:09:01.915325: step: 1460/530, loss: 0.005161783192306757 2023-01-22 18:09:03.006513: step: 1464/530, loss: 0.002296453109011054 2023-01-22 18:09:04.088623: step: 1468/530, loss: 0.014328506775200367 2023-01-22 18:09:05.199820: step: 1472/530, loss: 0.025557201355695724 2023-01-22 18:09:06.297624: step: 1476/530, loss: 0.024794891476631165 2023-01-22 18:09:07.378837: step: 1480/530, loss: 0.003375542815774679 2023-01-22 18:09:08.496546: step: 1484/530, loss: 0.039767853915691376 2023-01-22 18:09:09.598746: step: 1488/530, loss: 0.005468260031193495 2023-01-22 18:09:10.688107: step: 1492/530, loss: 0.008726963773369789 2023-01-22 18:09:11.814112: step: 1496/530, loss: 0.005459923762828112 2023-01-22 18:09:12.917315: step: 1500/530, loss: 0.0030650740955024958 2023-01-22 18:09:14.014441: step: 1504/530, loss: 0.0014649203512817621 2023-01-22 18:09:15.117006: step: 1508/530, loss: 0.005837735719978809 2023-01-22 18:09:16.191452: step: 1512/530, loss: 0.0023033074103295803 2023-01-22 18:09:17.295855: step: 1516/530, loss: 0.008538995869457722 2023-01-22 18:09:18.385489: step: 1520/530, loss: 0.02530035749077797 2023-01-22 18:09:19.465535: step: 1524/530, loss: 0.0003509093075990677 2023-01-22 18:09:20.579078: step: 1528/530, loss: 0.0025637757498770952 2023-01-22 18:09:21.670775: step: 1532/530, loss: 0.023431751877069473 2023-01-22 18:09:22.759691: step: 1536/530, loss: 0.02613828144967556 2023-01-22 18:09:23.855851: step: 1540/530, loss: 0.02312270551919937 2023-01-22 18:09:24.962923: step: 1544/530, loss: 0.012337801046669483 2023-01-22 18:09:26.068992: step: 1548/530, loss: 0.00269088102504611 2023-01-22 18:09:27.163979: step: 1552/530, loss: 0.04785211756825447 2023-01-22 18:09:28.251712: step: 1556/530, loss: 0.005905095022171736 2023-01-22 18:09:29.347070: step: 1560/530, loss: 0.002391225891187787 2023-01-22 18:09:30.451546: step: 1564/530, loss: 0.0015557766892015934 2023-01-22 18:09:31.540308: step: 1568/530, loss: 0.004008970223367214 2023-01-22 18:09:32.637575: step: 1572/530, loss: 0.01488753966987133 2023-01-22 18:09:33.727262: step: 1576/530, loss: 0.005019379314035177 2023-01-22 18:09:34.817653: step: 1580/530, loss: 0.013527367264032364 2023-01-22 18:09:35.906829: step: 1584/530, loss: 0.0021498952992260456 2023-01-22 18:09:37.016396: step: 1588/530, loss: 0.0205497145652771 2023-01-22 18:09:38.100520: step: 1592/530, loss: 0.0015079585136845708 2023-01-22 18:09:39.209680: step: 1596/530, loss: 0.020550483837723732 2023-01-22 18:09:40.298588: step: 1600/530, loss: 0.014292348176240921 2023-01-22 18:09:41.396016: step: 1604/530, loss: 0.000968808657489717 2023-01-22 18:09:42.499075: step: 1608/530, loss: 0.014684724621474743 2023-01-22 18:09:43.596972: step: 1612/530, loss: 0.011075002141296864 2023-01-22 18:09:44.709149: step: 1616/530, loss: 0.06649428606033325 2023-01-22 18:09:45.790481: step: 1620/530, loss: 0.00946545135229826 2023-01-22 18:09:46.880912: step: 1624/530, loss: 0.008289055898785591 2023-01-22 18:09:47.992795: step: 1628/530, loss: 0.0059280553832650185 2023-01-22 18:09:49.107353: step: 1632/530, loss: 0.008240843191742897 2023-01-22 18:09:50.235835: step: 1636/530, loss: 0.033979691565036774 2023-01-22 18:09:51.342487: step: 1640/530, loss: 0.007574205752462149 2023-01-22 18:09:52.421244: step: 1644/530, loss: 0.03126741573214531 2023-01-22 18:09:53.507286: step: 1648/530, loss: 0.028560157865285873 2023-01-22 18:09:54.596955: step: 1652/530, loss: 0.009541143663227558 2023-01-22 18:09:55.682679: step: 1656/530, loss: 0.0100101288408041 2023-01-22 18:09:56.772505: step: 1660/530, loss: 0.0022494872100651264 2023-01-22 18:09:57.853709: step: 1664/530, loss: 0.00710147712379694 2023-01-22 18:09:58.948791: step: 1668/530, loss: 0.03679417818784714 2023-01-22 18:10:00.070722: step: 1672/530, loss: 0.00597589323297143 2023-01-22 18:10:01.210699: step: 1676/530, loss: 0.012171313166618347 2023-01-22 18:10:02.303164: step: 1680/530, loss: 0.008749675005674362 2023-01-22 18:10:03.404064: step: 1684/530, loss: 0.026481980457901955 2023-01-22 18:10:04.507054: step: 1688/530, loss: 0.00019856475410051644 2023-01-22 18:10:05.594364: step: 1692/530, loss: 0.011157437227666378 2023-01-22 18:10:06.687098: step: 1696/530, loss: 0.025775246322155 2023-01-22 18:10:07.781350: step: 1700/530, loss: 0.0011197603307664394 2023-01-22 18:10:08.870891: step: 1704/530, loss: 0.0034876095596700907 2023-01-22 18:10:09.955693: step: 1708/530, loss: 0.04879726469516754 2023-01-22 18:10:11.031496: step: 1712/530, loss: 0.013412362895905972 2023-01-22 18:10:12.123183: step: 1716/530, loss: 0.007574820425361395 2023-01-22 18:10:13.211410: step: 1720/530, loss: 0.0028674439527094364 2023-01-22 18:10:14.329068: step: 1724/530, loss: 0.029380347579717636 2023-01-22 18:10:15.421406: step: 1728/530, loss: 0.005109013058245182 2023-01-22 18:10:16.503559: step: 1732/530, loss: 0.03197004273533821 2023-01-22 18:10:17.587738: step: 1736/530, loss: 0.007782723754644394 2023-01-22 18:10:18.661844: step: 1740/530, loss: 0.003919995855540037 2023-01-22 18:10:19.777977: step: 1744/530, loss: 0.0074639832600951195 2023-01-22 18:10:20.882440: step: 1748/530, loss: 0.008496605791151524 2023-01-22 18:10:21.981869: step: 1752/530, loss: 0.01595201902091503 2023-01-22 18:10:23.095699: step: 1756/530, loss: 0.008883570320904255 2023-01-22 18:10:24.190742: step: 1760/530, loss: 0.005591331049799919 2023-01-22 18:10:25.303514: step: 1764/530, loss: 0.005617531016469002 2023-01-22 18:10:26.394918: step: 1768/530, loss: 0.004801840055733919 2023-01-22 18:10:27.478115: step: 1772/530, loss: 0.0046240827068686485 2023-01-22 18:10:28.557634: step: 1776/530, loss: 0.0027022850699722767 2023-01-22 18:10:29.667430: step: 1780/530, loss: 0.003939067013561726 2023-01-22 18:10:30.761215: step: 1784/530, loss: 0.0007597700459882617 2023-01-22 18:10:31.870012: step: 1788/530, loss: 0.03544655442237854 2023-01-22 18:10:32.957009: step: 1792/530, loss: 0.01583850011229515 2023-01-22 18:10:34.022544: step: 1796/530, loss: 0.023905564099550247 2023-01-22 18:10:35.115911: step: 1800/530, loss: 0.012000749818980694 2023-01-22 18:10:36.222355: step: 1804/530, loss: 0.014172019436955452 2023-01-22 18:10:37.309969: step: 1808/530, loss: 0.009804642759263515 2023-01-22 18:10:38.406221: step: 1812/530, loss: 0.011192088015377522 2023-01-22 18:10:39.479564: step: 1816/530, loss: 0.009174440056085587 2023-01-22 18:10:40.589679: step: 1820/530, loss: 0.0028696416411548853 2023-01-22 18:10:41.690711: step: 1824/530, loss: 0.0006159775657579303 2023-01-22 18:10:42.815527: step: 1828/530, loss: 0.007845573127269745 2023-01-22 18:10:43.889617: step: 1832/530, loss: 0.006900114007294178 2023-01-22 18:10:44.968874: step: 1836/530, loss: 0.000597308506257832 2023-01-22 18:10:46.031167: step: 1840/530, loss: 0.0013562479289248586 2023-01-22 18:10:47.129911: step: 1844/530, loss: 0.018411412835121155 2023-01-22 18:10:48.218134: step: 1848/530, loss: 0.02957063913345337 2023-01-22 18:10:49.309061: step: 1852/530, loss: 0.004262606613337994 2023-01-22 18:10:50.381058: step: 1856/530, loss: 0.0008446556748822331 2023-01-22 18:10:51.461062: step: 1860/530, loss: 0.003785383189097047 2023-01-22 18:10:52.547931: step: 1864/530, loss: 0.017457813024520874 2023-01-22 18:10:53.663424: step: 1868/530, loss: 0.016903871670365334 2023-01-22 18:10:54.767289: step: 1872/530, loss: 0.00910563487559557 2023-01-22 18:10:55.860332: step: 1876/530, loss: 0.0024856175296008587 2023-01-22 18:10:56.972457: step: 1880/530, loss: 0.01771523617208004 2023-01-22 18:10:58.085690: step: 1884/530, loss: 0.0037364992313086987 2023-01-22 18:10:59.170472: step: 1888/530, loss: 0.007870021276175976 2023-01-22 18:11:00.252357: step: 1892/530, loss: 0.006785782054066658 2023-01-22 18:11:01.328128: step: 1896/530, loss: 0.004140164237469435 2023-01-22 18:11:02.436052: step: 1900/530, loss: 0.011881887912750244 2023-01-22 18:11:03.544940: step: 1904/530, loss: 0.01027042604982853 2023-01-22 18:11:04.623035: step: 1908/530, loss: 0.0076409000903368 2023-01-22 18:11:05.707716: step: 1912/530, loss: 0.00034652548492886126 2023-01-22 18:11:06.786999: step: 1916/530, loss: 0.023433564230799675 2023-01-22 18:11:07.867951: step: 1920/530, loss: 0.005476299673318863 2023-01-22 18:11:08.988365: step: 1924/530, loss: 0.0087105268612504 2023-01-22 18:11:10.071961: step: 1928/530, loss: 0.003965376410633326 2023-01-22 18:11:11.179139: step: 1932/530, loss: 0.014118590392172337 2023-01-22 18:11:12.296274: step: 1936/530, loss: 0.007075015921145678 2023-01-22 18:11:13.371333: step: 1940/530, loss: 0.003730004420503974 2023-01-22 18:11:14.449319: step: 1944/530, loss: 0.010544252581894398 2023-01-22 18:11:15.543878: step: 1948/530, loss: 0.003539704019203782 2023-01-22 18:11:16.639625: step: 1952/530, loss: 0.02847655676305294 2023-01-22 18:11:17.751157: step: 1956/530, loss: 0.008167409338057041 2023-01-22 18:11:18.840659: step: 1960/530, loss: 0.00765496538951993 2023-01-22 18:11:19.922477: step: 1964/530, loss: 0.009911566972732544 2023-01-22 18:11:21.028760: step: 1968/530, loss: 0.004691366571933031 2023-01-22 18:11:22.101733: step: 1972/530, loss: 0.004511936567723751 2023-01-22 18:11:23.187808: step: 1976/530, loss: 0.003240075660869479 2023-01-22 18:11:24.284532: step: 1980/530, loss: 0.0009990454418584704 2023-01-22 18:11:25.375214: step: 1984/530, loss: 0.0037197726778686047 2023-01-22 18:11:26.464803: step: 1988/530, loss: 0.010630200617015362 2023-01-22 18:11:27.570062: step: 1992/530, loss: 0.03566709905862808 2023-01-22 18:11:28.639211: step: 1996/530, loss: 0.030046110972762108 2023-01-22 18:11:29.756501: step: 2000/530, loss: 0.043111298233270645 2023-01-22 18:11:30.842647: step: 2004/530, loss: 0.0023429833818227053 2023-01-22 18:11:31.953909: step: 2008/530, loss: 0.004607904702425003 2023-01-22 18:11:33.054508: step: 2012/530, loss: 0.017392003908753395 2023-01-22 18:11:34.148180: step: 2016/530, loss: 0.002853038487955928 2023-01-22 18:11:35.232687: step: 2020/530, loss: 0.020979465916752815 2023-01-22 18:11:36.313365: step: 2024/530, loss: 0.00715996976941824 2023-01-22 18:11:37.389751: step: 2028/530, loss: 0.0042402432300150394 2023-01-22 18:11:38.458845: step: 2032/530, loss: 0.002821543486788869 2023-01-22 18:11:39.553880: step: 2036/530, loss: 0.0031747843604534864 2023-01-22 18:11:40.635770: step: 2040/530, loss: 0.010959334671497345 2023-01-22 18:11:41.716277: step: 2044/530, loss: 0.00917725171893835 2023-01-22 18:11:42.809901: step: 2048/530, loss: 0.039017170667648315 2023-01-22 18:11:43.898523: step: 2052/530, loss: 0.0003101283800788224 2023-01-22 18:11:44.998827: step: 2056/530, loss: 0.002798594068735838 2023-01-22 18:11:46.076359: step: 2060/530, loss: 0.005760581232607365 2023-01-22 18:11:47.150943: step: 2064/530, loss: 0.016744490712881088 2023-01-22 18:11:48.233970: step: 2068/530, loss: 0.010294698178768158 2023-01-22 18:11:49.326244: step: 2072/530, loss: 0.024722643196582794 2023-01-22 18:11:50.410041: step: 2076/530, loss: 0.003681193571537733 2023-01-22 18:11:51.489476: step: 2080/530, loss: 0.0052399770356714725 2023-01-22 18:11:52.566313: step: 2084/530, loss: 0.00033079757122322917 2023-01-22 18:11:53.639895: step: 2088/530, loss: 0.002503804164007306 2023-01-22 18:11:54.729228: step: 2092/530, loss: 0.015386294573545456 2023-01-22 18:11:55.812396: step: 2096/530, loss: 0.006947911344468594 2023-01-22 18:11:56.902375: step: 2100/530, loss: 0.0018436722457408905 2023-01-22 18:11:57.989973: step: 2104/530, loss: 0.038152843713760376 2023-01-22 18:11:59.061325: step: 2108/530, loss: 0.006926866713911295 2023-01-22 18:12:00.152920: step: 2112/530, loss: 0.01697811484336853 2023-01-22 18:12:01.260445: step: 2116/530, loss: 0.01982099376618862 2023-01-22 18:12:02.359517: step: 2120/530, loss: 0.007340516895055771 ================================================== Loss: 0.012 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33898487773487773, 'r': 0.3569954594741122, 'f1': 0.34775712965407973}, 'combined': 0.25624209553458505, 'stategy': 1, 'epoch': 5} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.334818683740225, 'r': 0.2877917271713704, 'f1': 0.30952918741516544}, 'combined': 0.1922339163946817, 'stategy': 1, 'epoch': 5} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34704940385073585, 'r': 0.3417811017049941, 'f1': 0.3443951063069443}, 'combined': 0.2537648151735379, 'stategy': 1, 'epoch': 5} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.31923840478968935, 'r': 0.2873461408097105, 'f1': 0.3024538764795599}, 'combined': 0.1878397759188846, 'stategy': 1, 'epoch': 5} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3471622333667169, 'r': 0.331352188583413, 'f1': 0.3390730162785604}, 'combined': 0.24984327515262345, 'stategy': 1, 'epoch': 5} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.344671684876126, 'r': 0.2936344166318823, 'f1': 0.31711264823890906}, 'combined': 0.19694364469574352, 'stategy': 1, 'epoch': 5} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 5} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.375, 'r': 0.5217391304347826, 'f1': 0.43636363636363634}, 'combined': 0.21818181818181817, 'stategy': 1, 'epoch': 5} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 5} New best russian model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3471622333667169, 'r': 0.331352188583413, 'f1': 0.3390730162785604}, 'combined': 0.24984327515262345, 'stategy': 1, 'epoch': 5} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.344671684876126, 'r': 0.2936344166318823, 'f1': 0.31711264823890906}, 'combined': 0.19694364469574352, 'stategy': 1, 'epoch': 5} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 5} ****************************** Epoch: 6 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 18:14:43.457192: step: 4/530, loss: 0.013390426523983479 2023-01-22 18:14:44.551271: step: 8/530, loss: 0.003913471940904856 2023-01-22 18:14:45.651283: step: 12/530, loss: 0.014675590209662914 2023-01-22 18:14:46.732708: step: 16/530, loss: 0.0025220257230103016 2023-01-22 18:14:47.859174: step: 20/530, loss: 0.0057050203904509544 2023-01-22 18:14:48.930135: step: 24/530, loss: 0.019459763541817665 2023-01-22 18:14:50.023342: step: 28/530, loss: 0.06323400139808655 2023-01-22 18:14:51.139123: step: 32/530, loss: 0.019175894558429718 2023-01-22 18:14:52.229445: step: 36/530, loss: 0.0103736761957407 2023-01-22 18:14:53.316363: step: 40/530, loss: 0.0025775940157473087 2023-01-22 18:14:54.435898: step: 44/530, loss: 0.001016054768115282 2023-01-22 18:14:55.523564: step: 48/530, loss: 0.01773722842335701 2023-01-22 18:14:56.608581: step: 52/530, loss: 0.005342042539268732 2023-01-22 18:14:57.686111: step: 56/530, loss: 0.01565561257302761 2023-01-22 18:14:58.768778: step: 60/530, loss: 0.004726297687739134 2023-01-22 18:14:59.850249: step: 64/530, loss: 0.016036001965403557 2023-01-22 18:15:00.946125: step: 68/530, loss: 0.004280498716980219 2023-01-22 18:15:02.054434: step: 72/530, loss: 0.016028283163905144 2023-01-22 18:15:03.178165: step: 76/530, loss: 0.0032032765448093414 2023-01-22 18:15:04.268449: step: 80/530, loss: 0.0050194598734378815 2023-01-22 18:15:05.346652: step: 84/530, loss: 0.0064005437307059765 2023-01-22 18:15:06.453946: step: 88/530, loss: 0.002755015389993787 2023-01-22 18:15:07.562029: step: 92/530, loss: 0.006801757495850325 2023-01-22 18:15:08.663563: step: 96/530, loss: 0.004431865178048611 2023-01-22 18:15:09.751817: step: 100/530, loss: 0.006601641420274973 2023-01-22 18:15:10.858708: step: 104/530, loss: 0.014659630134701729 2023-01-22 18:15:11.967392: step: 108/530, loss: 0.013820094987750053 2023-01-22 18:15:13.035262: step: 112/530, loss: 0.0010037426836788654 2023-01-22 18:15:14.100229: step: 116/530, loss: 0.008951479569077492 2023-01-22 18:15:15.197257: step: 120/530, loss: 0.007594216149300337 2023-01-22 18:15:16.282451: step: 124/530, loss: 0.004729499574750662 2023-01-22 18:15:17.362557: step: 128/530, loss: 0.022528061643242836 2023-01-22 18:15:18.454735: step: 132/530, loss: 0.005706608761101961 2023-01-22 18:15:19.556953: step: 136/530, loss: 0.01574314758181572 2023-01-22 18:15:20.649511: step: 140/530, loss: 0.002276085317134857 2023-01-22 18:15:21.760019: step: 144/530, loss: 0.018506066873669624 2023-01-22 18:15:22.844600: step: 148/530, loss: 0.01409124955534935 2023-01-22 18:15:23.927128: step: 152/530, loss: 0.009515224024653435 2023-01-22 18:15:24.998645: step: 156/530, loss: 0.014751598238945007 2023-01-22 18:15:26.080995: step: 160/530, loss: 0.004073361866176128 2023-01-22 18:15:27.148527: step: 164/530, loss: 0.001871665590442717 2023-01-22 18:15:28.242492: step: 168/530, loss: 0.005623673088848591 2023-01-22 18:15:29.320457: step: 172/530, loss: 0.006894161459058523 2023-01-22 18:15:30.386818: step: 176/530, loss: 0.0040574087761342525 2023-01-22 18:15:31.481163: step: 180/530, loss: 0.0001293703098781407 2023-01-22 18:15:32.561913: step: 184/530, loss: 0.009348595514893532 2023-01-22 18:15:33.676966: step: 188/530, loss: 0.0010552923195064068 2023-01-22 18:15:34.762101: step: 192/530, loss: 0.00040406209882348776 2023-01-22 18:15:35.847854: step: 196/530, loss: 0.013306169770658016 2023-01-22 18:15:36.938447: step: 200/530, loss: 0.02009774185717106 2023-01-22 18:15:38.028355: step: 204/530, loss: 0.012250389903783798 2023-01-22 18:15:39.137422: step: 208/530, loss: 0.003727343864738941 2023-01-22 18:15:40.245336: step: 212/530, loss: 0.004510779399424791 2023-01-22 18:15:41.351285: step: 216/530, loss: 0.008073188364505768 2023-01-22 18:15:42.424347: step: 220/530, loss: 0.06214343011379242 2023-01-22 18:15:43.501245: step: 224/530, loss: 0.005105390213429928 2023-01-22 18:15:44.588519: step: 228/530, loss: 0.0036071166396141052 2023-01-22 18:15:45.663217: step: 232/530, loss: 0.004965350031852722 2023-01-22 18:15:46.733293: step: 236/530, loss: 0.008593683131039143 2023-01-22 18:15:47.836421: step: 240/530, loss: 0.0011923352722078562 2023-01-22 18:15:48.927906: step: 244/530, loss: 0.009273329749703407 2023-01-22 18:15:50.016317: step: 248/530, loss: 0.015437302179634571 2023-01-22 18:15:51.091648: step: 252/530, loss: 0.0029063429683446884 2023-01-22 18:15:52.201744: step: 256/530, loss: 0.0029965871945023537 2023-01-22 18:15:53.298992: step: 260/530, loss: 0.015377046540379524 2023-01-22 18:15:54.375396: step: 264/530, loss: 0.00244529964402318 2023-01-22 18:15:55.485886: step: 268/530, loss: 0.008787153288722038 2023-01-22 18:15:56.578404: step: 272/530, loss: 0.011790621094405651 2023-01-22 18:15:57.678224: step: 276/530, loss: 0.00617571035400033 2023-01-22 18:15:58.804425: step: 280/530, loss: 0.01603359915316105 2023-01-22 18:15:59.892760: step: 284/530, loss: 0.003708968637511134 2023-01-22 18:16:01.011280: step: 288/530, loss: 0.0037179531063884497 2023-01-22 18:16:02.101076: step: 292/530, loss: 0.0053726742044091225 2023-01-22 18:16:03.190006: step: 296/530, loss: 0.006987280212342739 2023-01-22 18:16:04.299326: step: 300/530, loss: 0.05322657898068428 2023-01-22 18:16:05.381815: step: 304/530, loss: 0.00358753465116024 2023-01-22 18:16:06.459106: step: 308/530, loss: 0.0012447584886103868 2023-01-22 18:16:07.544023: step: 312/530, loss: 0.012272996827960014 2023-01-22 18:16:08.650036: step: 316/530, loss: 0.024080568924546242 2023-01-22 18:16:09.729758: step: 320/530, loss: 0.0021521628368645906 2023-01-22 18:16:10.829101: step: 324/530, loss: 0.0011233440600335598 2023-01-22 18:16:11.943834: step: 328/530, loss: 0.016007384285330772 2023-01-22 18:16:13.050539: step: 332/530, loss: 0.006393632385879755 2023-01-22 18:16:14.162628: step: 336/530, loss: 0.008048313669860363 2023-01-22 18:16:15.265372: step: 340/530, loss: 0.0035647025797516108 2023-01-22 18:16:16.377751: step: 344/530, loss: 0.01215900294482708 2023-01-22 18:16:17.440679: step: 348/530, loss: 0.004934570752084255 2023-01-22 18:16:18.541606: step: 352/530, loss: 0.0035738968290388584 2023-01-22 18:16:19.617288: step: 356/530, loss: 0.005652283318340778 2023-01-22 18:16:20.718126: step: 360/530, loss: 0.02595125138759613 2023-01-22 18:16:21.815401: step: 364/530, loss: 0.009565915912389755 2023-01-22 18:16:22.901049: step: 368/530, loss: 0.0006659716018475592 2023-01-22 18:16:23.972412: step: 372/530, loss: 0.004813600331544876 2023-01-22 18:16:25.094792: step: 376/530, loss: 0.003479395294561982 2023-01-22 18:16:26.190307: step: 380/530, loss: 0.002324026543647051 2023-01-22 18:16:27.301915: step: 384/530, loss: 0.005483194720000029 2023-01-22 18:16:28.401580: step: 388/530, loss: 0.004847073927521706 2023-01-22 18:16:29.494605: step: 392/530, loss: 0.007429624442011118 2023-01-22 18:16:30.596204: step: 396/530, loss: 0.008476309478282928 2023-01-22 18:16:31.687998: step: 400/530, loss: 0.0029982924461364746 2023-01-22 18:16:32.769455: step: 404/530, loss: 0.00288561312481761 2023-01-22 18:16:33.865996: step: 408/530, loss: 0.014835940673947334 2023-01-22 18:16:34.961232: step: 412/530, loss: 0.019096961244940758 2023-01-22 18:16:36.052847: step: 416/530, loss: 0.009492441080510616 2023-01-22 18:16:37.129805: step: 420/530, loss: 0.006955127697438002 2023-01-22 18:16:38.210832: step: 424/530, loss: 0.005792070180177689 2023-01-22 18:16:39.283363: step: 428/530, loss: 0.0008928178576752543 2023-01-22 18:16:40.413060: step: 432/530, loss: 0.01803162321448326 2023-01-22 18:16:41.508188: step: 436/530, loss: 0.0005017681396566331 2023-01-22 18:16:42.628706: step: 440/530, loss: 0.02273922599852085 2023-01-22 18:16:43.715254: step: 444/530, loss: 0.008860909380018711 2023-01-22 18:16:44.794623: step: 448/530, loss: 0.006418897304683924 2023-01-22 18:16:45.907580: step: 452/530, loss: 0.006321071647107601 2023-01-22 18:16:47.001240: step: 456/530, loss: 0.0008852732717059553 2023-01-22 18:16:48.093462: step: 460/530, loss: 0.06455767154693604 2023-01-22 18:16:49.206118: step: 464/530, loss: 0.011337414383888245 2023-01-22 18:16:50.311241: step: 468/530, loss: 0.03129412606358528 2023-01-22 18:16:51.402381: step: 472/530, loss: 0.005267268046736717 2023-01-22 18:16:52.477183: step: 476/530, loss: 0.005748947616666555 2023-01-22 18:16:53.546811: step: 480/530, loss: 0.016402380540966988 2023-01-22 18:16:54.626262: step: 484/530, loss: 0.0032799935434013605 2023-01-22 18:16:55.729952: step: 488/530, loss: 0.012513834051787853 2023-01-22 18:16:56.829660: step: 492/530, loss: 0.0026917611248791218 2023-01-22 18:16:57.925347: step: 496/530, loss: 0.0060631581582129 2023-01-22 18:16:59.014462: step: 500/530, loss: 0.0032556792721152306 2023-01-22 18:17:00.110360: step: 504/530, loss: 0.0029229968786239624 2023-01-22 18:17:01.186352: step: 508/530, loss: 0.00792235229164362 2023-01-22 18:17:02.282163: step: 512/530, loss: 0.014967920258641243 2023-01-22 18:17:03.403272: step: 516/530, loss: 0.006878642365336418 2023-01-22 18:17:04.511673: step: 520/530, loss: 0.004619373008608818 2023-01-22 18:17:05.586998: step: 524/530, loss: 0.002735935617238283 2023-01-22 18:17:06.679490: step: 528/530, loss: 0.007665351964533329 2023-01-22 18:17:07.773791: step: 532/530, loss: 0.013482710346579552 2023-01-22 18:17:08.854928: step: 536/530, loss: 0.024530954658985138 2023-01-22 18:17:09.945808: step: 540/530, loss: 0.0028515001758933067 2023-01-22 18:17:11.044643: step: 544/530, loss: 0.00530988909304142 2023-01-22 18:17:12.135857: step: 548/530, loss: 0.000554635189473629 2023-01-22 18:17:13.230840: step: 552/530, loss: 0.013563115149736404 2023-01-22 18:17:14.308790: step: 556/530, loss: 0.0022188678849488497 2023-01-22 18:17:15.416785: step: 560/530, loss: 0.022701134905219078 2023-01-22 18:17:16.515304: step: 564/530, loss: 0.00687677226960659 2023-01-22 18:17:17.622008: step: 568/530, loss: 0.007060638628900051 2023-01-22 18:17:18.732170: step: 572/530, loss: 0.0007632538327015936 2023-01-22 18:17:19.848751: step: 576/530, loss: 0.0009229238494299352 2023-01-22 18:17:20.942423: step: 580/530, loss: 0.018368715420365334 2023-01-22 18:17:22.075805: step: 584/530, loss: 0.006042899563908577 2023-01-22 18:17:23.185283: step: 588/530, loss: 0.01982397586107254 2023-01-22 18:17:24.272023: step: 592/530, loss: 0.0013868712121620774 2023-01-22 18:17:25.355921: step: 596/530, loss: 0.0015452922089025378 2023-01-22 18:17:26.448127: step: 600/530, loss: 0.0050039151683449745 2023-01-22 18:17:27.536257: step: 604/530, loss: 0.002873511053621769 2023-01-22 18:17:28.653101: step: 608/530, loss: 0.01189162116497755 2023-01-22 18:17:29.736909: step: 612/530, loss: 0.010051965713500977 2023-01-22 18:17:30.828265: step: 616/530, loss: 0.006220933981239796 2023-01-22 18:17:31.929619: step: 620/530, loss: 0.007419348694384098 2023-01-22 18:17:33.010414: step: 624/530, loss: 0.014715871773660183 2023-01-22 18:17:34.095235: step: 628/530, loss: 0.0012297948123887181 2023-01-22 18:17:35.195079: step: 632/530, loss: 0.014310983009636402 2023-01-22 18:17:36.293266: step: 636/530, loss: 0.008859928697347641 2023-01-22 18:17:37.387464: step: 640/530, loss: 0.009216432459652424 2023-01-22 18:17:38.482384: step: 644/530, loss: 0.004318630788475275 2023-01-22 18:17:39.587850: step: 648/530, loss: 0.05318840593099594 2023-01-22 18:17:40.692021: step: 652/530, loss: 0.0028300799895077944 2023-01-22 18:17:41.808474: step: 656/530, loss: 0.0064165182411670685 2023-01-22 18:17:42.934298: step: 660/530, loss: 0.013577465899288654 2023-01-22 18:17:44.015912: step: 664/530, loss: 0.02669849991798401 2023-01-22 18:17:45.085902: step: 668/530, loss: 0.0 2023-01-22 18:17:46.191877: step: 672/530, loss: 0.005146565847098827 2023-01-22 18:17:47.290381: step: 676/530, loss: 0.003153915284201503 2023-01-22 18:17:48.391513: step: 680/530, loss: 0.0021724035032093525 2023-01-22 18:17:49.498955: step: 684/530, loss: 0.008481604047119617 2023-01-22 18:17:50.586484: step: 688/530, loss: 0.014910262078046799 2023-01-22 18:17:51.690158: step: 692/530, loss: 0.0002634353586472571 2023-01-22 18:17:52.767510: step: 696/530, loss: 0.0005372039158828557 2023-01-22 18:17:53.859800: step: 700/530, loss: 0.002919894177466631 2023-01-22 18:17:54.953665: step: 704/530, loss: 0.016136229038238525 2023-01-22 18:17:56.037300: step: 708/530, loss: 0.007952974177896976 2023-01-22 18:17:57.117551: step: 712/530, loss: 0.0016320603899657726 2023-01-22 18:17:58.202952: step: 716/530, loss: 0.0067335935309529305 2023-01-22 18:17:59.282962: step: 720/530, loss: 0.020796235650777817 2023-01-22 18:18:00.395013: step: 724/530, loss: 0.010603051632642746 2023-01-22 18:18:01.525880: step: 728/530, loss: 0.0035867670085281134 2023-01-22 18:18:02.613430: step: 732/530, loss: 0.038410037755966187 2023-01-22 18:18:03.709925: step: 736/530, loss: 0.01595931313931942 2023-01-22 18:18:04.818548: step: 740/530, loss: 0.01142870169132948 2023-01-22 18:18:05.893608: step: 744/530, loss: 0.0003212083538528532 2023-01-22 18:18:07.003855: step: 748/530, loss: 0.006775077432394028 2023-01-22 18:18:08.097088: step: 752/530, loss: 0.004188289400190115 2023-01-22 18:18:09.190572: step: 756/530, loss: 0.009298007003962994 2023-01-22 18:18:10.276293: step: 760/530, loss: 0.01912320964038372 2023-01-22 18:18:11.364346: step: 764/530, loss: 0.012271419167518616 2023-01-22 18:18:12.476501: step: 768/530, loss: 0.00332202878780663 2023-01-22 18:18:13.544646: step: 772/530, loss: 0.0029262148309499025 2023-01-22 18:18:14.653924: step: 776/530, loss: 0.0008892411715351045 2023-01-22 18:18:15.735053: step: 780/530, loss: 0.011919665150344372 2023-01-22 18:18:16.824786: step: 784/530, loss: 0.01851597987115383 2023-01-22 18:18:17.890713: step: 788/530, loss: 0.0030852241907268763 2023-01-22 18:18:18.972042: step: 792/530, loss: 0.0036761611700057983 2023-01-22 18:18:20.061760: step: 796/530, loss: 0.003399947192519903 2023-01-22 18:18:21.159587: step: 800/530, loss: 0.006142581347376108 2023-01-22 18:18:22.246208: step: 804/530, loss: 0.023061295971274376 2023-01-22 18:18:23.363846: step: 808/530, loss: 0.008395311422646046 2023-01-22 18:18:24.464611: step: 812/530, loss: 0.026986798271536827 2023-01-22 18:18:25.573291: step: 816/530, loss: 0.01530088298022747 2023-01-22 18:18:26.680928: step: 820/530, loss: 0.07895203679800034 2023-01-22 18:18:27.759966: step: 824/530, loss: 0.007875069975852966 2023-01-22 18:18:28.858177: step: 828/530, loss: 0.022428033873438835 2023-01-22 18:18:29.952588: step: 832/530, loss: 0.00685987900942564 2023-01-22 18:18:31.052639: step: 836/530, loss: 0.005061048083007336 2023-01-22 18:18:32.143618: step: 840/530, loss: 0.005881423130631447 2023-01-22 18:18:33.227853: step: 844/530, loss: 0.0023010517470538616 2023-01-22 18:18:34.311190: step: 848/530, loss: 0.009259999729692936 2023-01-22 18:18:35.393572: step: 852/530, loss: 0.023595279082655907 2023-01-22 18:18:36.487414: step: 856/530, loss: 0.007073951885104179 2023-01-22 18:18:37.590737: step: 860/530, loss: 0.012977248057723045 2023-01-22 18:18:38.672701: step: 864/530, loss: 0.002038983628153801 2023-01-22 18:18:39.747933: step: 868/530, loss: 0.021646853536367416 2023-01-22 18:18:40.838316: step: 872/530, loss: 0.0034775726962834597 2023-01-22 18:18:41.930674: step: 876/530, loss: 0.002575481543317437 2023-01-22 18:18:43.028896: step: 880/530, loss: 0.016511347144842148 2023-01-22 18:18:44.110991: step: 884/530, loss: 0.007966233417391777 2023-01-22 18:18:45.227982: step: 888/530, loss: 0.0036477355752140284 2023-01-22 18:18:46.345099: step: 892/530, loss: 0.023912986740469933 2023-01-22 18:18:47.462032: step: 896/530, loss: 0.005340574309229851 2023-01-22 18:18:48.573410: step: 900/530, loss: 0.012384876608848572 2023-01-22 18:18:49.659540: step: 904/530, loss: 0.0006822962313890457 2023-01-22 18:18:50.721642: step: 908/530, loss: 0.02468578703701496 2023-01-22 18:18:51.805047: step: 912/530, loss: 0.01933750882744789 2023-01-22 18:18:52.881792: step: 916/530, loss: 0.008372031152248383 2023-01-22 18:18:53.982725: step: 920/530, loss: 0.015360166318714619 2023-01-22 18:18:55.104809: step: 924/530, loss: 0.014099378138780594 2023-01-22 18:18:56.181752: step: 928/530, loss: 0.004104915075004101 2023-01-22 18:18:57.275974: step: 932/530, loss: 0.004274293314665556 2023-01-22 18:18:58.357346: step: 936/530, loss: 0.013796493411064148 2023-01-22 18:18:59.459805: step: 940/530, loss: 0.004015969578176737 2023-01-22 18:19:00.549203: step: 944/530, loss: 0.029437707737088203 2023-01-22 18:19:01.640750: step: 948/530, loss: 0.06338165700435638 2023-01-22 18:19:02.744513: step: 952/530, loss: 0.006039412692189217 2023-01-22 18:19:03.828600: step: 956/530, loss: 0.004642699845135212 2023-01-22 18:19:04.916551: step: 960/530, loss: 0.001632447587326169 2023-01-22 18:19:06.022856: step: 964/530, loss: 0.0092964768409729 2023-01-22 18:19:07.112974: step: 968/530, loss: 0.003565976396203041 2023-01-22 18:19:08.204557: step: 972/530, loss: 0.0037259955424815416 2023-01-22 18:19:09.296195: step: 976/530, loss: 0.007760280277580023 2023-01-22 18:19:10.374106: step: 980/530, loss: 0.00566880265250802 2023-01-22 18:19:11.469956: step: 984/530, loss: 0.0024378288071602583 2023-01-22 18:19:12.592831: step: 988/530, loss: 0.006020046770572662 2023-01-22 18:19:13.718832: step: 992/530, loss: 0.02705455757677555 2023-01-22 18:19:14.812593: step: 996/530, loss: 0.0018895254470407963 2023-01-22 18:19:15.908165: step: 1000/530, loss: 0.0025461469776928425 2023-01-22 18:19:17.018854: step: 1004/530, loss: 0.0010933129815384746 2023-01-22 18:19:18.114663: step: 1008/530, loss: 0.010913295671343803 2023-01-22 18:19:19.224734: step: 1012/530, loss: 0.009694751352071762 2023-01-22 18:19:20.334239: step: 1016/530, loss: 0.027088673785328865 2023-01-22 18:19:21.417690: step: 1020/530, loss: 0.007128599099814892 2023-01-22 18:19:22.509751: step: 1024/530, loss: 0.043904609978199005 2023-01-22 18:19:23.616643: step: 1028/530, loss: 0.005110875703394413 2023-01-22 18:19:24.697651: step: 1032/530, loss: 0.005126473028212786 2023-01-22 18:19:25.788321: step: 1036/530, loss: 0.0054137264378368855 2023-01-22 18:19:26.866427: step: 1040/530, loss: 0.01349830161780119 2023-01-22 18:19:27.991264: step: 1044/530, loss: 0.005182754714041948 2023-01-22 18:19:29.082810: step: 1048/530, loss: 0.0028157818596810102 2023-01-22 18:19:30.182510: step: 1052/530, loss: 0.000210175960091874 2023-01-22 18:19:31.287711: step: 1056/530, loss: 0.01893300563097 2023-01-22 18:19:32.377753: step: 1060/530, loss: 0.013074495829641819 2023-01-22 18:19:33.476429: step: 1064/530, loss: 0.026199353858828545 2023-01-22 18:19:34.551369: step: 1068/530, loss: 0.0012763570994138718 2023-01-22 18:19:35.632535: step: 1072/530, loss: 0.000747830024920404 2023-01-22 18:19:36.717491: step: 1076/530, loss: 0.004875941667705774 2023-01-22 18:19:37.792641: step: 1080/530, loss: 0.02152143232524395 2023-01-22 18:19:38.888067: step: 1084/530, loss: 0.003370596095919609 2023-01-22 18:19:39.967283: step: 1088/530, loss: 0.0016149122966453433 2023-01-22 18:19:41.060577: step: 1092/530, loss: 0.02816551923751831 2023-01-22 18:19:42.155419: step: 1096/530, loss: 0.0006070274976082146 2023-01-22 18:19:43.225030: step: 1100/530, loss: 0.00011186282790731639 2023-01-22 18:19:44.356161: step: 1104/530, loss: 0.008155712857842445 2023-01-22 18:19:45.429934: step: 1108/530, loss: 0.0005338452174328268 2023-01-22 18:19:46.510563: step: 1112/530, loss: 0.006027278024703264 2023-01-22 18:19:47.625562: step: 1116/530, loss: 0.03878793120384216 2023-01-22 18:19:48.719549: step: 1120/530, loss: 0.00042224457138217986 2023-01-22 18:19:49.809053: step: 1124/530, loss: 0.0031638885848224163 2023-01-22 18:19:50.901129: step: 1128/530, loss: 0.007403148803859949 2023-01-22 18:19:51.976755: step: 1132/530, loss: 0.00174345588311553 2023-01-22 18:19:53.084549: step: 1136/530, loss: 0.014343636110424995 2023-01-22 18:19:54.170955: step: 1140/530, loss: 0.0018404264701530337 2023-01-22 18:19:55.248724: step: 1144/530, loss: 0.020351599901914597 2023-01-22 18:19:56.339444: step: 1148/530, loss: 0.008296698331832886 2023-01-22 18:19:57.451945: step: 1152/530, loss: 0.06742016226053238 2023-01-22 18:19:58.548775: step: 1156/530, loss: 0.0034034899435937405 2023-01-22 18:19:59.638095: step: 1160/530, loss: 0.010913080535829067 2023-01-22 18:20:00.737038: step: 1164/530, loss: 0.004154646303504705 2023-01-22 18:20:01.807071: step: 1168/530, loss: 0.01610121876001358 2023-01-22 18:20:02.911208: step: 1172/530, loss: 0.0050384271889925 2023-01-22 18:20:04.004676: step: 1176/530, loss: 0.004915058612823486 2023-01-22 18:20:05.121215: step: 1180/530, loss: 0.015269331634044647 2023-01-22 18:20:06.218203: step: 1184/530, loss: 0.029997672885656357 2023-01-22 18:20:07.311217: step: 1188/530, loss: 0.009049919433891773 2023-01-22 18:20:08.410749: step: 1192/530, loss: 0.018555831164121628 2023-01-22 18:20:09.489877: step: 1196/530, loss: 0.005224880296736956 2023-01-22 18:20:10.621418: step: 1200/530, loss: 0.0039734807796776295 2023-01-22 18:20:11.703037: step: 1204/530, loss: 0.006240292452275753 2023-01-22 18:20:12.818254: step: 1208/530, loss: 0.00665348069742322 2023-01-22 18:20:13.961959: step: 1212/530, loss: 0.03361654281616211 2023-01-22 18:20:15.036692: step: 1216/530, loss: 0.008245476521551609 2023-01-22 18:20:16.153379: step: 1220/530, loss: 0.022018421441316605 2023-01-22 18:20:17.282800: step: 1224/530, loss: 0.004142383113503456 2023-01-22 18:20:18.383750: step: 1228/530, loss: 0.007273348048329353 2023-01-22 18:20:19.474528: step: 1232/530, loss: 0.008193165995180607 2023-01-22 18:20:20.575730: step: 1236/530, loss: 0.005689043086022139 2023-01-22 18:20:21.673691: step: 1240/530, loss: 0.0005889005260542035 2023-01-22 18:20:22.770805: step: 1244/530, loss: 0.0018694591708481312 2023-01-22 18:20:23.850887: step: 1248/530, loss: 0.008512190543115139 2023-01-22 18:20:24.934234: step: 1252/530, loss: 0.00022736986284144223 2023-01-22 18:20:26.038842: step: 1256/530, loss: 0.007735078223049641 2023-01-22 18:20:27.136327: step: 1260/530, loss: 0.010479175485670567 2023-01-22 18:20:28.228376: step: 1264/530, loss: 0.004068239126354456 2023-01-22 18:20:29.311976: step: 1268/530, loss: 0.002515255706384778 2023-01-22 18:20:30.429932: step: 1272/530, loss: 0.0074677979573607445 2023-01-22 18:20:31.535551: step: 1276/530, loss: 0.00739635806530714 2023-01-22 18:20:32.602238: step: 1280/530, loss: 0.019201155751943588 2023-01-22 18:20:33.686238: step: 1284/530, loss: 0.0022439199965447187 2023-01-22 18:20:34.784958: step: 1288/530, loss: 0.003761469852179289 2023-01-22 18:20:35.867521: step: 1292/530, loss: 0.006268573924899101 2023-01-22 18:20:36.950900: step: 1296/530, loss: 0.0005840518279001117 2023-01-22 18:20:38.042596: step: 1300/530, loss: 0.06176234036684036 2023-01-22 18:20:39.147699: step: 1304/530, loss: 0.010002519004046917 2023-01-22 18:20:40.224536: step: 1308/530, loss: 0.0046221488155424595 2023-01-22 18:20:41.323333: step: 1312/530, loss: 0.006704976782202721 2023-01-22 18:20:42.426337: step: 1316/530, loss: 0.0013584103435277939 2023-01-22 18:20:43.518041: step: 1320/530, loss: 0.006341882050037384 2023-01-22 18:20:44.611215: step: 1324/530, loss: 0.017576860263943672 2023-01-22 18:20:45.731126: step: 1328/530, loss: 0.0009096225840039551 2023-01-22 18:20:46.827269: step: 1332/530, loss: 0.013372194953262806 2023-01-22 18:20:47.904719: step: 1336/530, loss: 0.006615982856601477 2023-01-22 18:20:48.998724: step: 1340/530, loss: 0.00839964859187603 2023-01-22 18:20:50.072442: step: 1344/530, loss: 0.019094789400696754 2023-01-22 18:20:51.163422: step: 1348/530, loss: 4.0409677239949815e-06 2023-01-22 18:20:52.258053: step: 1352/530, loss: 0.0063874367624521255 2023-01-22 18:20:53.350687: step: 1356/530, loss: 0.033885207027196884 2023-01-22 18:20:54.434685: step: 1360/530, loss: 0.004803528543561697 2023-01-22 18:20:55.505345: step: 1364/530, loss: 0.001461849664337933 2023-01-22 18:20:56.583267: step: 1368/530, loss: 0.004812730010598898 2023-01-22 18:20:57.646656: step: 1372/530, loss: 0.005526599008589983 2023-01-22 18:20:58.704159: step: 1376/530, loss: 6.95694106980227e-05 2023-01-22 18:20:59.795934: step: 1380/530, loss: 0.00903487578034401 2023-01-22 18:21:00.897055: step: 1384/530, loss: 0.006801504176110029 2023-01-22 18:21:01.964070: step: 1388/530, loss: 0.00288062053732574 2023-01-22 18:21:03.064645: step: 1392/530, loss: 0.03670917823910713 2023-01-22 18:21:04.151464: step: 1396/530, loss: 0.015249194577336311 2023-01-22 18:21:05.214392: step: 1400/530, loss: 0.0034498574677854776 2023-01-22 18:21:06.313991: step: 1404/530, loss: 0.009832950308918953 2023-01-22 18:21:07.424273: step: 1408/530, loss: 0.004163734614849091 2023-01-22 18:21:08.502161: step: 1412/530, loss: 0.008080611005425453 2023-01-22 18:21:09.585702: step: 1416/530, loss: 0.025228403508663177 2023-01-22 18:21:10.665328: step: 1420/530, loss: 0.007757321931421757 2023-01-22 18:21:11.805834: step: 1424/530, loss: 0.007283371407538652 2023-01-22 18:21:12.875513: step: 1428/530, loss: 0.0010529693681746721 2023-01-22 18:21:13.978399: step: 1432/530, loss: 0.010803609155118465 2023-01-22 18:21:15.073044: step: 1436/530, loss: 0.013553500175476074 2023-01-22 18:21:16.165115: step: 1440/530, loss: 0.006621817592531443 2023-01-22 18:21:17.257556: step: 1444/530, loss: 0.00014562037540599704 2023-01-22 18:21:18.359467: step: 1448/530, loss: 0.005476659629493952 2023-01-22 18:21:19.461930: step: 1452/530, loss: 0.018918126821517944 2023-01-22 18:21:20.537554: step: 1456/530, loss: 0.002413890790194273 2023-01-22 18:21:21.615680: step: 1460/530, loss: 0.008535767905414104 2023-01-22 18:21:22.689150: step: 1464/530, loss: 0.007015233859419823 2023-01-22 18:21:23.797589: step: 1468/530, loss: 0.018064122647047043 2023-01-22 18:21:24.917933: step: 1472/530, loss: 0.0024961926974356174 2023-01-22 18:21:25.995873: step: 1476/530, loss: 0.0014636997366324067 2023-01-22 18:21:27.086136: step: 1480/530, loss: 0.008846471086144447 2023-01-22 18:21:28.197055: step: 1484/530, loss: 0.0021048174239695072 2023-01-22 18:21:29.294144: step: 1488/530, loss: 0.0012592453276738524 2023-01-22 18:21:30.412127: step: 1492/530, loss: 0.002622247440740466 2023-01-22 18:21:31.522261: step: 1496/530, loss: 0.019220324233174324 2023-01-22 18:21:32.612169: step: 1500/530, loss: 0.018160155043005943 2023-01-22 18:21:33.717694: step: 1504/530, loss: 0.02214130386710167 2023-01-22 18:21:34.810451: step: 1508/530, loss: 0.004736586473882198 2023-01-22 18:21:35.918372: step: 1512/530, loss: 0.009976362809538841 2023-01-22 18:21:37.004651: step: 1516/530, loss: 0.04310748353600502 2023-01-22 18:21:38.099669: step: 1520/530, loss: 0.007466264069080353 2023-01-22 18:21:39.196704: step: 1524/530, loss: 0.002315219957381487 2023-01-22 18:21:40.281011: step: 1528/530, loss: 0.008697858080267906 2023-01-22 18:21:41.371004: step: 1532/530, loss: 0.0 2023-01-22 18:21:42.451815: step: 1536/530, loss: 0.00947598461061716 2023-01-22 18:21:43.523753: step: 1540/530, loss: 0.0004582456895150244 2023-01-22 18:21:44.613865: step: 1544/530, loss: 0.006739595904946327 2023-01-22 18:21:45.744618: step: 1548/530, loss: 0.012601654976606369 2023-01-22 18:21:46.819770: step: 1552/530, loss: 3.860785000142641e-06 2023-01-22 18:21:47.906204: step: 1556/530, loss: 0.05636851117014885 2023-01-22 18:21:48.989145: step: 1560/530, loss: 2.1893432858632877e-05 2023-01-22 18:21:50.089622: step: 1564/530, loss: 0.0017861186061054468 2023-01-22 18:21:51.170397: step: 1568/530, loss: 0.006397359538823366 2023-01-22 18:21:52.240902: step: 1572/530, loss: 0.003253550035879016 2023-01-22 18:21:53.334354: step: 1576/530, loss: 0.00168312294408679 2023-01-22 18:21:54.429934: step: 1580/530, loss: 0.004595127422362566 2023-01-22 18:21:55.523618: step: 1584/530, loss: 0.012165140360593796 2023-01-22 18:21:56.608472: step: 1588/530, loss: 0.006841971538960934 2023-01-22 18:21:57.686127: step: 1592/530, loss: 0.01632261648774147 2023-01-22 18:21:58.768673: step: 1596/530, loss: 7.958279456943274e-05 2023-01-22 18:21:59.856234: step: 1600/530, loss: 0.0028296750970184803 2023-01-22 18:22:00.971462: step: 1604/530, loss: 0.04016222804784775 2023-01-22 18:22:02.071929: step: 1608/530, loss: 0.004369673784822226 2023-01-22 18:22:03.174546: step: 1612/530, loss: 0.0026291189715266228 2023-01-22 18:22:04.266698: step: 1616/530, loss: 0.03938344120979309 2023-01-22 18:22:05.346075: step: 1620/530, loss: 0.0002474721986800432 2023-01-22 18:22:06.443314: step: 1624/530, loss: 0.015566072426736355 2023-01-22 18:22:07.539443: step: 1628/530, loss: 0.005241157487034798 2023-01-22 18:22:08.620149: step: 1632/530, loss: 0.012914786115288734 2023-01-22 18:22:09.710992: step: 1636/530, loss: 0.008136267773807049 2023-01-22 18:22:10.802030: step: 1640/530, loss: 0.007448459975421429 2023-01-22 18:22:11.906540: step: 1644/530, loss: 0.002437054179608822 2023-01-22 18:22:13.004523: step: 1648/530, loss: 0.0241682268679142 2023-01-22 18:22:14.082244: step: 1652/530, loss: 0.000406511127948761 2023-01-22 18:22:15.182784: step: 1656/530, loss: 0.0033410938922315836 2023-01-22 18:22:16.276031: step: 1660/530, loss: 0.0011541829444468021 2023-01-22 18:22:17.362517: step: 1664/530, loss: 0.0020975994411855936 2023-01-22 18:22:18.443632: step: 1668/530, loss: 0.013906214386224747 2023-01-22 18:22:19.520285: step: 1672/530, loss: 0.0036015575751662254 2023-01-22 18:22:20.646828: step: 1676/530, loss: 0.0009082278702408075 2023-01-22 18:22:21.755185: step: 1680/530, loss: 0.019838446751236916 2023-01-22 18:22:22.842861: step: 1684/530, loss: 0.0005814454052597284 2023-01-22 18:22:23.943899: step: 1688/530, loss: 0.004982032813131809 2023-01-22 18:22:25.007836: step: 1692/530, loss: 0.007635097019374371 2023-01-22 18:22:26.094596: step: 1696/530, loss: 0.004282320383936167 2023-01-22 18:22:27.170491: step: 1700/530, loss: 0.0013093005400151014 2023-01-22 18:22:28.258070: step: 1704/530, loss: 6.666172703262419e-05 2023-01-22 18:22:29.369862: step: 1708/530, loss: 0.0033410987816751003 2023-01-22 18:22:30.472486: step: 1712/530, loss: 0.014055160805583 2023-01-22 18:22:31.561588: step: 1716/530, loss: 0.0067917462438344955 2023-01-22 18:22:32.662808: step: 1720/530, loss: 0.006169333588331938 2023-01-22 18:22:33.756048: step: 1724/530, loss: 0.01123003475368023 2023-01-22 18:22:34.843529: step: 1728/530, loss: 0.00014782797370571643 2023-01-22 18:22:35.957554: step: 1732/530, loss: 0.005444451235234737 2023-01-22 18:22:37.058373: step: 1736/530, loss: 0.006503126583993435 2023-01-22 18:22:38.172930: step: 1740/530, loss: 0.01831994205713272 2023-01-22 18:22:39.264075: step: 1744/530, loss: 0.0007748312200419605 2023-01-22 18:22:40.359254: step: 1748/530, loss: 0.034647706896066666 2023-01-22 18:22:41.422772: step: 1752/530, loss: 0.0018340562237426639 2023-01-22 18:22:42.538837: step: 1756/530, loss: 0.0011087298626080155 2023-01-22 18:22:43.641948: step: 1760/530, loss: 0.0002733748988248408 2023-01-22 18:22:44.734172: step: 1764/530, loss: 0.0025841135066002607 2023-01-22 18:22:45.836909: step: 1768/530, loss: 0.0015732855536043644 2023-01-22 18:22:46.945926: step: 1772/530, loss: 0.0037623767275363207 2023-01-22 18:22:48.041701: step: 1776/530, loss: 0.0034943281207233667 2023-01-22 18:22:49.137062: step: 1780/530, loss: 0.024733854457736015 2023-01-22 18:22:50.234238: step: 1784/530, loss: 0.0025741488207131624 2023-01-22 18:22:51.337898: step: 1788/530, loss: 0.020954806357622147 2023-01-22 18:22:52.442137: step: 1792/530, loss: 0.012817895971238613 2023-01-22 18:22:53.527643: step: 1796/530, loss: 0.012562660500407219 2023-01-22 18:22:54.609173: step: 1800/530, loss: 0.00377222360111773 2023-01-22 18:22:55.723790: step: 1804/530, loss: 0.0007697981200180948 2023-01-22 18:22:56.822552: step: 1808/530, loss: 0.02762249857187271 2023-01-22 18:22:57.916121: step: 1812/530, loss: 0.03712872788310051 2023-01-22 18:22:58.998730: step: 1816/530, loss: 0.0036480992566794157 2023-01-22 18:23:00.088130: step: 1820/530, loss: 0.004068395588546991 2023-01-22 18:23:01.165641: step: 1824/530, loss: 0.005120148882269859 2023-01-22 18:23:02.259535: step: 1828/530, loss: 0.004024632275104523 2023-01-22 18:23:03.349509: step: 1832/530, loss: 0.029572544619441032 2023-01-22 18:23:04.447429: step: 1836/530, loss: 0.06368596106767654 2023-01-22 18:23:05.538772: step: 1840/530, loss: 0.020419303327798843 2023-01-22 18:23:06.618603: step: 1844/530, loss: 0.006639654282480478 2023-01-22 18:23:07.712060: step: 1848/530, loss: 0.010417046956717968 2023-01-22 18:23:08.803088: step: 1852/530, loss: 0.011444559320807457 2023-01-22 18:23:09.890999: step: 1856/530, loss: 0.0020195627585053444 2023-01-22 18:23:11.001884: step: 1860/530, loss: 0.005016625858843327 2023-01-22 18:23:12.127459: step: 1864/530, loss: 0.008337307721376419 2023-01-22 18:23:13.230728: step: 1868/530, loss: 0.003666571108624339 2023-01-22 18:23:14.310131: step: 1872/530, loss: 0.0020980502013117075 2023-01-22 18:23:15.406960: step: 1876/530, loss: 0.0034470376558601856 2023-01-22 18:23:16.506416: step: 1880/530, loss: 0.005727291107177734 2023-01-22 18:23:17.595289: step: 1884/530, loss: 0.0020817650947719812 2023-01-22 18:23:18.683157: step: 1888/530, loss: 0.004460801370441914 2023-01-22 18:23:19.782390: step: 1892/530, loss: 0.0016281689750030637 2023-01-22 18:23:20.870967: step: 1896/530, loss: 0.006343192420899868 2023-01-22 18:23:21.980872: step: 1900/530, loss: 0.009423536248505116 2023-01-22 18:23:23.071151: step: 1904/530, loss: 0.008155460469424725 2023-01-22 18:23:24.162940: step: 1908/530, loss: 0.003949078265577555 2023-01-22 18:23:25.272081: step: 1912/530, loss: 0.0037763582076877356 2023-01-22 18:23:26.397481: step: 1916/530, loss: 0.0035387608222663403 2023-01-22 18:23:27.526913: step: 1920/530, loss: 0.013976875692605972 2023-01-22 18:23:28.607615: step: 1924/530, loss: 0.0010418662568554282 2023-01-22 18:23:29.694016: step: 1928/530, loss: 0.002441958524286747 2023-01-22 18:23:30.789842: step: 1932/530, loss: 0.013802547939121723 2023-01-22 18:23:31.867825: step: 1936/530, loss: 0.00454210489988327 2023-01-22 18:23:32.942809: step: 1940/530, loss: 0.00550570385530591 2023-01-22 18:23:34.046086: step: 1944/530, loss: 0.002162436256185174 2023-01-22 18:23:35.156172: step: 1948/530, loss: 0.0331319198012352 2023-01-22 18:23:36.267064: step: 1952/530, loss: 0.004887016490101814 2023-01-22 18:23:37.352494: step: 1956/530, loss: 0.0003119751636404544 2023-01-22 18:23:38.465655: step: 1960/530, loss: 0.0023202712181955576 2023-01-22 18:23:39.540430: step: 1964/530, loss: 0.007336675655096769 2023-01-22 18:23:40.649255: step: 1968/530, loss: 0.0025362251326441765 2023-01-22 18:23:41.735200: step: 1972/530, loss: 0.0023483028635382652 2023-01-22 18:23:42.828318: step: 1976/530, loss: 0.007916290313005447 2023-01-22 18:23:43.918280: step: 1980/530, loss: 0.010539408773183823 2023-01-22 18:23:45.006255: step: 1984/530, loss: 0.005473783705383539 2023-01-22 18:23:46.109476: step: 1988/530, loss: 0.010434496216475964 2023-01-22 18:23:47.204523: step: 1992/530, loss: 0.010954899713397026 2023-01-22 18:23:48.289862: step: 1996/530, loss: 0.00786043331027031 2023-01-22 18:23:49.388579: step: 2000/530, loss: 0.004296116065233946 2023-01-22 18:23:50.479131: step: 2004/530, loss: 0.01646469719707966 2023-01-22 18:23:51.580475: step: 2008/530, loss: 0.0014695404097437859 2023-01-22 18:23:52.671480: step: 2012/530, loss: 0.0015034498646855354 2023-01-22 18:23:53.758961: step: 2016/530, loss: 0.01275192853063345 2023-01-22 18:23:54.837307: step: 2020/530, loss: 0.007414584513753653 2023-01-22 18:23:55.933526: step: 2024/530, loss: 0.007664314471185207 2023-01-22 18:23:57.026484: step: 2028/530, loss: 0.007140903268009424 2023-01-22 18:23:58.094608: step: 2032/530, loss: 0.0014236748684197664 2023-01-22 18:23:59.194705: step: 2036/530, loss: 0.0063665746711194515 2023-01-22 18:24:00.309767: step: 2040/530, loss: 0.0027392064221203327 2023-01-22 18:24:01.440358: step: 2044/530, loss: 0.005666750017553568 2023-01-22 18:24:02.529434: step: 2048/530, loss: 0.004224306438118219 2023-01-22 18:24:03.628941: step: 2052/530, loss: 0.0022075639571994543 2023-01-22 18:24:04.710554: step: 2056/530, loss: 0.006415753159672022 2023-01-22 18:24:05.801011: step: 2060/530, loss: 0.0028477220330387354 2023-01-22 18:24:06.900807: step: 2064/530, loss: 0.0012268719729036093 2023-01-22 18:24:07.988419: step: 2068/530, loss: 0.004640631843358278 2023-01-22 18:24:09.088471: step: 2072/530, loss: 0.007370230741798878 2023-01-22 18:24:10.200333: step: 2076/530, loss: 0.003632717300206423 2023-01-22 18:24:11.300833: step: 2080/530, loss: 0.0007659295806661248 2023-01-22 18:24:12.394790: step: 2084/530, loss: 0.0017630505608394742 2023-01-22 18:24:13.484607: step: 2088/530, loss: 0.011211691424250603 2023-01-22 18:24:14.580006: step: 2092/530, loss: 0.006302114110440016 2023-01-22 18:24:15.650010: step: 2096/530, loss: 0.0025455388240516186 2023-01-22 18:24:16.740181: step: 2100/530, loss: 0.008401133120059967 2023-01-22 18:24:17.802659: step: 2104/530, loss: 0.007786688860505819 2023-01-22 18:24:18.901168: step: 2108/530, loss: 0.002886673668399453 2023-01-22 18:24:19.990483: step: 2112/530, loss: 0.0017836429178714752 2023-01-22 18:24:21.074765: step: 2116/530, loss: 0.0034210775047540665 2023-01-22 18:24:22.144219: step: 2120/530, loss: 0.008159960620105267 ================================================== Loss: 0.010 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34010072445348244, 'r': 0.3626880590946056, 'f1': 0.3510314180768726}, 'combined': 0.25865472910927456, 'stategy': 1, 'epoch': 6} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3365448057195115, 'r': 0.28927540669659296, 'f1': 0.31112493209601644}, 'combined': 0.19322495782805232, 'stategy': 1, 'epoch': 6} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3501312439742484, 'r': 0.3474737013254875, 'f1': 0.34879741066387027}, 'combined': 0.2570086183839044, 'stategy': 1, 'epoch': 6} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.32076756427160497, 'r': 0.28808798057232177, 'f1': 0.30355075389121133}, 'combined': 0.1885209945219102, 'stategy': 1, 'epoch': 6} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 6} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3870967741935484, 'r': 0.5217391304347826, 'f1': 0.4444444444444444}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 6} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} New best russian model... ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 7 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 18:27:04.034201: step: 4/530, loss: 0.00463224807754159 2023-01-22 18:27:05.116662: step: 8/530, loss: 0.001683820621110499 2023-01-22 18:27:06.203116: step: 12/530, loss: 0.003381364746019244 2023-01-22 18:27:07.287305: step: 16/530, loss: 0.0009808320319280028 2023-01-22 18:27:08.367480: step: 20/530, loss: 0.0026922153774648905 2023-01-22 18:27:09.465021: step: 24/530, loss: 0.036002252250909805 2023-01-22 18:27:10.545747: step: 28/530, loss: 0.006942289415746927 2023-01-22 18:27:11.629474: step: 32/530, loss: 0.004761753138154745 2023-01-22 18:27:12.719865: step: 36/530, loss: 0.002646166365593672 2023-01-22 18:27:13.817815: step: 40/530, loss: 0.0012257886119186878 2023-01-22 18:27:14.903880: step: 44/530, loss: 0.005338764283806086 2023-01-22 18:27:15.977476: step: 48/530, loss: 0.0012871178332716227 2023-01-22 18:27:17.085189: step: 52/530, loss: 0.02203054539859295 2023-01-22 18:27:18.203142: step: 56/530, loss: 0.03155577927827835 2023-01-22 18:27:19.311068: step: 60/530, loss: 0.010559890419244766 2023-01-22 18:27:20.402513: step: 64/530, loss: 0.01051109004765749 2023-01-22 18:27:21.506721: step: 68/530, loss: 0.006899889092892408 2023-01-22 18:27:22.612549: step: 72/530, loss: 0.01590123400092125 2023-01-22 18:27:23.729659: step: 76/530, loss: 0.006657039280980825 2023-01-22 18:27:24.847669: step: 80/530, loss: 0.006138589233160019 2023-01-22 18:27:25.938205: step: 84/530, loss: 0.03596678748726845 2023-01-22 18:27:27.026780: step: 88/530, loss: 0.006385402288287878 2023-01-22 18:27:28.099528: step: 92/530, loss: 0.006057546474039555 2023-01-22 18:27:29.197690: step: 96/530, loss: 0.0010628706077113748 2023-01-22 18:27:30.277339: step: 100/530, loss: 0.0029035129118710756 2023-01-22 18:27:31.365240: step: 104/530, loss: 0.0005100720445625484 2023-01-22 18:27:32.486717: step: 108/530, loss: 0.0023102881386876106 2023-01-22 18:27:33.588935: step: 112/530, loss: 0.0041152178309857845 2023-01-22 18:27:34.681169: step: 116/530, loss: 0.007752481382340193 2023-01-22 18:27:35.779742: step: 120/530, loss: 0.0008607989875599742 2023-01-22 18:27:36.860058: step: 124/530, loss: 0.014354175888001919 2023-01-22 18:27:37.965665: step: 128/530, loss: 0.026126377284526825 2023-01-22 18:27:39.039176: step: 132/530, loss: 0.07373518496751785 2023-01-22 18:27:40.130958: step: 136/530, loss: 0.0076378206722438335 2023-01-22 18:27:41.227944: step: 140/530, loss: 0.005049635656177998 2023-01-22 18:27:42.336309: step: 144/530, loss: 0.005359150003641844 2023-01-22 18:27:43.421608: step: 148/530, loss: 0.021733876317739487 2023-01-22 18:27:44.506667: step: 152/530, loss: 0.0019560488872230053 2023-01-22 18:27:45.619514: step: 156/530, loss: 0.022906986996531487 2023-01-22 18:27:46.714576: step: 160/530, loss: 0.00881852675229311 2023-01-22 18:27:47.804055: step: 164/530, loss: 0.002233170671388507 2023-01-22 18:27:48.892574: step: 168/530, loss: 0.0030977248679846525 2023-01-22 18:27:49.994414: step: 172/530, loss: 0.009406842291355133 2023-01-22 18:27:51.078569: step: 176/530, loss: 9.771555050974712e-05 2023-01-22 18:27:52.176534: step: 180/530, loss: 0.0023808307014405727 2023-01-22 18:27:53.308164: step: 184/530, loss: 0.004987532738596201 2023-01-22 18:27:54.396413: step: 188/530, loss: 0.0067310575395822525 2023-01-22 18:27:55.493440: step: 192/530, loss: 0.00045536665129475296 2023-01-22 18:27:56.582359: step: 196/530, loss: 0.010355474427342415 2023-01-22 18:27:57.688402: step: 200/530, loss: 0.008715576492249966 2023-01-22 18:27:58.797269: step: 204/530, loss: 0.008107380010187626 2023-01-22 18:27:59.893957: step: 208/530, loss: 0.0026640372816473246 2023-01-22 18:28:01.008155: step: 212/530, loss: 0.003948599100112915 2023-01-22 18:28:02.106007: step: 216/530, loss: 0.016453798860311508 2023-01-22 18:28:03.198663: step: 220/530, loss: 0.008649768307805061 2023-01-22 18:28:04.280583: step: 224/530, loss: 0.006488385144621134 2023-01-22 18:28:05.377036: step: 228/530, loss: 0.009495281614363194 2023-01-22 18:28:06.472448: step: 232/530, loss: 0.0019276264356449246 2023-01-22 18:28:07.569936: step: 236/530, loss: 0.004236297681927681 2023-01-22 18:28:08.689290: step: 240/530, loss: 0.0031727757304906845 2023-01-22 18:28:09.819141: step: 244/530, loss: 0.009979244321584702 2023-01-22 18:28:10.912001: step: 248/530, loss: 0.008907273411750793 2023-01-22 18:28:12.043361: step: 252/530, loss: 0.008175627328455448 2023-01-22 18:28:13.136691: step: 256/530, loss: 0.003716078121215105 2023-01-22 18:28:14.245410: step: 260/530, loss: 0.0030617089942097664 2023-01-22 18:28:15.344562: step: 264/530, loss: 0.0064925262704491615 2023-01-22 18:28:16.418951: step: 268/530, loss: 0.004499923903495073 2023-01-22 18:28:17.539587: step: 272/530, loss: 0.0027902901638299227 2023-01-22 18:28:18.651066: step: 276/530, loss: 0.0049284156411886215 2023-01-22 18:28:19.748299: step: 280/530, loss: 0.10972261428833008 2023-01-22 18:28:20.839656: step: 284/530, loss: 0.003794509917497635 2023-01-22 18:28:21.947792: step: 288/530, loss: 0.0058370851911604404 2023-01-22 18:28:23.056608: step: 292/530, loss: 0.002325585577636957 2023-01-22 18:28:24.156242: step: 296/530, loss: 0.016462258994579315 2023-01-22 18:28:25.264078: step: 300/530, loss: 0.0026082347612828016 2023-01-22 18:28:26.350963: step: 304/530, loss: 0.0001077714332495816 2023-01-22 18:28:27.468221: step: 308/530, loss: 0.00916716642677784 2023-01-22 18:28:28.559462: step: 312/530, loss: 0.0018658683402463794 2023-01-22 18:28:29.667425: step: 316/530, loss: 0.008952973410487175 2023-01-22 18:28:30.787867: step: 320/530, loss: 0.0031925092916935682 2023-01-22 18:28:31.876913: step: 324/530, loss: 0.002578672720119357 2023-01-22 18:28:32.987075: step: 328/530, loss: 0.012113017030060291 2023-01-22 18:28:34.093820: step: 332/530, loss: 0.015871243551373482 2023-01-22 18:28:35.197450: step: 336/530, loss: 0.003200849983841181 2023-01-22 18:28:36.285196: step: 340/530, loss: 0.0035453704185783863 2023-01-22 18:28:37.391517: step: 344/530, loss: 0.006059712264686823 2023-01-22 18:28:38.484825: step: 348/530, loss: 0.0014549053739756346 2023-01-22 18:28:39.569617: step: 352/530, loss: 0.0005033534835092723 2023-01-22 18:28:40.680416: step: 356/530, loss: 0.010503847151994705 2023-01-22 18:28:41.804162: step: 360/530, loss: 0.0006020868895575404 2023-01-22 18:28:42.912137: step: 364/530, loss: 0.025041157379746437 2023-01-22 18:28:43.997690: step: 368/530, loss: 0.00463578337803483 2023-01-22 18:28:45.093213: step: 372/530, loss: 0.00018186590750701725 2023-01-22 18:28:46.213951: step: 376/530, loss: 0.010330156423151493 2023-01-22 18:28:47.367862: step: 380/530, loss: 0.042303700000047684 2023-01-22 18:28:48.474453: step: 384/530, loss: 0.005308076739311218 2023-01-22 18:28:49.621499: step: 388/530, loss: 0.003753856522962451 2023-01-22 18:28:50.727667: step: 392/530, loss: 0.005373753607273102 2023-01-22 18:28:51.822247: step: 396/530, loss: 0.004915583413094282 2023-01-22 18:28:52.907546: step: 400/530, loss: 0.005431151483207941 2023-01-22 18:28:54.008733: step: 404/530, loss: 0.034240443259477615 2023-01-22 18:28:55.114348: step: 408/530, loss: 0.004481774754822254 2023-01-22 18:28:56.217708: step: 412/530, loss: 0.004229320213198662 2023-01-22 18:28:57.308720: step: 416/530, loss: 0.027343405410647392 2023-01-22 18:28:58.410340: step: 420/530, loss: 0.009248564019799232 2023-01-22 18:28:59.528601: step: 424/530, loss: 0.005732208490371704 2023-01-22 18:29:00.635567: step: 428/530, loss: 0.00029404659289866686 2023-01-22 18:29:01.744094: step: 432/530, loss: 0.012223182246088982 2023-01-22 18:29:02.832440: step: 436/530, loss: 0.0030045306775718927 2023-01-22 18:29:03.930695: step: 440/530, loss: 0.004541632253676653 2023-01-22 18:29:05.051325: step: 444/530, loss: 0.025317862629890442 2023-01-22 18:29:06.166613: step: 448/530, loss: 0.006078396458178759 2023-01-22 18:29:07.264697: step: 452/530, loss: 0.005915583577007055 2023-01-22 18:29:08.373612: step: 456/530, loss: 0.008833033964037895 2023-01-22 18:29:09.472897: step: 460/530, loss: 0.001243118429556489 2023-01-22 18:29:10.551286: step: 464/530, loss: 0.0015866317553445697 2023-01-22 18:29:11.639081: step: 468/530, loss: 0.00038922682870179415 2023-01-22 18:29:12.732930: step: 472/530, loss: 2.3639402570552193e-05 2023-01-22 18:29:13.830036: step: 476/530, loss: 0.01827951893210411 2023-01-22 18:29:14.919659: step: 480/530, loss: 0.002740520052611828 2023-01-22 18:29:16.012791: step: 484/530, loss: 0.012980856001377106 2023-01-22 18:29:17.115641: step: 488/530, loss: 0.003744292538613081 2023-01-22 18:29:18.225683: step: 492/530, loss: 0.008897952735424042 2023-01-22 18:29:19.319518: step: 496/530, loss: 0.017438406124711037 2023-01-22 18:29:20.419831: step: 500/530, loss: 0.015113581903278828 2023-01-22 18:29:21.521809: step: 504/530, loss: 0.0201431754976511 2023-01-22 18:29:22.621969: step: 508/530, loss: 0.0005575797986239195 2023-01-22 18:29:23.733696: step: 512/530, loss: 0.004977009259164333 2023-01-22 18:29:24.875866: step: 516/530, loss: 0.00013052007125224918 2023-01-22 18:29:25.983001: step: 520/530, loss: 0.010828935541212559 2023-01-22 18:29:27.076673: step: 524/530, loss: 0.003017609706148505 2023-01-22 18:29:28.179035: step: 528/530, loss: 0.11536585539579391 2023-01-22 18:29:29.289171: step: 532/530, loss: 0.0012215098831802607 2023-01-22 18:29:30.407964: step: 536/530, loss: 0.004368349444121122 2023-01-22 18:29:31.504292: step: 540/530, loss: 0.00455597136169672 2023-01-22 18:29:32.629709: step: 544/530, loss: 0.015852967277169228 2023-01-22 18:29:33.748996: step: 548/530, loss: 0.0013160236412659287 2023-01-22 18:29:34.853182: step: 552/530, loss: 0.008815168403089046 2023-01-22 18:29:35.968638: step: 556/530, loss: 0.04347842186689377 2023-01-22 18:29:37.076195: step: 560/530, loss: 0.06092775613069534 2023-01-22 18:29:38.159755: step: 564/530, loss: 0.0027884505689144135 2023-01-22 18:29:39.275143: step: 568/530, loss: 0.0013436584267765284 2023-01-22 18:29:40.366933: step: 572/530, loss: 0.0016177746001631021 2023-01-22 18:29:41.463234: step: 576/530, loss: 0.026669178158044815 2023-01-22 18:29:42.558045: step: 580/530, loss: 0.00439387047663331 2023-01-22 18:29:43.675296: step: 584/530, loss: 0.002781476126983762 2023-01-22 18:29:44.757741: step: 588/530, loss: 0.009298130869865417 2023-01-22 18:29:45.864456: step: 592/530, loss: 0.0022303471341729164 2023-01-22 18:29:46.955610: step: 596/530, loss: 0.01920304261147976 2023-01-22 18:29:48.068164: step: 600/530, loss: 0.01152800489217043 2023-01-22 18:29:49.163102: step: 604/530, loss: 0.0010703217703849077 2023-01-22 18:29:50.271032: step: 608/530, loss: 0.006187962368130684 2023-01-22 18:29:51.377180: step: 612/530, loss: 0.025365499779582024 2023-01-22 18:29:52.477827: step: 616/530, loss: 0.001042837044224143 2023-01-22 18:29:53.568583: step: 620/530, loss: 0.018153347074985504 2023-01-22 18:29:54.677228: step: 624/530, loss: 0.0028189036529511213 2023-01-22 18:29:55.775394: step: 628/530, loss: 0.031228696927428246 2023-01-22 18:29:56.865048: step: 632/530, loss: 0.004321316722780466 2023-01-22 18:29:57.963425: step: 636/530, loss: 0.0039545269683003426 2023-01-22 18:29:59.084672: step: 640/530, loss: 0.008419704623520374 2023-01-22 18:30:00.204394: step: 644/530, loss: 0.023659128695726395 2023-01-22 18:30:01.294713: step: 648/530, loss: 0.006105189677327871 2023-01-22 18:30:02.374109: step: 652/530, loss: 0.004462653771042824 2023-01-22 18:30:03.482829: step: 656/530, loss: 0.014436847530305386 2023-01-22 18:30:04.595236: step: 660/530, loss: 0.0004893246805295348 2023-01-22 18:30:05.721845: step: 664/530, loss: 0.011037465184926987 2023-01-22 18:30:06.802200: step: 668/530, loss: 0.007631612475961447 2023-01-22 18:30:07.906574: step: 672/530, loss: 0.0025377729907631874 2023-01-22 18:30:09.017292: step: 676/530, loss: 0.007415556348860264 2023-01-22 18:30:10.098139: step: 680/530, loss: 0.00011127939069410786 2023-01-22 18:30:11.181907: step: 684/530, loss: 0.003199041122570634 2023-01-22 18:30:12.299988: step: 688/530, loss: 0.007297462783753872 2023-01-22 18:30:13.380454: step: 692/530, loss: 0.002811875194311142 2023-01-22 18:30:14.474184: step: 696/530, loss: 0.01668676547706127 2023-01-22 18:30:15.568299: step: 700/530, loss: 0.00025425234343856573 2023-01-22 18:30:16.654951: step: 704/530, loss: 0.00702581275254488 2023-01-22 18:30:17.765741: step: 708/530, loss: 0.00665396498516202 2023-01-22 18:30:18.893738: step: 712/530, loss: 0.004290307871997356 2023-01-22 18:30:20.001268: step: 716/530, loss: 0.006105480715632439 2023-01-22 18:30:21.098825: step: 720/530, loss: 0.0017243979964405298 2023-01-22 18:30:22.205734: step: 724/530, loss: 0.00618281913921237 2023-01-22 18:30:23.296575: step: 728/530, loss: 0.00036540484870783985 2023-01-22 18:30:24.386332: step: 732/530, loss: 0.018587326630949974 2023-01-22 18:30:25.492282: step: 736/530, loss: 0.01968672312796116 2023-01-22 18:30:26.621039: step: 740/530, loss: 0.00969591736793518 2023-01-22 18:30:27.725867: step: 744/530, loss: 0.018504971638321877 2023-01-22 18:30:28.836660: step: 748/530, loss: 0.003154666628688574 2023-01-22 18:30:29.935834: step: 752/530, loss: 0.0071092708967626095 2023-01-22 18:30:31.039012: step: 756/530, loss: 0.010406233370304108 2023-01-22 18:30:32.146019: step: 760/530, loss: 0.004511485807597637 2023-01-22 18:30:33.243280: step: 764/530, loss: 0.007421662099659443 2023-01-22 18:30:34.330185: step: 768/530, loss: 0.0016526951221749187 2023-01-22 18:30:35.422081: step: 772/530, loss: 0.0009398804395459592 2023-01-22 18:30:36.540979: step: 776/530, loss: 0.002562194596976042 2023-01-22 18:30:37.650758: step: 780/530, loss: 0.0023031991440802813 2023-01-22 18:30:38.733084: step: 784/530, loss: 0.00508621521294117 2023-01-22 18:30:39.827500: step: 788/530, loss: 0.017179515212774277 2023-01-22 18:30:40.936603: step: 792/530, loss: 0.004915738943964243 2023-01-22 18:30:42.044926: step: 796/530, loss: 0.0069856238551437855 2023-01-22 18:30:43.131637: step: 800/530, loss: 0.004629735369235277 2023-01-22 18:30:44.241267: step: 804/530, loss: 0.009691477753221989 2023-01-22 18:30:45.330230: step: 808/530, loss: 0.0017027984140440822 2023-01-22 18:30:46.426016: step: 812/530, loss: 0.002548523712903261 2023-01-22 18:30:47.520780: step: 816/530, loss: 0.005001395009458065 2023-01-22 18:30:48.644964: step: 820/530, loss: 0.006331135518848896 2023-01-22 18:30:49.753729: step: 824/530, loss: 0.010274523869156837 2023-01-22 18:30:50.846760: step: 828/530, loss: 0.009996467269957066 2023-01-22 18:30:51.933904: step: 832/530, loss: 0.0075516668148338795 2023-01-22 18:30:53.056614: step: 836/530, loss: 0.03111538477241993 2023-01-22 18:30:54.146371: step: 840/530, loss: 0.011280653066933155 2023-01-22 18:30:55.264742: step: 844/530, loss: 0.0026294696144759655 2023-01-22 18:30:56.403584: step: 848/530, loss: 0.003596894210204482 2023-01-22 18:30:57.504503: step: 852/530, loss: 0.022199522703886032 2023-01-22 18:30:58.583751: step: 856/530, loss: 0.005757243372499943 2023-01-22 18:30:59.698513: step: 860/530, loss: 0.012366288341581821 2023-01-22 18:31:00.816104: step: 864/530, loss: 0.0072590867057442665 2023-01-22 18:31:01.905330: step: 868/530, loss: 0.005211768206208944 2023-01-22 18:31:02.996555: step: 872/530, loss: 0.0007780153537169099 2023-01-22 18:31:04.106152: step: 876/530, loss: 0.006579045671969652 2023-01-22 18:31:05.192966: step: 880/530, loss: 0.00034035538556054235 2023-01-22 18:31:06.310851: step: 884/530, loss: 0.020639551803469658 2023-01-22 18:31:07.417366: step: 888/530, loss: 0.009564299136400223 2023-01-22 18:31:08.534379: step: 892/530, loss: 0.012995216995477676 2023-01-22 18:31:09.642671: step: 896/530, loss: 0.0038737058639526367 2023-01-22 18:31:10.733218: step: 900/530, loss: 0.004532379563897848 2023-01-22 18:31:11.868219: step: 904/530, loss: 0.009280158206820488 2023-01-22 18:31:12.975613: step: 908/530, loss: 0.0004263847367838025 2023-01-22 18:31:14.085809: step: 912/530, loss: 0.009736970998346806 2023-01-22 18:31:15.179123: step: 916/530, loss: 0.004490819294005632 2023-01-22 18:31:16.272469: step: 920/530, loss: 0.004912327975034714 2023-01-22 18:31:17.411040: step: 924/530, loss: 0.005350144580006599 2023-01-22 18:31:18.494531: step: 928/530, loss: 0.016704106703400612 2023-01-22 18:31:19.586533: step: 932/530, loss: 0.002201124094426632 2023-01-22 18:31:20.692987: step: 936/530, loss: 0.005016628187149763 2023-01-22 18:31:21.779310: step: 940/530, loss: 0.003153557190671563 2023-01-22 18:31:22.833614: step: 944/530, loss: 0.02185557782649994 2023-01-22 18:31:23.946658: step: 948/530, loss: 0.004187334794551134 2023-01-22 18:31:25.058790: step: 952/530, loss: 0.008498439565300941 2023-01-22 18:31:26.153772: step: 956/530, loss: 0.016587520018219948 2023-01-22 18:31:27.265204: step: 960/530, loss: 0.008890247903764248 2023-01-22 18:31:28.400394: step: 964/530, loss: 0.03038751147687435 2023-01-22 18:31:29.482203: step: 968/530, loss: 0.009932409040629864 2023-01-22 18:31:30.581994: step: 972/530, loss: 9.147833225142676e-06 2023-01-22 18:31:31.681367: step: 976/530, loss: 0.001971217803657055 2023-01-22 18:31:32.768394: step: 980/530, loss: 0.002326179528608918 2023-01-22 18:31:33.866718: step: 984/530, loss: 0.005505596753209829 2023-01-22 18:31:34.976757: step: 988/530, loss: 0.02590414695441723 2023-01-22 18:31:36.083668: step: 992/530, loss: 0.00020978087559342384 2023-01-22 18:31:37.183453: step: 996/530, loss: 0.011213100515305996 2023-01-22 18:31:38.299203: step: 1000/530, loss: 0.026498788967728615 2023-01-22 18:31:39.407766: step: 1004/530, loss: 0.003575400449335575 2023-01-22 18:31:40.542545: step: 1008/530, loss: 0.00878897961229086 2023-01-22 18:31:41.639552: step: 1012/530, loss: 0.004244158510118723 2023-01-22 18:31:42.741221: step: 1016/530, loss: 0.0026787789538502693 2023-01-22 18:31:43.838063: step: 1020/530, loss: 0.007764363661408424 2023-01-22 18:31:44.929338: step: 1024/530, loss: 0.0011498505482450128 2023-01-22 18:31:46.046636: step: 1028/530, loss: 0.002127460204064846 2023-01-22 18:31:47.149527: step: 1032/530, loss: 0.0024901870638132095 2023-01-22 18:31:48.249996: step: 1036/530, loss: 0.0077363974414765835 2023-01-22 18:31:49.337475: step: 1040/530, loss: 0.004087755922228098 2023-01-22 18:31:50.441931: step: 1044/530, loss: 0.010710582137107849 2023-01-22 18:31:51.531484: step: 1048/530, loss: 0.000266395159997046 2023-01-22 18:31:52.657928: step: 1052/530, loss: 0.005906963255256414 2023-01-22 18:31:53.758060: step: 1056/530, loss: 0.003952084109187126 2023-01-22 18:31:54.845729: step: 1060/530, loss: 0.0019199763191863894 2023-01-22 18:31:55.948274: step: 1064/530, loss: 0.004333644639700651 2023-01-22 18:31:57.046406: step: 1068/530, loss: 0.0038385805673897266 2023-01-22 18:31:58.151824: step: 1072/530, loss: 0.002833553357049823 2023-01-22 18:31:59.272361: step: 1076/530, loss: 0.005803776439279318 2023-01-22 18:32:00.380114: step: 1080/530, loss: 0.006797958631068468 2023-01-22 18:32:01.525800: step: 1084/530, loss: 0.008882487192749977 2023-01-22 18:32:02.672891: step: 1088/530, loss: 0.005546614062041044 2023-01-22 18:32:03.773200: step: 1092/530, loss: 0.007498566061258316 2023-01-22 18:32:04.870844: step: 1096/530, loss: 0.005331460852175951 2023-01-22 18:32:05.969412: step: 1100/530, loss: 0.004108885303139687 2023-01-22 18:32:07.065739: step: 1104/530, loss: 0.013274230994284153 2023-01-22 18:32:08.159229: step: 1108/530, loss: 0.001495203236117959 2023-01-22 18:32:09.294504: step: 1112/530, loss: 0.0014030119637027383 2023-01-22 18:32:10.388742: step: 1116/530, loss: 0.0009595714509487152 2023-01-22 18:32:11.489790: step: 1120/530, loss: 0.004312857985496521 2023-01-22 18:32:12.585826: step: 1124/530, loss: 0.002902315929532051 2023-01-22 18:32:13.672328: step: 1128/530, loss: 0.0015837440732866526 2023-01-22 18:32:14.760212: step: 1132/530, loss: 0.0006025604670867324 2023-01-22 18:32:15.834450: step: 1136/530, loss: 0.008249369449913502 2023-01-22 18:32:16.931451: step: 1140/530, loss: 0.008096471428871155 2023-01-22 18:32:18.037573: step: 1144/530, loss: 0.007233277428895235 2023-01-22 18:32:19.152709: step: 1148/530, loss: 0.0013244193978607655 2023-01-22 18:32:20.272354: step: 1152/530, loss: 0.003945418167859316 2023-01-22 18:32:21.398898: step: 1156/530, loss: 0.010840107686817646 2023-01-22 18:32:22.505418: step: 1160/530, loss: 0.0009566234075464308 2023-01-22 18:32:23.619795: step: 1164/530, loss: 0.004920309409499168 2023-01-22 18:32:24.728676: step: 1168/530, loss: 0.0018896886613219976 2023-01-22 18:32:25.840435: step: 1172/530, loss: 0.0015820706030353904 2023-01-22 18:32:26.960226: step: 1176/530, loss: 0.0010488731786608696 2023-01-22 18:32:28.056535: step: 1180/530, loss: 0.0010845185024663806 2023-01-22 18:32:29.166969: step: 1184/530, loss: 0.0032175439409911633 2023-01-22 18:32:30.268931: step: 1188/530, loss: 0.024632660672068596 2023-01-22 18:32:31.370168: step: 1192/530, loss: 0.0041234660893678665 2023-01-22 18:32:32.472260: step: 1196/530, loss: 0.0017406868282705545 2023-01-22 18:32:33.586700: step: 1200/530, loss: 0.0026537885423749685 2023-01-22 18:32:34.698879: step: 1204/530, loss: 0.01513298787176609 2023-01-22 18:32:35.799049: step: 1208/530, loss: 0.008798873983323574 2023-01-22 18:32:36.967342: step: 1212/530, loss: 0.004736314062029123 2023-01-22 18:32:38.061733: step: 1216/530, loss: 0.005063324701040983 2023-01-22 18:32:39.149975: step: 1220/530, loss: 0.001203644904308021 2023-01-22 18:32:40.272610: step: 1224/530, loss: 0.004585994407534599 2023-01-22 18:32:41.365885: step: 1228/530, loss: 0.005031667649745941 2023-01-22 18:32:42.459102: step: 1232/530, loss: 0.00317892013117671 2023-01-22 18:32:43.546377: step: 1236/530, loss: 0.0048159826546907425 2023-01-22 18:32:44.645514: step: 1240/530, loss: 0.002159917028620839 2023-01-22 18:32:45.724758: step: 1244/530, loss: 0.0027185932267457247 2023-01-22 18:32:46.842027: step: 1248/530, loss: 0.0073392740450799465 2023-01-22 18:32:47.926783: step: 1252/530, loss: 0.0010658196406438947 2023-01-22 18:32:49.027987: step: 1256/530, loss: 7.896054012235254e-05 2023-01-22 18:32:50.142823: step: 1260/530, loss: 0.010328765027225018 2023-01-22 18:32:51.218850: step: 1264/530, loss: 0.0020433415193110704 2023-01-22 18:32:52.321354: step: 1268/530, loss: 0.006494658067822456 2023-01-22 18:32:53.429099: step: 1272/530, loss: 0.004773708060383797 2023-01-22 18:32:54.507568: step: 1276/530, loss: 0.003112129168584943 2023-01-22 18:32:55.609831: step: 1280/530, loss: 0.0249512679874897 2023-01-22 18:32:56.709723: step: 1284/530, loss: 0.0022350058425217867 2023-01-22 18:32:57.810990: step: 1288/530, loss: 0.007941442541778088 2023-01-22 18:32:58.905111: step: 1292/530, loss: 0.004541994538158178 2023-01-22 18:33:00.024655: step: 1296/530, loss: 0.013734852895140648 2023-01-22 18:33:01.166284: step: 1300/530, loss: 0.008403218351304531 2023-01-22 18:33:02.274098: step: 1304/530, loss: 0.004030571319162846 2023-01-22 18:33:03.385308: step: 1308/530, loss: 0.00379652320407331 2023-01-22 18:33:04.487968: step: 1312/530, loss: 0.00011982818250544369 2023-01-22 18:33:05.589926: step: 1316/530, loss: 0.007124029099941254 2023-01-22 18:33:06.690432: step: 1320/530, loss: 0.0036713359877467155 2023-01-22 18:33:07.780056: step: 1324/530, loss: 0.0042560407891869545 2023-01-22 18:33:08.879629: step: 1328/530, loss: 0.0016115898033604026 2023-01-22 18:33:09.968737: step: 1332/530, loss: 0.00369810382835567 2023-01-22 18:33:11.072714: step: 1336/530, loss: 5.417061038315296e-05 2023-01-22 18:33:12.162906: step: 1340/530, loss: 0.013022118248045444 2023-01-22 18:33:13.255604: step: 1344/530, loss: 0.008205000311136246 2023-01-22 18:33:14.356371: step: 1348/530, loss: 0.0024616713635623455 2023-01-22 18:33:15.446410: step: 1352/530, loss: 0.015581676736474037 2023-01-22 18:33:16.554336: step: 1356/530, loss: 0.005608633626252413 2023-01-22 18:33:17.673172: step: 1360/530, loss: 0.0017849968280643225 2023-01-22 18:33:18.756373: step: 1364/530, loss: 0.001441963016986847 2023-01-22 18:33:19.844185: step: 1368/530, loss: 0.0038278549909591675 2023-01-22 18:33:20.941967: step: 1372/530, loss: 0.01854427345097065 2023-01-22 18:33:22.029125: step: 1376/530, loss: 0.002111167646944523 2023-01-22 18:33:23.155536: step: 1380/530, loss: 0.017942290753126144 2023-01-22 18:33:24.270941: step: 1384/530, loss: 0.004350887145847082 2023-01-22 18:33:25.378207: step: 1388/530, loss: 0.001139622530899942 2023-01-22 18:33:26.470135: step: 1392/530, loss: 0.0 2023-01-22 18:33:27.562580: step: 1396/530, loss: 0.00782643910497427 2023-01-22 18:33:28.663378: step: 1400/530, loss: 0.003277075942605734 2023-01-22 18:33:29.752815: step: 1404/530, loss: 0.006889357231557369 2023-01-22 18:33:30.848076: step: 1408/530, loss: 0.0027386583387851715 2023-01-22 18:33:31.966025: step: 1412/530, loss: 0.006297572050243616 2023-01-22 18:33:33.068220: step: 1416/530, loss: 0.0002503152936697006 2023-01-22 18:33:34.195474: step: 1420/530, loss: 0.007495633326470852 2023-01-22 18:33:35.290831: step: 1424/530, loss: 0.0046742577105760574 2023-01-22 18:33:36.404954: step: 1428/530, loss: 0.00758227938786149 2023-01-22 18:33:37.500075: step: 1432/530, loss: 0.003613221226260066 2023-01-22 18:33:38.635677: step: 1436/530, loss: 0.016247134655714035 2023-01-22 18:33:39.755009: step: 1440/530, loss: 0.003686268115416169 2023-01-22 18:33:40.835736: step: 1444/530, loss: 0.004092773888260126 2023-01-22 18:33:41.946200: step: 1448/530, loss: 0.0029255282133817673 2023-01-22 18:33:43.072637: step: 1452/530, loss: 0.026645731180906296 2023-01-22 18:33:44.195045: step: 1456/530, loss: 0.010394490323960781 2023-01-22 18:33:45.308638: step: 1460/530, loss: 0.004966864828020334 2023-01-22 18:33:46.393880: step: 1464/530, loss: 0.006544764619320631 2023-01-22 18:33:47.492640: step: 1468/530, loss: 0.02776217833161354 2023-01-22 18:33:48.600786: step: 1472/530, loss: 0.0045127058401703835 2023-01-22 18:33:49.706218: step: 1476/530, loss: 0.0007814022828824818 2023-01-22 18:33:50.803429: step: 1480/530, loss: 0.0019984205719083548 2023-01-22 18:33:51.905303: step: 1484/530, loss: 0.03594312071800232 2023-01-22 18:33:53.006424: step: 1488/530, loss: 0.0011367242550477386 2023-01-22 18:33:54.111913: step: 1492/530, loss: 0.01858605444431305 2023-01-22 18:33:55.194103: step: 1496/530, loss: 0.012442837469279766 2023-01-22 18:33:56.288787: step: 1500/530, loss: 0.054779428988695145 2023-01-22 18:33:57.402372: step: 1504/530, loss: 0.004249508958309889 2023-01-22 18:33:58.530214: step: 1508/530, loss: 0.006845967844128609 2023-01-22 18:33:59.640977: step: 1512/530, loss: 0.021029451861977577 2023-01-22 18:34:00.742904: step: 1516/530, loss: 0.002162677003070712 2023-01-22 18:34:01.846267: step: 1520/530, loss: 0.004090449772775173 2023-01-22 18:34:02.938876: step: 1524/530, loss: 0.006330376490950584 2023-01-22 18:34:04.022149: step: 1528/530, loss: 0.0016081409994512796 2023-01-22 18:34:05.128486: step: 1532/530, loss: 0.0043511539697647095 2023-01-22 18:34:06.223878: step: 1536/530, loss: 0.005677711218595505 2023-01-22 18:34:07.339622: step: 1540/530, loss: 0.036507170647382736 2023-01-22 18:34:08.423117: step: 1544/530, loss: 0.0038570270407944918 2023-01-22 18:34:09.503744: step: 1548/530, loss: 0.006900971755385399 2023-01-22 18:34:10.621531: step: 1552/530, loss: 0.008843934163451195 2023-01-22 18:34:11.743641: step: 1556/530, loss: 0.0018246282124891877 2023-01-22 18:34:12.849569: step: 1560/530, loss: 0.001417941297404468 2023-01-22 18:34:13.950602: step: 1564/530, loss: 0.03741540387272835 2023-01-22 18:34:15.042261: step: 1568/530, loss: 0.0013847595546394587 2023-01-22 18:34:16.141822: step: 1572/530, loss: 0.002411586930975318 2023-01-22 18:34:17.258743: step: 1576/530, loss: 0.008746135048568249 2023-01-22 18:34:18.354116: step: 1580/530, loss: 0.004413927439600229 2023-01-22 18:34:19.421222: step: 1584/530, loss: 0.005375355947762728 2023-01-22 18:34:20.514225: step: 1588/530, loss: 0.003987058997154236 2023-01-22 18:34:21.603741: step: 1592/530, loss: 0.0022512220311909914 2023-01-22 18:34:22.716135: step: 1596/530, loss: 0.00216246978379786 2023-01-22 18:34:23.817905: step: 1600/530, loss: 0.008033680729568005 2023-01-22 18:34:24.915529: step: 1604/530, loss: 0.00646651815623045 2023-01-22 18:34:26.011404: step: 1608/530, loss: 0.00499124638736248 2023-01-22 18:34:27.113652: step: 1612/530, loss: 0.00862337090075016 2023-01-22 18:34:28.194808: step: 1616/530, loss: 0.00017277048027608544 2023-01-22 18:34:29.302704: step: 1620/530, loss: 0.0036424994468688965 2023-01-22 18:34:30.400300: step: 1624/530, loss: 0.002481953240931034 2023-01-22 18:34:31.492686: step: 1628/530, loss: 0.000285786809399724 2023-01-22 18:34:32.586647: step: 1632/530, loss: 0.0014721582410857081 2023-01-22 18:34:33.683776: step: 1636/530, loss: 0.003251965157687664 2023-01-22 18:34:34.783567: step: 1640/530, loss: 0.03291851654648781 2023-01-22 18:34:35.865318: step: 1644/530, loss: 0.015224786475300789 2023-01-22 18:34:36.951753: step: 1648/530, loss: 0.002789664315059781 2023-01-22 18:34:38.058667: step: 1652/530, loss: 0.024261346086859703 2023-01-22 18:34:39.166045: step: 1656/530, loss: 0.0007601691759191453 2023-01-22 18:34:40.275678: step: 1660/530, loss: 0.0020782810170203447 2023-01-22 18:34:41.382756: step: 1664/530, loss: 0.005972633603960276 2023-01-22 18:34:42.481577: step: 1668/530, loss: 0.007904973812401295 2023-01-22 18:34:43.577836: step: 1672/530, loss: 0.004683814011514187 2023-01-22 18:34:44.679343: step: 1676/530, loss: 0.009097536094486713 2023-01-22 18:34:45.778783: step: 1680/530, loss: 0.004008658230304718 2023-01-22 18:34:46.859150: step: 1684/530, loss: 0.010705480352044106 2023-01-22 18:34:47.953576: step: 1688/530, loss: 0.0031620340887457132 2023-01-22 18:34:49.048139: step: 1692/530, loss: 0.002292171586304903 2023-01-22 18:34:50.141362: step: 1696/530, loss: 0.0029696908313781023 2023-01-22 18:34:51.223582: step: 1700/530, loss: 9.170618432108313e-05 2023-01-22 18:34:52.318356: step: 1704/530, loss: 0.006824272219091654 2023-01-22 18:34:53.434181: step: 1708/530, loss: 0.002788491314277053 2023-01-22 18:34:54.538405: step: 1712/530, loss: 0.00028299755649641156 2023-01-22 18:34:55.634965: step: 1716/530, loss: 0.004729172680526972 2023-01-22 18:34:56.716037: step: 1720/530, loss: 0.00674403365701437 2023-01-22 18:34:57.809270: step: 1724/530, loss: 0.0005443753907456994 2023-01-22 18:34:58.885487: step: 1728/530, loss: 0.004042500630021095 2023-01-22 18:34:59.991827: step: 1732/530, loss: 0.004739298485219479 2023-01-22 18:35:01.112883: step: 1736/530, loss: 0.016698963940143585 2023-01-22 18:35:02.223842: step: 1740/530, loss: 0.004124755505472422 2023-01-22 18:35:03.342097: step: 1744/530, loss: 0.00602650735527277 2023-01-22 18:35:04.437358: step: 1748/530, loss: 0.0001949649304151535 2023-01-22 18:35:05.528512: step: 1752/530, loss: 0.00897810235619545 2023-01-22 18:35:06.599489: step: 1756/530, loss: 0.0002865359710995108 2023-01-22 18:35:07.684677: step: 1760/530, loss: 0.00449963565915823 2023-01-22 18:35:08.795211: step: 1764/530, loss: 0.0045041609555482864 2023-01-22 18:35:09.894241: step: 1768/530, loss: 0.0038851157296448946 2023-01-22 18:35:10.982706: step: 1772/530, loss: 0.001119268243201077 2023-01-22 18:35:12.086064: step: 1776/530, loss: 0.014574144035577774 2023-01-22 18:35:13.176872: step: 1780/530, loss: 0.004657109268009663 2023-01-22 18:35:14.274829: step: 1784/530, loss: 0.0025860783644020557 2023-01-22 18:35:15.402364: step: 1788/530, loss: 0.005173766054213047 2023-01-22 18:35:16.501833: step: 1792/530, loss: 0.006994450464844704 2023-01-22 18:35:17.597318: step: 1796/530, loss: 0.0030993837863206863 2023-01-22 18:35:18.690939: step: 1800/530, loss: 0.0024590729735791683 2023-01-22 18:35:19.789480: step: 1804/530, loss: 0.010682656429708004 2023-01-22 18:35:20.893633: step: 1808/530, loss: 0.06118054315447807 2023-01-22 18:35:22.014099: step: 1812/530, loss: 0.0007971552549861372 2023-01-22 18:35:23.115989: step: 1816/530, loss: 0.005168508272618055 2023-01-22 18:35:24.229621: step: 1820/530, loss: 0.0006055228295736015 2023-01-22 18:35:25.328967: step: 1824/530, loss: 0.007847760803997517 2023-01-22 18:35:26.418382: step: 1828/530, loss: 0.0027650182601064444 2023-01-22 18:35:27.500173: step: 1832/530, loss: 0.00246259942650795 2023-01-22 18:35:28.609224: step: 1836/530, loss: 0.0003299112431704998 2023-01-22 18:35:29.701675: step: 1840/530, loss: 0.00890478678047657 2023-01-22 18:35:30.782488: step: 1844/530, loss: 0.0010243532015010715 2023-01-22 18:35:31.874384: step: 1848/530, loss: 0.00031048664823174477 2023-01-22 18:35:32.964415: step: 1852/530, loss: 0.003606498474255204 2023-01-22 18:35:34.045565: step: 1856/530, loss: 0.004054786171764135 2023-01-22 18:35:35.128360: step: 1860/530, loss: 0.0001850359549280256 2023-01-22 18:35:36.221977: step: 1864/530, loss: 0.0033533195964992046 2023-01-22 18:35:37.317120: step: 1868/530, loss: 0.0033644381910562515 2023-01-22 18:35:38.434973: step: 1872/530, loss: 0.0031397216953337193 2023-01-22 18:35:39.520246: step: 1876/530, loss: 0.0056030941195786 2023-01-22 18:35:40.615081: step: 1880/530, loss: 0.008420975878834724 2023-01-22 18:35:41.743267: step: 1884/530, loss: 0.0031390476506203413 2023-01-22 18:35:42.829045: step: 1888/530, loss: 0.004058401565998793 2023-01-22 18:35:43.931337: step: 1892/530, loss: 0.018810905516147614 2023-01-22 18:35:45.014010: step: 1896/530, loss: 0.0017225093906745315 2023-01-22 18:35:46.095407: step: 1900/530, loss: 0.00015182253264356405 2023-01-22 18:35:47.210653: step: 1904/530, loss: 0.014628239907324314 2023-01-22 18:35:48.322521: step: 1908/530, loss: 0.007030069828033447 2023-01-22 18:35:49.445205: step: 1912/530, loss: 0.0039815884083509445 2023-01-22 18:35:50.529411: step: 1916/530, loss: 0.0031995372846722603 2023-01-22 18:35:51.627154: step: 1920/530, loss: 0.0021978002041578293 2023-01-22 18:35:52.728575: step: 1924/530, loss: 0.011598794721066952 2023-01-22 18:35:53.796829: step: 1928/530, loss: 1.3859623322787229e-05 2023-01-22 18:35:54.892913: step: 1932/530, loss: 0.005122246686369181 2023-01-22 18:35:55.997700: step: 1936/530, loss: 0.000861929205711931 2023-01-22 18:35:57.096979: step: 1940/530, loss: 0.0037842500023543835 2023-01-22 18:35:58.204967: step: 1944/530, loss: 0.024135509505867958 2023-01-22 18:35:59.333265: step: 1948/530, loss: 0.004512297920882702 2023-01-22 18:36:00.423719: step: 1952/530, loss: 0.007814999669790268 2023-01-22 18:36:01.527772: step: 1956/530, loss: 0.0035329656675457954 2023-01-22 18:36:02.634719: step: 1960/530, loss: 0.007976973429322243 2023-01-22 18:36:03.766762: step: 1964/530, loss: 0.0010328668868169188 2023-01-22 18:36:04.849379: step: 1968/530, loss: 0.005584979895502329 2023-01-22 18:36:05.957997: step: 1972/530, loss: 0.0035292149987071753 2023-01-22 18:36:07.049911: step: 1976/530, loss: 0.013540218584239483 2023-01-22 18:36:08.166423: step: 1980/530, loss: 0.053867876529693604 2023-01-22 18:36:09.260676: step: 1984/530, loss: 0.007585104554891586 2023-01-22 18:36:10.359853: step: 1988/530, loss: 0.00833124853670597 2023-01-22 18:36:11.457933: step: 1992/530, loss: 0.01000333670526743 2023-01-22 18:36:12.569288: step: 1996/530, loss: 0.009707452729344368 2023-01-22 18:36:13.669947: step: 2000/530, loss: 0.0010923369554802775 2023-01-22 18:36:14.776856: step: 2004/530, loss: 0.01993182860314846 2023-01-22 18:36:15.875049: step: 2008/530, loss: 0.005449749529361725 2023-01-22 18:36:16.983489: step: 2012/530, loss: 0.002692443085834384 2023-01-22 18:36:18.100555: step: 2016/530, loss: 0.004566051997244358 2023-01-22 18:36:19.183135: step: 2020/530, loss: 0.005283520091325045 2023-01-22 18:36:20.290901: step: 2024/530, loss: 0.013108435086905956 2023-01-22 18:36:21.405011: step: 2028/530, loss: 0.006936965975910425 2023-01-22 18:36:22.481459: step: 2032/530, loss: 5.192582466406748e-05 2023-01-22 18:36:23.601098: step: 2036/530, loss: 0.007226844783872366 2023-01-22 18:36:24.700196: step: 2040/530, loss: 0.0064369551837444305 2023-01-22 18:36:25.807648: step: 2044/530, loss: 0.0069593158550560474 2023-01-22 18:36:26.910953: step: 2048/530, loss: 0.00316441198810935 2023-01-22 18:36:28.004513: step: 2052/530, loss: 0.006536487024277449 2023-01-22 18:36:29.100581: step: 2056/530, loss: 0.007403606548905373 2023-01-22 18:36:30.191269: step: 2060/530, loss: 0.008399543352425098 2023-01-22 18:36:31.317836: step: 2064/530, loss: 0.0011779998894780874 2023-01-22 18:36:32.430268: step: 2068/530, loss: 0.0026249131187796593 2023-01-22 18:36:33.535794: step: 2072/530, loss: 0.012515190988779068 2023-01-22 18:36:34.625563: step: 2076/530, loss: 0.0011450749589130282 2023-01-22 18:36:35.728458: step: 2080/530, loss: 0.0004367369692772627 2023-01-22 18:36:36.833791: step: 2084/530, loss: 0.01260147150605917 2023-01-22 18:36:37.947503: step: 2088/530, loss: 0.0008949777111411095 2023-01-22 18:36:39.061456: step: 2092/530, loss: 0.002702175173908472 2023-01-22 18:36:40.144519: step: 2096/530, loss: 0.0007663618307560682 2023-01-22 18:36:41.255417: step: 2100/530, loss: 0.0 2023-01-22 18:36:42.364341: step: 2104/530, loss: 0.008782296441495419 2023-01-22 18:36:43.478775: step: 2108/530, loss: 0.00501541281118989 2023-01-22 18:36:44.568395: step: 2112/530, loss: 0.020943904295563698 2023-01-22 18:36:45.663541: step: 2116/530, loss: 0.0034575266763567924 2023-01-22 18:36:46.768171: step: 2120/530, loss: 0.0016149027505889535 ================================================== Loss: 0.008 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33933928571428573, 'r': 0.35414915966386556, 'f1': 0.34658608568775695}, 'combined': 0.2553792210330841, 'stategy': 1, 'epoch': 7} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33212666223409204, 'r': 0.2838352484374436, 'f1': 0.30608793191493916}, 'combined': 0.19009671561033065, 'stategy': 1, 'epoch': 7} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34964647290162165, 'r': 0.3403579517998708, 'f1': 0.34493969345871517}, 'combined': 0.254166089916948, 'stategy': 1, 'epoch': 7} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.31974305221457255, 'r': 0.28685158096796964, 'f1': 0.30240557701628495}, 'combined': 0.18780977941011381, 'stategy': 1, 'epoch': 7} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34305908858973777, 'r': 0.32613397226462737, 'f1': 0.3343824968549779}, 'combined': 0.24638710294577318, 'stategy': 1, 'epoch': 7} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34803433338900086, 'r': 0.2968427088332643, 'f1': 0.3204066745318026}, 'combined': 0.19898940839343532, 'stategy': 1, 'epoch': 7} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 7} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.375, 'r': 0.5217391304347826, 'f1': 0.43636363636363634}, 'combined': 0.21818181818181817, 'stategy': 1, 'epoch': 7} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 7} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 8 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 18:39:17.305268: step: 4/530, loss: 0.007388156373053789 2023-01-22 18:39:18.389935: step: 8/530, loss: 0.0015344498679041862 2023-01-22 18:39:19.493914: step: 12/530, loss: 0.0018128934316337109 2023-01-22 18:39:20.586294: step: 16/530, loss: 0.009831286035478115 2023-01-22 18:39:21.709938: step: 20/530, loss: 0.007215637248009443 2023-01-22 18:39:22.805862: step: 24/530, loss: 0.014350504614412785 2023-01-22 18:39:23.921305: step: 28/530, loss: 0.0031574484892189503 2023-01-22 18:39:25.036614: step: 32/530, loss: 0.006929425522685051 2023-01-22 18:39:26.131168: step: 36/530, loss: 0.008028604090213776 2023-01-22 18:39:27.205299: step: 40/530, loss: 0.00025584796094335616 2023-01-22 18:39:28.261823: step: 44/530, loss: 0.00564237218350172 2023-01-22 18:39:29.351374: step: 48/530, loss: 0.007395686581730843 2023-01-22 18:39:30.471261: step: 52/530, loss: 0.008263861760497093 2023-01-22 18:39:31.591884: step: 56/530, loss: 0.004996147938072681 2023-01-22 18:39:32.670460: step: 60/530, loss: 0.0030164753552526236 2023-01-22 18:39:33.766937: step: 64/530, loss: 0.008622347377240658 2023-01-22 18:39:34.852600: step: 68/530, loss: 0.019499190151691437 2023-01-22 18:39:35.945092: step: 72/530, loss: 0.005495051387697458 2023-01-22 18:39:37.046808: step: 76/530, loss: 0.007131422404199839 2023-01-22 18:39:38.176448: step: 80/530, loss: 0.03309730067849159 2023-01-22 18:39:39.269665: step: 84/530, loss: 0.004485478159040213 2023-01-22 18:39:40.353764: step: 88/530, loss: 0.0018139644525945187 2023-01-22 18:39:41.444225: step: 92/530, loss: 0.0038743652403354645 2023-01-22 18:39:42.545993: step: 96/530, loss: 0.005034653469920158 2023-01-22 18:39:43.644355: step: 100/530, loss: 0.003150301519781351 2023-01-22 18:39:44.749628: step: 104/530, loss: 0.002994616748765111 2023-01-22 18:39:45.839926: step: 108/530, loss: 0.0015131353866308928 2023-01-22 18:39:46.936985: step: 112/530, loss: 0.016307523474097252 2023-01-22 18:39:48.043114: step: 116/530, loss: 0.0059173088520765305 2023-01-22 18:39:49.178474: step: 120/530, loss: 0.010499164462089539 2023-01-22 18:39:50.273610: step: 124/530, loss: 0.005338155198842287 2023-01-22 18:39:51.369981: step: 128/530, loss: 0.008071066811680794 2023-01-22 18:39:52.462831: step: 132/530, loss: 0.003561959834769368 2023-01-22 18:39:53.578583: step: 136/530, loss: 0.007174029015004635 2023-01-22 18:39:54.678094: step: 140/530, loss: 0.005008305888622999 2023-01-22 18:39:55.777540: step: 144/530, loss: 0.0001466915273340419 2023-01-22 18:39:56.888657: step: 148/530, loss: 0.008366018533706665 2023-01-22 18:39:57.980257: step: 152/530, loss: 0.026283252984285355 2023-01-22 18:39:59.093826: step: 156/530, loss: 0.009043721482157707 2023-01-22 18:40:00.213834: step: 160/530, loss: 0.008177349343895912 2023-01-22 18:40:01.337666: step: 164/530, loss: 0.0040166606195271015 2023-01-22 18:40:02.421421: step: 168/530, loss: 0.004817122593522072 2023-01-22 18:40:03.516208: step: 172/530, loss: 0.00043714369530789554 2023-01-22 18:40:04.602183: step: 176/530, loss: 0.0114826001226902 2023-01-22 18:40:05.718963: step: 180/530, loss: 0.0040775928646326065 2023-01-22 18:40:06.821912: step: 184/530, loss: 0.011558112688362598 2023-01-22 18:40:07.913762: step: 188/530, loss: 0.0068406532518565655 2023-01-22 18:40:08.999531: step: 192/530, loss: 0.020551558583974838 2023-01-22 18:40:10.092962: step: 196/530, loss: 0.001693563535809517 2023-01-22 18:40:11.190691: step: 200/530, loss: 0.06349463015794754 2023-01-22 18:40:12.310895: step: 204/530, loss: 0.01125803217291832 2023-01-22 18:40:13.413052: step: 208/530, loss: 0.0010764760663732886 2023-01-22 18:40:14.499285: step: 212/530, loss: 0.0006107440567575395 2023-01-22 18:40:15.583558: step: 216/530, loss: 0.0032729203812777996 2023-01-22 18:40:16.675312: step: 220/530, loss: 0.004097287077456713 2023-01-22 18:40:17.758062: step: 224/530, loss: 0.003067636862397194 2023-01-22 18:40:18.892130: step: 228/530, loss: 0.007797864731401205 2023-01-22 18:40:20.007892: step: 232/530, loss: 0.0007214655051939189 2023-01-22 18:40:21.095637: step: 236/530, loss: 0.0006559145986102521 2023-01-22 18:40:22.204810: step: 240/530, loss: 0.003197344485670328 2023-01-22 18:40:23.316449: step: 244/530, loss: 0.00365530326962471 2023-01-22 18:40:24.412604: step: 248/530, loss: 0.008429373614490032 2023-01-22 18:40:25.530787: step: 252/530, loss: 0.004971066489815712 2023-01-22 18:40:26.630554: step: 256/530, loss: 0.0021796892397105694 2023-01-22 18:40:27.742775: step: 260/530, loss: 0.004744360689073801 2023-01-22 18:40:28.847683: step: 264/530, loss: 0.0015998062444850802 2023-01-22 18:40:29.942800: step: 268/530, loss: 0.004553547594696283 2023-01-22 18:40:31.036774: step: 272/530, loss: 0.0014314936706796288 2023-01-22 18:40:32.145230: step: 276/530, loss: 0.004400314763188362 2023-01-22 18:40:33.282514: step: 280/530, loss: 0.012932044453918934 2023-01-22 18:40:34.401100: step: 284/530, loss: 0.0004229581099934876 2023-01-22 18:40:35.511927: step: 288/530, loss: 0.05883161351084709 2023-01-22 18:40:36.614159: step: 292/530, loss: 0.005640116985887289 2023-01-22 18:40:37.711531: step: 296/530, loss: 0.0003104460774920881 2023-01-22 18:40:38.806462: step: 300/530, loss: 0.0044784098863601685 2023-01-22 18:40:39.915751: step: 304/530, loss: 0.005911798216402531 2023-01-22 18:40:41.010949: step: 308/530, loss: 0.0025081285275518894 2023-01-22 18:40:42.096567: step: 312/530, loss: 0.0013118191855028272 2023-01-22 18:40:43.186130: step: 316/530, loss: 0.016062332317233086 2023-01-22 18:40:44.294777: step: 320/530, loss: 0.0030639884062111378 2023-01-22 18:40:45.435603: step: 324/530, loss: 0.005788047332316637 2023-01-22 18:40:46.558833: step: 328/530, loss: 0.003149400232359767 2023-01-22 18:40:47.650547: step: 332/530, loss: 0.005945851560682058 2023-01-22 18:40:48.776318: step: 336/530, loss: 0.002734619891270995 2023-01-22 18:40:49.857128: step: 340/530, loss: 0.0068957204930484295 2023-01-22 18:40:50.955750: step: 344/530, loss: 0.0010261823190376163 2023-01-22 18:40:52.038179: step: 348/530, loss: 0.0073088607750833035 2023-01-22 18:40:53.140944: step: 352/530, loss: 0.002897347556427121 2023-01-22 18:40:54.252916: step: 356/530, loss: 0.10373104363679886 2023-01-22 18:40:55.390364: step: 360/530, loss: 0.0011780316708609462 2023-01-22 18:40:56.486911: step: 364/530, loss: 0.00012777314987033606 2023-01-22 18:40:57.579543: step: 368/530, loss: 0.0021382318809628487 2023-01-22 18:40:58.687226: step: 372/530, loss: 0.003371322061866522 2023-01-22 18:40:59.793463: step: 376/530, loss: 0.0054047973826527596 2023-01-22 18:41:00.904131: step: 380/530, loss: 0.00026519360835663974 2023-01-22 18:41:02.010470: step: 384/530, loss: 0.006048600655049086 2023-01-22 18:41:03.096736: step: 388/530, loss: 0.0013884049840271473 2023-01-22 18:41:04.196659: step: 392/530, loss: 0.012104946188628674 2023-01-22 18:41:05.304344: step: 396/530, loss: 0.0038868628907948732 2023-01-22 18:41:06.403922: step: 400/530, loss: 0.005234112497419119 2023-01-22 18:41:07.504088: step: 404/530, loss: 0.008141560479998589 2023-01-22 18:41:08.575163: step: 408/530, loss: 4.81834695165162e-06 2023-01-22 18:41:09.661242: step: 412/530, loss: 0.0002958564436994493 2023-01-22 18:41:10.759000: step: 416/530, loss: 0.008125375024974346 2023-01-22 18:41:11.870341: step: 420/530, loss: 0.002929950598627329 2023-01-22 18:41:12.952083: step: 424/530, loss: 0.008882114663720131 2023-01-22 18:41:14.043844: step: 428/530, loss: 0.0013432524865493178 2023-01-22 18:41:15.160546: step: 432/530, loss: 0.0036510159261524677 2023-01-22 18:41:16.235192: step: 436/530, loss: 0.002689539222046733 2023-01-22 18:41:17.349510: step: 440/530, loss: 0.0008996232063509524 2023-01-22 18:41:18.463814: step: 444/530, loss: 0.0025219181552529335 2023-01-22 18:41:19.575613: step: 448/530, loss: 0.003783931490033865 2023-01-22 18:41:20.673486: step: 452/530, loss: 0.009089943952858448 2023-01-22 18:41:21.766387: step: 456/530, loss: 0.05749931186437607 2023-01-22 18:41:22.851562: step: 460/530, loss: 0.002829259494319558 2023-01-22 18:41:23.946065: step: 464/530, loss: 0.0046712858602404594 2023-01-22 18:41:25.045290: step: 468/530, loss: 0.03202364593744278 2023-01-22 18:41:26.150570: step: 472/530, loss: 0.003799722297117114 2023-01-22 18:41:27.254338: step: 476/530, loss: 0.007668789941817522 2023-01-22 18:41:28.344989: step: 480/530, loss: 0.014642185531556606 2023-01-22 18:41:29.452286: step: 484/530, loss: 0.0238353181630373 2023-01-22 18:41:30.568519: step: 488/530, loss: 0.006100240629166365 2023-01-22 18:41:31.663403: step: 492/530, loss: 0.0009572201524861157 2023-01-22 18:41:32.774159: step: 496/530, loss: 0.0013079307973384857 2023-01-22 18:41:33.882846: step: 500/530, loss: 0.020869150757789612 2023-01-22 18:41:34.976241: step: 504/530, loss: 0.009384731762111187 2023-01-22 18:41:36.052256: step: 508/530, loss: 0.009377263486385345 2023-01-22 18:41:37.134703: step: 512/530, loss: 0.001966709503903985 2023-01-22 18:41:38.219964: step: 516/530, loss: 0.002783228876069188 2023-01-22 18:41:39.304487: step: 520/530, loss: 0.002126112813130021 2023-01-22 18:41:40.415986: step: 524/530, loss: 0.001104741240851581 2023-01-22 18:41:41.537852: step: 528/530, loss: 0.006545455195009708 2023-01-22 18:41:42.649723: step: 532/530, loss: 0.009132733568549156 2023-01-22 18:41:43.756156: step: 536/530, loss: 1.1474792700028047e-05 2023-01-22 18:41:44.838335: step: 540/530, loss: 0.02148590050637722 2023-01-22 18:41:45.952529: step: 544/530, loss: 0.003492011921480298 2023-01-22 18:41:47.069384: step: 548/530, loss: 0.0037010449450463057 2023-01-22 18:41:48.163429: step: 552/530, loss: 0.003186080139130354 2023-01-22 18:41:49.259226: step: 556/530, loss: 0.012086662463843822 2023-01-22 18:41:50.363781: step: 560/530, loss: 0.004258180037140846 2023-01-22 18:41:51.493545: step: 564/530, loss: 0.0064422027207911015 2023-01-22 18:41:52.603644: step: 568/530, loss: 0.010450919158756733 2023-01-22 18:41:53.678805: step: 572/530, loss: 0.00021632964489981532 2023-01-22 18:41:54.777540: step: 576/530, loss: 0.0028493760619312525 2023-01-22 18:41:55.867863: step: 580/530, loss: 0.0034244342241436243 2023-01-22 18:41:56.966468: step: 584/530, loss: 0.008110796101391315 2023-01-22 18:41:58.091909: step: 588/530, loss: 0.0013099772622808814 2023-01-22 18:41:59.194801: step: 592/530, loss: 0.00390882370993495 2023-01-22 18:42:00.300980: step: 596/530, loss: 0.006104831583797932 2023-01-22 18:42:01.385462: step: 600/530, loss: 0.003616774221882224 2023-01-22 18:42:02.490142: step: 604/530, loss: 0.00127408467233181 2023-01-22 18:42:03.593321: step: 608/530, loss: 0.0002809033030644059 2023-01-22 18:42:04.704521: step: 612/530, loss: 0.0034628703724592924 2023-01-22 18:42:05.799238: step: 616/530, loss: 0.001268115476705134 2023-01-22 18:42:06.894254: step: 620/530, loss: 0.007326859049499035 2023-01-22 18:42:08.008000: step: 624/530, loss: 0.003486846573650837 2023-01-22 18:42:09.123167: step: 628/530, loss: 0.0013649256434291601 2023-01-22 18:42:10.223886: step: 632/530, loss: 0.003663488896563649 2023-01-22 18:42:11.354255: step: 636/530, loss: 0.003642222611233592 2023-01-22 18:42:12.471814: step: 640/530, loss: 0.014086704701185226 2023-01-22 18:42:13.575174: step: 644/530, loss: 0.011483301408588886 2023-01-22 18:42:14.695180: step: 648/530, loss: 0.014000587165355682 2023-01-22 18:42:15.787707: step: 652/530, loss: 0.0019541641231626272 2023-01-22 18:42:16.890703: step: 656/530, loss: 0.003688916563987732 2023-01-22 18:42:17.948576: step: 660/530, loss: 0.004820521920919418 2023-01-22 18:42:19.028918: step: 664/530, loss: 0.0037048442754894495 2023-01-22 18:42:20.130700: step: 668/530, loss: 0.00088413868797943 2023-01-22 18:42:21.240851: step: 672/530, loss: 0.008120663464069366 2023-01-22 18:42:22.322660: step: 676/530, loss: 0.0010722496081143618 2023-01-22 18:42:23.402770: step: 680/530, loss: 0.0059935906901955605 2023-01-22 18:42:24.511513: step: 684/530, loss: 0.004710780922323465 2023-01-22 18:42:25.621207: step: 688/530, loss: 0.002258643275126815 2023-01-22 18:42:26.716189: step: 692/530, loss: 0.010286723263561726 2023-01-22 18:42:27.832316: step: 696/530, loss: 0.0005337955080904067 2023-01-22 18:42:28.943029: step: 700/530, loss: 0.0029301673639565706 2023-01-22 18:42:30.029926: step: 704/530, loss: 0.0010197005467489362 2023-01-22 18:42:31.119476: step: 708/530, loss: 0.00235172500833869 2023-01-22 18:42:32.223573: step: 712/530, loss: 4.155106125836028e-06 2023-01-22 18:42:33.334595: step: 716/530, loss: 0.0037140788044780493 2023-01-22 18:42:34.471457: step: 720/530, loss: 0.016127701848745346 2023-01-22 18:42:35.553750: step: 724/530, loss: 0.0005109111662022769 2023-01-22 18:42:36.629712: step: 728/530, loss: 0.006089877337217331 2023-01-22 18:42:37.746152: step: 732/530, loss: 0.005313365254551172 2023-01-22 18:42:38.848613: step: 736/530, loss: 0.0014886532444506884 2023-01-22 18:42:39.948960: step: 740/530, loss: 0.00926622562110424 2023-01-22 18:42:41.062999: step: 744/530, loss: 0.0006086198263801634 2023-01-22 18:42:42.189694: step: 748/530, loss: 0.010885899886488914 2023-01-22 18:42:43.312560: step: 752/530, loss: 0.0059586940333247185 2023-01-22 18:42:44.439487: step: 756/530, loss: 0.005535410717129707 2023-01-22 18:42:45.553813: step: 760/530, loss: 0.007350731175392866 2023-01-22 18:42:46.653626: step: 764/530, loss: 0.0009643484372645617 2023-01-22 18:42:47.760868: step: 768/530, loss: 0.006084567867219448 2023-01-22 18:42:48.855004: step: 772/530, loss: 0.01721637323498726 2023-01-22 18:42:49.962897: step: 776/530, loss: 0.007361912168562412 2023-01-22 18:42:51.062502: step: 780/530, loss: 0.00501954136416316 2023-01-22 18:42:52.141517: step: 784/530, loss: 0.017124975100159645 2023-01-22 18:42:53.224277: step: 788/530, loss: 0.0024047335609793663 2023-01-22 18:42:54.325538: step: 792/530, loss: 0.008885848335921764 2023-01-22 18:42:55.407178: step: 796/530, loss: 0.00019390931993257254 2023-01-22 18:42:56.508666: step: 800/530, loss: 0.0064721559174358845 2023-01-22 18:42:57.609951: step: 804/530, loss: 0.00936433020979166 2023-01-22 18:42:58.692796: step: 808/530, loss: 0.008190997876226902 2023-01-22 18:42:59.794437: step: 812/530, loss: 0.00391278974711895 2023-01-22 18:43:00.896893: step: 816/530, loss: 0.005585444159805775 2023-01-22 18:43:01.994604: step: 820/530, loss: 0.0018051897641271353 2023-01-22 18:43:03.120689: step: 824/530, loss: 0.00956685934215784 2023-01-22 18:43:04.225225: step: 828/530, loss: 0.004708088468760252 2023-01-22 18:43:05.345999: step: 832/530, loss: 0.012936240062117577 2023-01-22 18:43:06.457131: step: 836/530, loss: 0.00329538993537426 2023-01-22 18:43:07.533267: step: 840/530, loss: 0.01207366306334734 2023-01-22 18:43:08.636025: step: 844/530, loss: 0.004577316343784332 2023-01-22 18:43:09.742197: step: 848/530, loss: 0.006770789623260498 2023-01-22 18:43:10.844306: step: 852/530, loss: 1.0023153436122811e-06 2023-01-22 18:43:11.949134: step: 856/530, loss: 0.0012699918588623405 2023-01-22 18:43:13.047822: step: 860/530, loss: 0.0027047626208513975 2023-01-22 18:43:14.186135: step: 864/530, loss: 0.00703151011839509 2023-01-22 18:43:15.293596: step: 868/530, loss: 0.00563738401979208 2023-01-22 18:43:16.396550: step: 872/530, loss: 0.014759116806089878 2023-01-22 18:43:17.547692: step: 876/530, loss: 0.004694843199104071 2023-01-22 18:43:18.638989: step: 880/530, loss: 0.0023958419915288687 2023-01-22 18:43:19.748555: step: 884/530, loss: 0.0009593351278454065 2023-01-22 18:43:20.836028: step: 888/530, loss: 0.005466763861477375 2023-01-22 18:43:21.938302: step: 892/530, loss: 0.007187244016677141 2023-01-22 18:43:23.058643: step: 896/530, loss: 0.0025142570957541466 2023-01-22 18:43:24.169156: step: 900/530, loss: 0.004243083298206329 2023-01-22 18:43:25.259637: step: 904/530, loss: 0.0016123928362503648 2023-01-22 18:43:26.354006: step: 908/530, loss: 0.0074295299127697945 2023-01-22 18:43:27.476687: step: 912/530, loss: 0.007709177676588297 2023-01-22 18:43:28.579130: step: 916/530, loss: 0.01350318267941475 2023-01-22 18:43:29.690191: step: 920/530, loss: 0.002081478713080287 2023-01-22 18:43:30.790968: step: 924/530, loss: 0.006151957903057337 2023-01-22 18:43:31.881904: step: 928/530, loss: 0.0008753815782256424 2023-01-22 18:43:32.989964: step: 932/530, loss: 0.010530886240303516 2023-01-22 18:43:34.080106: step: 936/530, loss: 0.0027114395052194595 2023-01-22 18:43:35.196582: step: 940/530, loss: 0.002038032514974475 2023-01-22 18:43:36.313357: step: 944/530, loss: 0.0014491023030132055 2023-01-22 18:43:37.421888: step: 948/530, loss: 0.04799647256731987 2023-01-22 18:43:38.515511: step: 952/530, loss: 0.011955811642110348 2023-01-22 18:43:39.641733: step: 956/530, loss: 0.003184965346008539 2023-01-22 18:43:40.719869: step: 960/530, loss: 0.00422566756606102 2023-01-22 18:43:41.828537: step: 964/530, loss: 0.007717070635408163 2023-01-22 18:43:42.922714: step: 968/530, loss: 0.0023763130884617567 2023-01-22 18:43:44.025570: step: 972/530, loss: 0.008148809894919395 2023-01-22 18:43:45.124602: step: 976/530, loss: 0.0048790560103952885 2023-01-22 18:43:46.218930: step: 980/530, loss: 0.0020296794828027487 2023-01-22 18:43:47.330334: step: 984/530, loss: 0.0063913497142493725 2023-01-22 18:43:48.422758: step: 988/530, loss: 0.0021754205226898193 2023-01-22 18:43:49.530665: step: 992/530, loss: 0.0029841738287359476 2023-01-22 18:43:50.646511: step: 996/530, loss: 0.00038652989314869046 2023-01-22 18:43:51.727559: step: 1000/530, loss: 0.004347706213593483 2023-01-22 18:43:52.832971: step: 1004/530, loss: 0.011413280852138996 2023-01-22 18:43:53.933687: step: 1008/530, loss: 0.005719151347875595 2023-01-22 18:43:55.038259: step: 1012/530, loss: 0.02083134651184082 2023-01-22 18:43:56.132297: step: 1016/530, loss: 0.00015534705016762018 2023-01-22 18:43:57.216713: step: 1020/530, loss: 0.010990736074745655 2023-01-22 18:43:58.326538: step: 1024/530, loss: 0.003862551413476467 2023-01-22 18:43:59.435014: step: 1028/530, loss: 0.007739650085568428 2023-01-22 18:44:00.535147: step: 1032/530, loss: 0.003504781750962138 2023-01-22 18:44:01.644763: step: 1036/530, loss: 0.008097977377474308 2023-01-22 18:44:02.768325: step: 1040/530, loss: 0.0045357379131019115 2023-01-22 18:44:03.888182: step: 1044/530, loss: 0.009852608665823936 2023-01-22 18:44:04.982134: step: 1048/530, loss: 0.0010357053251937032 2023-01-22 18:44:06.080467: step: 1052/530, loss: 0.0044439793564379215 2023-01-22 18:44:07.158072: step: 1056/530, loss: 1.589901694387663e-05 2023-01-22 18:44:08.270367: step: 1060/530, loss: 0.011970419436693192 2023-01-22 18:44:09.363287: step: 1064/530, loss: 0.0026482355315238237 2023-01-22 18:44:10.477131: step: 1068/530, loss: 0.00543260108679533 2023-01-22 18:44:11.572745: step: 1072/530, loss: 0.004344042856246233 2023-01-22 18:44:12.673865: step: 1076/530, loss: 0.001634949236176908 2023-01-22 18:44:13.788313: step: 1080/530, loss: 0.010718392208218575 2023-01-22 18:44:14.898459: step: 1084/530, loss: 0.00682159373536706 2023-01-22 18:44:15.996929: step: 1088/530, loss: 0.00335360923781991 2023-01-22 18:44:17.094904: step: 1092/530, loss: 0.006648879498243332 2023-01-22 18:44:18.182369: step: 1096/530, loss: 0.0009464729228056967 2023-01-22 18:44:19.290644: step: 1100/530, loss: 0.05777476727962494 2023-01-22 18:44:20.385497: step: 1104/530, loss: 0.0010224033612757921 2023-01-22 18:44:21.501573: step: 1108/530, loss: 0.010388949885964394 2023-01-22 18:44:22.594998: step: 1112/530, loss: 0.01638748124241829 2023-01-22 18:44:23.700083: step: 1116/530, loss: 0.00656832056120038 2023-01-22 18:44:24.775070: step: 1120/530, loss: 0.001014142413623631 2023-01-22 18:44:25.844781: step: 1124/530, loss: 0.002948155626654625 2023-01-22 18:44:26.939722: step: 1128/530, loss: 0.0008527644677087665 2023-01-22 18:44:28.038925: step: 1132/530, loss: 0.004900769796222448 2023-01-22 18:44:29.144187: step: 1136/530, loss: 0.0004243611474521458 2023-01-22 18:44:30.240225: step: 1140/530, loss: 0.002492793370038271 2023-01-22 18:44:31.351574: step: 1144/530, loss: 0.005905480124056339 2023-01-22 18:44:32.470344: step: 1148/530, loss: 0.011737021617591381 2023-01-22 18:44:33.576356: step: 1152/530, loss: 0.010104364715516567 2023-01-22 18:44:34.679636: step: 1156/530, loss: 0.0032714896369725466 2023-01-22 18:44:35.773446: step: 1160/530, loss: 0.004936861339956522 2023-01-22 18:44:36.875899: step: 1164/530, loss: 0.00797466840595007 2023-01-22 18:44:37.950526: step: 1168/530, loss: 0.0021329522132873535 2023-01-22 18:44:39.062135: step: 1172/530, loss: 0.00536087341606617 2023-01-22 18:44:40.179232: step: 1176/530, loss: 0.003951833583414555 2023-01-22 18:44:41.273321: step: 1180/530, loss: 0.008810511790215969 2023-01-22 18:44:42.373563: step: 1184/530, loss: 0.04611946642398834 2023-01-22 18:44:43.475587: step: 1188/530, loss: 0.022184358909726143 2023-01-22 18:44:44.572301: step: 1192/530, loss: 0.004205614328384399 2023-01-22 18:44:45.663789: step: 1196/530, loss: 0.0005284690414555371 2023-01-22 18:44:46.755210: step: 1200/530, loss: 0.004280883818864822 2023-01-22 18:44:47.872945: step: 1204/530, loss: 0.003171307034790516 2023-01-22 18:44:48.981414: step: 1208/530, loss: 0.007054960820823908 2023-01-22 18:44:50.077433: step: 1212/530, loss: 0.005159756634384394 2023-01-22 18:44:51.183363: step: 1216/530, loss: 0.0030938643030822277 2023-01-22 18:44:52.287822: step: 1220/530, loss: 0.01114040520042181 2023-01-22 18:44:53.399641: step: 1224/530, loss: 0.020213384181261063 2023-01-22 18:44:54.508268: step: 1228/530, loss: 0.007830311544239521 2023-01-22 18:44:55.604397: step: 1232/530, loss: 0.006653353571891785 2023-01-22 18:44:56.715241: step: 1236/530, loss: 0.010676193051040173 2023-01-22 18:44:57.843940: step: 1240/530, loss: 0.007289595436304808 2023-01-22 18:44:58.938392: step: 1244/530, loss: 0.0049084085039794445 2023-01-22 18:45:00.044350: step: 1248/530, loss: 0.029946664348244667 2023-01-22 18:45:01.132760: step: 1252/530, loss: 0.006143920123577118 2023-01-22 18:45:02.226403: step: 1256/530, loss: 0.0018259295029565692 2023-01-22 18:45:03.323819: step: 1260/530, loss: 0.009663070552051067 2023-01-22 18:45:04.415545: step: 1264/530, loss: 0.0010316005209460855 2023-01-22 18:45:05.519521: step: 1268/530, loss: 0.003054466098546982 2023-01-22 18:45:06.630670: step: 1272/530, loss: 0.005911185871809721 2023-01-22 18:45:07.761087: step: 1276/530, loss: 0.0035121699329465628 2023-01-22 18:45:08.857635: step: 1280/530, loss: 0.030863603577017784 2023-01-22 18:45:09.965532: step: 1284/530, loss: 0.02290409430861473 2023-01-22 18:45:11.082515: step: 1288/530, loss: 0.004529096651822329 2023-01-22 18:45:12.179264: step: 1292/530, loss: 0.010354121215641499 2023-01-22 18:45:13.279798: step: 1296/530, loss: 0.00481444364413619 2023-01-22 18:45:14.377871: step: 1300/530, loss: 0.007985670119524002 2023-01-22 18:45:15.481632: step: 1304/530, loss: 0.03664156794548035 2023-01-22 18:45:16.604363: step: 1308/530, loss: 0.002835296094417572 2023-01-22 18:45:17.713155: step: 1312/530, loss: 0.00440608337521553 2023-01-22 18:45:18.813952: step: 1316/530, loss: 0.004514886066317558 2023-01-22 18:45:19.904425: step: 1320/530, loss: 0.003778372658416629 2023-01-22 18:45:21.005487: step: 1324/530, loss: 0.0034132925793528557 2023-01-22 18:45:22.098054: step: 1328/530, loss: 0.002136263297870755 2023-01-22 18:45:23.186190: step: 1332/530, loss: 0.002274127444252372 2023-01-22 18:45:24.263358: step: 1336/530, loss: 0.0010393350385129452 2023-01-22 18:45:25.357414: step: 1340/530, loss: 0.019602840766310692 2023-01-22 18:45:26.470544: step: 1344/530, loss: 0.0013386289356276393 2023-01-22 18:45:27.570659: step: 1348/530, loss: 0.006865911651402712 2023-01-22 18:45:28.663046: step: 1352/530, loss: 0.005287148989737034 2023-01-22 18:45:29.753354: step: 1356/530, loss: 0.00351408077403903 2023-01-22 18:45:30.869552: step: 1360/530, loss: 0.016778897494077682 2023-01-22 18:45:31.969429: step: 1364/530, loss: 0.009416652843356133 2023-01-22 18:45:33.061494: step: 1368/530, loss: 0.0018788962624967098 2023-01-22 18:45:34.170752: step: 1372/530, loss: 0.007068673148751259 2023-01-22 18:45:35.270767: step: 1376/530, loss: 0.003668523859232664 2023-01-22 18:45:36.361222: step: 1380/530, loss: 0.0065972814336419106 2023-01-22 18:45:37.453069: step: 1384/530, loss: 0.004082637373358011 2023-01-22 18:45:38.533472: step: 1388/530, loss: 0.0013107869308441877 2023-01-22 18:45:39.630415: step: 1392/530, loss: 0.017675383016467094 2023-01-22 18:45:40.744758: step: 1396/530, loss: 0.004469520412385464 2023-01-22 18:45:41.849199: step: 1400/530, loss: 0.004404785577207804 2023-01-22 18:45:42.952952: step: 1404/530, loss: 0.005567232612520456 2023-01-22 18:45:44.047605: step: 1408/530, loss: 0.004682925529778004 2023-01-22 18:45:45.135439: step: 1412/530, loss: 0.02175498753786087 2023-01-22 18:45:46.244629: step: 1416/530, loss: 0.012862207368016243 2023-01-22 18:45:47.329270: step: 1420/530, loss: 0.0 2023-01-22 18:45:48.445932: step: 1424/530, loss: 0.0008108131005428731 2023-01-22 18:45:49.547323: step: 1428/530, loss: 0.0012629760894924402 2023-01-22 18:45:50.650550: step: 1432/530, loss: 0.005576068535447121 2023-01-22 18:45:51.758524: step: 1436/530, loss: 0.015617192722856998 2023-01-22 18:45:52.842402: step: 1440/530, loss: 0.00028293757350184023 2023-01-22 18:45:53.932056: step: 1444/530, loss: 0.007297741714864969 2023-01-22 18:45:55.033595: step: 1448/530, loss: 0.0019038491882383823 2023-01-22 18:45:56.144053: step: 1452/530, loss: 0.0021815032232552767 2023-01-22 18:45:57.254404: step: 1456/530, loss: 0.0028231716714799404 2023-01-22 18:45:58.379205: step: 1460/530, loss: 0.0028600329533219337 2023-01-22 18:45:59.462502: step: 1464/530, loss: 0.0017172808293253183 2023-01-22 18:46:00.564539: step: 1468/530, loss: 0.002904909197241068 2023-01-22 18:46:01.661641: step: 1472/530, loss: 0.006400510668754578 2023-01-22 18:46:02.752360: step: 1476/530, loss: 0.005666607525199652 2023-01-22 18:46:03.853658: step: 1480/530, loss: 0.013713116757571697 2023-01-22 18:46:04.943590: step: 1484/530, loss: 0.005708231590688229 2023-01-22 18:46:06.047411: step: 1488/530, loss: 0.005585353821516037 2023-01-22 18:46:07.147895: step: 1492/530, loss: 0.00759673397988081 2023-01-22 18:46:08.247725: step: 1496/530, loss: 0.003911247942596674 2023-01-22 18:46:09.339141: step: 1500/530, loss: 0.0010523127857595682 2023-01-22 18:46:10.415717: step: 1504/530, loss: 0.005459906999021769 2023-01-22 18:46:11.528344: step: 1508/530, loss: 0.0017450046725571156 2023-01-22 18:46:12.647615: step: 1512/530, loss: 0.004098229110240936 2023-01-22 18:46:13.761164: step: 1516/530, loss: 0.009447664953768253 2023-01-22 18:46:14.849634: step: 1520/530, loss: 0.0018781708786264062 2023-01-22 18:46:15.967887: step: 1524/530, loss: 0.003473359625786543 2023-01-22 18:46:17.115164: step: 1528/530, loss: 0.01289084181189537 2023-01-22 18:46:18.206097: step: 1532/530, loss: 0.0019815952982753515 2023-01-22 18:46:19.317935: step: 1536/530, loss: 0.003952621947973967 2023-01-22 18:46:20.415327: step: 1540/530, loss: 0.027720943093299866 2023-01-22 18:46:21.498901: step: 1544/530, loss: 0.0006244656979106367 2023-01-22 18:46:22.584535: step: 1548/530, loss: 0.0027780826203525066 2023-01-22 18:46:23.685672: step: 1552/530, loss: 0.014304236508905888 2023-01-22 18:46:24.789569: step: 1556/530, loss: 0.005743764340877533 2023-01-22 18:46:25.893109: step: 1560/530, loss: 0.004498668015003204 2023-01-22 18:46:27.002206: step: 1564/530, loss: 0.0001885459787445143 2023-01-22 18:46:28.103434: step: 1568/530, loss: 0.03931552171707153 2023-01-22 18:46:29.213421: step: 1572/530, loss: 0.0117438193410635 2023-01-22 18:46:30.306043: step: 1576/530, loss: 0.008759861811995506 2023-01-22 18:46:31.391955: step: 1580/530, loss: 0.004414891358464956 2023-01-22 18:46:32.494977: step: 1584/530, loss: 0.015773741528391838 2023-01-22 18:46:33.627898: step: 1588/530, loss: 0.014878548681735992 2023-01-22 18:46:34.725656: step: 1592/530, loss: 0.022531064227223396 2023-01-22 18:46:35.827101: step: 1596/530, loss: 0.00883167702704668 2023-01-22 18:46:36.938096: step: 1600/530, loss: 0.0033920041751116514 2023-01-22 18:46:38.039969: step: 1604/530, loss: 0.0026087721344083548 2023-01-22 18:46:39.123325: step: 1608/530, loss: 0.013353990390896797 2023-01-22 18:46:40.196831: step: 1612/530, loss: 0.009016508236527443 2023-01-22 18:46:41.300372: step: 1616/530, loss: 0.01207042671740055 2023-01-22 18:46:42.446140: step: 1620/530, loss: 0.007473519071936607 2023-01-22 18:46:43.541534: step: 1624/530, loss: 0.00028923607897013426 2023-01-22 18:46:44.648672: step: 1628/530, loss: 0.008898764848709106 2023-01-22 18:46:45.724114: step: 1632/530, loss: 0.005579464137554169 2023-01-22 18:46:46.854324: step: 1636/530, loss: 0.003116974839940667 2023-01-22 18:46:47.948690: step: 1640/530, loss: 0.000852027500513941 2023-01-22 18:46:49.044588: step: 1644/530, loss: 0.0015090826200321317 2023-01-22 18:46:50.168033: step: 1648/530, loss: 0.001047214725986123 2023-01-22 18:46:51.269775: step: 1652/530, loss: 0.004282757639884949 2023-01-22 18:46:52.351306: step: 1656/530, loss: 0.0025495090521872044 2023-01-22 18:46:53.460706: step: 1660/530, loss: 0.00820249319076538 2023-01-22 18:46:54.558447: step: 1664/530, loss: 0.0005332635482773185 2023-01-22 18:46:55.659460: step: 1668/530, loss: 0.0013903120998293161 2023-01-22 18:46:56.759860: step: 1672/530, loss: 0.007464383263140917 2023-01-22 18:46:57.889399: step: 1676/530, loss: 0.007312059868127108 2023-01-22 18:46:59.016439: step: 1680/530, loss: 0.006925118621438742 2023-01-22 18:47:00.109754: step: 1684/530, loss: 0.00024333904730156064 2023-01-22 18:47:01.216882: step: 1688/530, loss: 0.0006623081862926483 2023-01-22 18:47:02.306631: step: 1692/530, loss: 0.00014406631817109883 2023-01-22 18:47:03.406282: step: 1696/530, loss: 0.005367347039282322 2023-01-22 18:47:04.499706: step: 1700/530, loss: 0.01579924114048481 2023-01-22 18:47:05.604818: step: 1704/530, loss: 0.0027582456823438406 2023-01-22 18:47:06.734579: step: 1708/530, loss: 0.027939584106206894 2023-01-22 18:47:07.830939: step: 1712/530, loss: 0.0029140375554561615 2023-01-22 18:47:08.931004: step: 1716/530, loss: 0.0007726530893705785 2023-01-22 18:47:10.019211: step: 1720/530, loss: 0.008381947875022888 2023-01-22 18:47:11.115548: step: 1724/530, loss: 0.005194207187741995 2023-01-22 18:47:12.227621: step: 1728/530, loss: 2.8067463063052855e-05 2023-01-22 18:47:13.340590: step: 1732/530, loss: 0.004748601000756025 2023-01-22 18:47:14.444602: step: 1736/530, loss: 0.004202454816550016 2023-01-22 18:47:15.539729: step: 1740/530, loss: 0.005364618264138699 2023-01-22 18:47:16.647322: step: 1744/530, loss: 0.0045860521495342255 2023-01-22 18:47:17.737583: step: 1748/530, loss: 0.0003562755009625107 2023-01-22 18:47:18.829900: step: 1752/530, loss: 0.002667174907401204 2023-01-22 18:47:19.938342: step: 1756/530, loss: 0.017062919214367867 2023-01-22 18:47:21.031850: step: 1760/530, loss: 0.0016122220549732447 2023-01-22 18:47:22.130250: step: 1764/530, loss: 0.0038395128212869167 2023-01-22 18:47:23.219998: step: 1768/530, loss: 0.0067592100240290165 2023-01-22 18:47:24.297279: step: 1772/530, loss: 0.005635429173707962 2023-01-22 18:47:25.398916: step: 1776/530, loss: 0.0037499871104955673 2023-01-22 18:47:26.517132: step: 1780/530, loss: 0.009561735205352306 2023-01-22 18:47:27.616713: step: 1784/530, loss: 0.009552452713251114 2023-01-22 18:47:28.709344: step: 1788/530, loss: 0.0048697213642299175 2023-01-22 18:47:29.802546: step: 1792/530, loss: 0.005792495794594288 2023-01-22 18:47:30.900197: step: 1796/530, loss: 0.001262329868040979 2023-01-22 18:47:32.036557: step: 1800/530, loss: 0.008863368071615696 2023-01-22 18:47:33.138583: step: 1804/530, loss: 0.0012546515790745616 2023-01-22 18:47:34.241487: step: 1808/530, loss: 0.0063784136436879635 2023-01-22 18:47:35.357293: step: 1812/530, loss: 0.00655109528452158 2023-01-22 18:47:36.459335: step: 1816/530, loss: 0.005710633937269449 2023-01-22 18:47:37.555340: step: 1820/530, loss: 0.0023225401528179646 2023-01-22 18:47:38.654760: step: 1824/530, loss: 0.002122816164046526 2023-01-22 18:47:39.787150: step: 1828/530, loss: 0.012034503743052483 2023-01-22 18:47:40.890276: step: 1832/530, loss: 0.005654426291584969 2023-01-22 18:47:42.023118: step: 1836/530, loss: 0.05996264889836311 2023-01-22 18:47:43.117215: step: 1840/530, loss: 0.0023963332641869783 2023-01-22 18:47:44.227981: step: 1844/530, loss: 0.004057222977280617 2023-01-22 18:47:45.319529: step: 1848/530, loss: 0.004797052592039108 2023-01-22 18:47:46.438592: step: 1852/530, loss: 0.018800226971507072 2023-01-22 18:47:47.525977: step: 1856/530, loss: 0.012684672139585018 2023-01-22 18:47:48.620557: step: 1860/530, loss: 0.005445479415357113 2023-01-22 18:47:49.735390: step: 1864/530, loss: 0.006310692522674799 2023-01-22 18:47:50.831948: step: 1868/530, loss: 0.0058257682248950005 2023-01-22 18:47:51.922011: step: 1872/530, loss: 0.007973291911184788 2023-01-22 18:47:53.028320: step: 1876/530, loss: 0.00021161425684113055 2023-01-22 18:47:54.132046: step: 1880/530, loss: 0.003784623695537448 2023-01-22 18:47:55.231498: step: 1884/530, loss: 0.003617755603045225 2023-01-22 18:47:56.320594: step: 1888/530, loss: 0.005014495924115181 2023-01-22 18:47:57.428472: step: 1892/530, loss: 0.007986443117260933 2023-01-22 18:47:58.532219: step: 1896/530, loss: 0.0638704001903534 2023-01-22 18:47:59.646919: step: 1900/530, loss: 0.01315513625741005 2023-01-22 18:48:00.739871: step: 1904/530, loss: 0.003585227532312274 2023-01-22 18:48:01.848595: step: 1908/530, loss: 0.010146183893084526 2023-01-22 18:48:02.924890: step: 1912/530, loss: 0.0002532742510084063 2023-01-22 18:48:04.015697: step: 1916/530, loss: 0.008187280967831612 2023-01-22 18:48:05.145122: step: 1920/530, loss: 0.004738227464258671 2023-01-22 18:48:06.243016: step: 1924/530, loss: 0.0065395706333220005 2023-01-22 18:48:07.354813: step: 1928/530, loss: 0.002547272713854909 2023-01-22 18:48:08.452686: step: 1932/530, loss: 0.03828773647546768 2023-01-22 18:48:09.549771: step: 1936/530, loss: 0.026910273358225822 2023-01-22 18:48:10.638199: step: 1940/530, loss: 0.016570253297686577 2023-01-22 18:48:11.741100: step: 1944/530, loss: 0.0017694535199552774 2023-01-22 18:48:12.862669: step: 1948/530, loss: 0.0058820126578211784 2023-01-22 18:48:13.981837: step: 1952/530, loss: 0.0047866362147033215 2023-01-22 18:48:15.068186: step: 1956/530, loss: 0.0031540365889668465 2023-01-22 18:48:16.179958: step: 1960/530, loss: 0.009054695256054401 2023-01-22 18:48:17.276903: step: 1964/530, loss: 0.00031283817952498794 2023-01-22 18:48:18.360684: step: 1968/530, loss: 0.011626465246081352 2023-01-22 18:48:19.465110: step: 1972/530, loss: 0.004292723257094622 2023-01-22 18:48:20.565934: step: 1976/530, loss: 0.0026255559641867876 2023-01-22 18:48:21.710040: step: 1980/530, loss: 0.014015048742294312 2023-01-22 18:48:22.831868: step: 1984/530, loss: 0.01889391802251339 2023-01-22 18:48:23.941744: step: 1988/530, loss: 0.0008177540730684996 2023-01-22 18:48:25.031863: step: 1992/530, loss: 0.0025048761162906885 2023-01-22 18:48:26.138882: step: 1996/530, loss: 0.006152528803795576 2023-01-22 18:48:27.251485: step: 2000/530, loss: 0.02581629902124405 2023-01-22 18:48:28.369112: step: 2004/530, loss: 0.0019788651261478662 2023-01-22 18:48:29.471012: step: 2008/530, loss: 0.004808387719094753 2023-01-22 18:48:30.571677: step: 2012/530, loss: 0.0006217002519406378 2023-01-22 18:48:31.670817: step: 2016/530, loss: 0.01565537042915821 2023-01-22 18:48:32.788093: step: 2020/530, loss: 0.004735218361020088 2023-01-22 18:48:33.870443: step: 2024/530, loss: 0.0012645252281799912 2023-01-22 18:48:34.964792: step: 2028/530, loss: 0.004584374371916056 2023-01-22 18:48:36.069446: step: 2032/530, loss: 0.011293581686913967 2023-01-22 18:48:37.159312: step: 2036/530, loss: 0.004231262020766735 2023-01-22 18:48:38.242719: step: 2040/530, loss: 0.007557030767202377 2023-01-22 18:48:39.351873: step: 2044/530, loss: 0.0001206692832056433 2023-01-22 18:48:40.427734: step: 2048/530, loss: 0.006060923915356398 2023-01-22 18:48:41.522396: step: 2052/530, loss: 0.020609134808182716 2023-01-22 18:48:42.635522: step: 2056/530, loss: 0.011785211972892284 2023-01-22 18:48:43.763800: step: 2060/530, loss: 0.000952857022639364 2023-01-22 18:48:44.848610: step: 2064/530, loss: 0.0046133059076964855 2023-01-22 18:48:45.953315: step: 2068/530, loss: 0.0043978020548820496 2023-01-22 18:48:47.065665: step: 2072/530, loss: 0.00933991838246584 2023-01-22 18:48:48.172221: step: 2076/530, loss: 0.004743628203868866 2023-01-22 18:48:49.278251: step: 2080/530, loss: 0.18316756188869476 2023-01-22 18:48:50.358890: step: 2084/530, loss: 0.009476578794419765 2023-01-22 18:48:51.462314: step: 2088/530, loss: 0.011847156099975109 2023-01-22 18:48:52.541217: step: 2092/530, loss: 0.006440174765884876 2023-01-22 18:48:53.652687: step: 2096/530, loss: 0.010593869723379612 2023-01-22 18:48:54.736416: step: 2100/530, loss: 0.0010112167801707983 2023-01-22 18:48:55.820383: step: 2104/530, loss: 0.0010628459276631474 2023-01-22 18:48:56.911803: step: 2108/530, loss: 0.004539801739156246 2023-01-22 18:48:58.041820: step: 2112/530, loss: 0.008094402961432934 2023-01-22 18:48:59.133075: step: 2116/530, loss: 0.002351432805880904 2023-01-22 18:49:00.201883: step: 2120/530, loss: 0.011183440685272217 ================================================== Loss: 0.008 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3407029220779221, 'r': 0.3555723095689889, 'f1': 0.3479788433479241}, 'combined': 0.25640546351952304, 'stategy': 1, 'epoch': 8} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3306613475177803, 'r': 0.2806206094661281, 'f1': 0.3035927620869508}, 'combined': 0.18854708382242208, 'stategy': 1, 'epoch': 8} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34964647290162165, 'r': 0.3403579517998708, 'f1': 0.34493969345871517}, 'combined': 0.254166089916948, 'stategy': 1, 'epoch': 8} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.32111883150957476, 'r': 0.28586246128448795, 'f1': 0.30246671727746444}, 'combined': 0.18784775073021476, 'stategy': 1, 'epoch': 8} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34106308060570584, 'r': 0.32423643905779626, 'f1': 0.3324369715631491}, 'combined': 0.24495355799389934, 'stategy': 1, 'epoch': 8} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3473118877755518, 'r': 0.29314083321628503, 'f1': 0.317935400479761}, 'combined': 0.1974546171400621, 'stategy': 1, 'epoch': 8} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 8} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3870967741935484, 'r': 0.5217391304347826, 'f1': 0.4444444444444444}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 8} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5208333333333334, 'r': 0.3232758620689655, 'f1': 0.39893617021276595}, 'combined': 0.26595744680851063, 'stategy': 1, 'epoch': 8} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 9 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 18:51:31.178266: step: 4/530, loss: 0.012852641753852367 2023-01-22 18:51:32.277239: step: 8/530, loss: 0.002417398849502206 2023-01-22 18:51:33.350246: step: 12/530, loss: 0.0011995211243629456 2023-01-22 18:51:34.471384: step: 16/530, loss: 0.0010039876215159893 2023-01-22 18:51:35.568990: step: 20/530, loss: 0.00017232468235306442 2023-01-22 18:51:36.672771: step: 24/530, loss: 0.007264132145792246 2023-01-22 18:51:37.746885: step: 28/530, loss: 0.0036720209755003452 2023-01-22 18:51:38.831161: step: 32/530, loss: 0.0048157824203372 2023-01-22 18:51:39.908627: step: 36/530, loss: 0.0034320226404815912 2023-01-22 18:51:41.005085: step: 40/530, loss: 0.003279099939391017 2023-01-22 18:51:42.129880: step: 44/530, loss: 0.0028031456749886274 2023-01-22 18:51:43.227496: step: 48/530, loss: 0.002326064743101597 2023-01-22 18:51:44.329397: step: 52/530, loss: 0.008965677581727505 2023-01-22 18:51:45.409393: step: 56/530, loss: 0.010192080400884151 2023-01-22 18:51:46.507514: step: 60/530, loss: 0.0023942210245877504 2023-01-22 18:51:47.604544: step: 64/530, loss: 0.007135374005883932 2023-01-22 18:51:48.698027: step: 68/530, loss: 4.353479380370118e-05 2023-01-22 18:51:49.803498: step: 72/530, loss: 0.0021611973643302917 2023-01-22 18:51:50.887634: step: 76/530, loss: 0.004792075138539076 2023-01-22 18:51:51.984254: step: 80/530, loss: 0.01676429808139801 2023-01-22 18:51:53.055080: step: 84/530, loss: 0.005350546911358833 2023-01-22 18:51:54.183308: step: 88/530, loss: 0.006298549007624388 2023-01-22 18:51:55.283435: step: 92/530, loss: 0.0003452624077908695 2023-01-22 18:51:56.381208: step: 96/530, loss: 0.0034581469371914864 2023-01-22 18:51:57.482950: step: 100/530, loss: 0.0016276293899863958 2023-01-22 18:51:58.592081: step: 104/530, loss: 0.00324163306504488 2023-01-22 18:51:59.696169: step: 108/530, loss: 0.0009973623091354966 2023-01-22 18:52:00.773865: step: 112/530, loss: 0.0018076226115226746 2023-01-22 18:52:01.855757: step: 116/530, loss: 0.006380291655659676 2023-01-22 18:52:02.952198: step: 120/530, loss: 0.0030232977587729692 2023-01-22 18:52:04.039202: step: 124/530, loss: 0.006191682536154985 2023-01-22 18:52:05.131451: step: 128/530, loss: 0.009679173119366169 2023-01-22 18:52:06.255522: step: 132/530, loss: 0.0016814138507470489 2023-01-22 18:52:07.353932: step: 136/530, loss: 0.000629706250037998 2023-01-22 18:52:08.483732: step: 140/530, loss: 0.006482336670160294 2023-01-22 18:52:09.576890: step: 144/530, loss: 0.003738175146281719 2023-01-22 18:52:10.654726: step: 148/530, loss: 0.0007629310712218285 2023-01-22 18:52:11.755481: step: 152/530, loss: 0.0030066377948969603 2023-01-22 18:52:12.877221: step: 156/530, loss: 0.0031846221536397934 2023-01-22 18:52:13.987818: step: 160/530, loss: 0.004700453020632267 2023-01-22 18:52:15.083742: step: 164/530, loss: 0.0013999439543113112 2023-01-22 18:52:16.187301: step: 168/530, loss: 0.03358696028590202 2023-01-22 18:52:17.298219: step: 172/530, loss: 0.008787048980593681 2023-01-22 18:52:18.399656: step: 176/530, loss: 0.004170938394963741 2023-01-22 18:52:19.502014: step: 180/530, loss: 0.002950782887637615 2023-01-22 18:52:20.586369: step: 184/530, loss: 0.0009335349895991385 2023-01-22 18:52:21.705598: step: 188/530, loss: 0.018743734806776047 2023-01-22 18:52:22.793204: step: 192/530, loss: 0.006596866529434919 2023-01-22 18:52:23.878715: step: 196/530, loss: 0.006678693927824497 2023-01-22 18:52:24.964158: step: 200/530, loss: 0.0031592408195137978 2023-01-22 18:52:26.070053: step: 204/530, loss: 0.002463296055793762 2023-01-22 18:52:27.173530: step: 208/530, loss: 0.003427669405937195 2023-01-22 18:52:28.266997: step: 212/530, loss: 0.011702906340360641 2023-01-22 18:52:29.395092: step: 216/530, loss: 0.008907417766749859 2023-01-22 18:52:30.494498: step: 220/530, loss: 0.008853808045387268 2023-01-22 18:52:31.602116: step: 224/530, loss: 0.010829031467437744 2023-01-22 18:52:32.701658: step: 228/530, loss: 0.0035358441527932882 2023-01-22 18:52:33.826493: step: 232/530, loss: 0.018984684720635414 2023-01-22 18:52:34.917913: step: 236/530, loss: 0.0011065416038036346 2023-01-22 18:52:36.018196: step: 240/530, loss: 0.0008059915853664279 2023-01-22 18:52:37.128501: step: 244/530, loss: 0.0029619589913636446 2023-01-22 18:52:38.236918: step: 248/530, loss: 0.004144147504121065 2023-01-22 18:52:39.334232: step: 252/530, loss: 0.00027097263955511153 2023-01-22 18:52:40.436252: step: 256/530, loss: 0.028288258239626884 2023-01-22 18:52:41.555768: step: 260/530, loss: 0.004978305194526911 2023-01-22 18:52:42.672123: step: 264/530, loss: 0.009526673704385757 2023-01-22 18:52:43.745506: step: 268/530, loss: 0.0008316404419019818 2023-01-22 18:52:44.883240: step: 272/530, loss: 0.0075862654484808445 2023-01-22 18:52:45.974146: step: 276/530, loss: 0.012735490687191486 2023-01-22 18:52:47.053075: step: 280/530, loss: 0.0005930901970714331 2023-01-22 18:52:48.154487: step: 284/530, loss: 0.008498327806591988 2023-01-22 18:52:49.261842: step: 288/530, loss: 0.003878409741446376 2023-01-22 18:52:50.402888: step: 292/530, loss: 0.002927615772932768 2023-01-22 18:52:51.521755: step: 296/530, loss: 0.006158793810755014 2023-01-22 18:52:52.647528: step: 300/530, loss: 0.006205850280821323 2023-01-22 18:52:53.734528: step: 304/530, loss: 0.009309251792728901 2023-01-22 18:52:54.829952: step: 308/530, loss: 0.009339329786598682 2023-01-22 18:52:55.921117: step: 312/530, loss: 0.004272827412933111 2023-01-22 18:52:57.017118: step: 316/530, loss: 0.0005239882739260793 2023-01-22 18:52:58.160506: step: 320/530, loss: 0.0031910634133964777 2023-01-22 18:52:59.261381: step: 324/530, loss: 0.0017521815607324243 2023-01-22 18:53:00.343900: step: 328/530, loss: 0.0010132597526535392 2023-01-22 18:53:01.457932: step: 332/530, loss: 0.002245164243504405 2023-01-22 18:53:02.568895: step: 336/530, loss: 0.001676232204772532 2023-01-22 18:53:03.656678: step: 340/530, loss: 0.0036706961691379547 2023-01-22 18:53:04.758133: step: 344/530, loss: 0.003087942488491535 2023-01-22 18:53:05.851787: step: 348/530, loss: 0.006789413746446371 2023-01-22 18:53:06.938999: step: 352/530, loss: 0.0005472687189467251 2023-01-22 18:53:08.047988: step: 356/530, loss: 0.005121403839439154 2023-01-22 18:53:09.170165: step: 360/530, loss: 0.0042812940664589405 2023-01-22 18:53:10.253332: step: 364/530, loss: 0.003609717357903719 2023-01-22 18:53:11.379388: step: 368/530, loss: 0.0018349169986322522 2023-01-22 18:53:12.492406: step: 372/530, loss: 0.014606616459786892 2023-01-22 18:53:13.576500: step: 376/530, loss: 0.0020804009400308132 2023-01-22 18:53:14.686739: step: 380/530, loss: 0.0035718935541808605 2023-01-22 18:53:15.790935: step: 384/530, loss: 0.006819744128733873 2023-01-22 18:53:16.906885: step: 388/530, loss: 0.00019025173969566822 2023-01-22 18:53:18.008812: step: 392/530, loss: 0.008957646787166595 2023-01-22 18:53:19.093748: step: 396/530, loss: 0.0007106844568625093 2023-01-22 18:53:20.214464: step: 400/530, loss: 0.008181637153029442 2023-01-22 18:53:21.336075: step: 404/530, loss: 0.0022422587499022484 2023-01-22 18:53:22.439934: step: 408/530, loss: 0.008068078197538853 2023-01-22 18:53:23.541203: step: 412/530, loss: 0.004556990694254637 2023-01-22 18:53:24.660055: step: 416/530, loss: 0.0008272951235994697 2023-01-22 18:53:25.741954: step: 420/530, loss: 0.006012100726366043 2023-01-22 18:53:26.821603: step: 424/530, loss: 0.001314446097239852 2023-01-22 18:53:27.924337: step: 428/530, loss: 0.0052610342390835285 2023-01-22 18:53:29.018721: step: 432/530, loss: 0.0009571047849021852 2023-01-22 18:53:30.104863: step: 436/530, loss: 0.0076738083735108376 2023-01-22 18:53:31.191042: step: 440/530, loss: 0.0029224767349660397 2023-01-22 18:53:32.318555: step: 444/530, loss: 0.02174765057861805 2023-01-22 18:53:33.411239: step: 448/530, loss: 0.0008959988481365144 2023-01-22 18:53:34.523161: step: 452/530, loss: 0.015675559639930725 2023-01-22 18:53:35.639524: step: 456/530, loss: 0.008674388751387596 2023-01-22 18:53:36.756315: step: 460/530, loss: 0.01830499991774559 2023-01-22 18:53:37.858222: step: 464/530, loss: 0.0009909734362736344 2023-01-22 18:53:38.936708: step: 468/530, loss: 0.0015118962619453669 2023-01-22 18:53:40.041367: step: 472/530, loss: 0.007263553328812122 2023-01-22 18:53:41.160881: step: 476/530, loss: 0.0 2023-01-22 18:53:42.287468: step: 480/530, loss: 0.0020446141716092825 2023-01-22 18:53:43.409639: step: 484/530, loss: 0.02304811030626297 2023-01-22 18:53:44.519850: step: 488/530, loss: 0.005052995402365923 2023-01-22 18:53:45.613798: step: 492/530, loss: 0.0004195969959255308 2023-01-22 18:53:46.723596: step: 496/530, loss: 0.06983699649572372 2023-01-22 18:53:47.820431: step: 500/530, loss: 0.0017783496296033263 2023-01-22 18:53:48.930380: step: 504/530, loss: 0.0007300215656869113 2023-01-22 18:53:50.046300: step: 508/530, loss: 0.005889096297323704 2023-01-22 18:53:51.166106: step: 512/530, loss: 0.011448380537331104 2023-01-22 18:53:52.260578: step: 516/530, loss: 1.6626150681986474e-05 2023-01-22 18:53:53.354413: step: 520/530, loss: 0.0055013555102050304 2023-01-22 18:53:54.473049: step: 524/530, loss: 0.005656551104038954 2023-01-22 18:53:55.593888: step: 528/530, loss: 0.00023554236395284534 2023-01-22 18:53:56.691304: step: 532/530, loss: 0.005936426110565662 2023-01-22 18:53:57.807206: step: 536/530, loss: 0.005324170924723148 2023-01-22 18:53:58.907712: step: 540/530, loss: 0.005824314896017313 2023-01-22 18:54:00.005022: step: 544/530, loss: 0.0023509550374001265 2023-01-22 18:54:01.097554: step: 548/530, loss: 0.030468204990029335 2023-01-22 18:54:02.190926: step: 552/530, loss: 0.0035597807727754116 2023-01-22 18:54:03.286938: step: 556/530, loss: 0.010581757873296738 2023-01-22 18:54:04.363901: step: 560/530, loss: 0.010156725533306599 2023-01-22 18:54:05.459595: step: 564/530, loss: 0.0016914489679038525 2023-01-22 18:54:06.543037: step: 568/530, loss: 0.0007650958141312003 2023-01-22 18:54:07.633705: step: 572/530, loss: 0.0035633896477520466 2023-01-22 18:54:08.725907: step: 576/530, loss: 0.0007015399751253426 2023-01-22 18:54:09.808725: step: 580/530, loss: 0.0006578704342246056 2023-01-22 18:54:10.895895: step: 584/530, loss: 0.005710997153073549 2023-01-22 18:54:12.003102: step: 588/530, loss: 0.009510494768619537 2023-01-22 18:54:13.103969: step: 592/530, loss: 0.028136061504483223 2023-01-22 18:54:14.215587: step: 596/530, loss: 0.014152660965919495 2023-01-22 18:54:15.318381: step: 600/530, loss: 0.008041109889745712 2023-01-22 18:54:16.414760: step: 604/530, loss: 0.0031933574937283993 2023-01-22 18:54:17.517391: step: 608/530, loss: 0.0004951993469148874 2023-01-22 18:54:18.653325: step: 612/530, loss: 0.007825084961950779 2023-01-22 18:54:19.758862: step: 616/530, loss: 0.0038491194136440754 2023-01-22 18:54:20.851473: step: 620/530, loss: 0.0062204692512750626 2023-01-22 18:54:21.947860: step: 624/530, loss: 0.0022343993186950684 2023-01-22 18:54:23.041900: step: 628/530, loss: 0.0030720075592398643 2023-01-22 18:54:24.147857: step: 632/530, loss: 0.005884266458451748 2023-01-22 18:54:25.247635: step: 636/530, loss: 0.003556633833795786 2023-01-22 18:54:26.358217: step: 640/530, loss: 0.004114823415875435 2023-01-22 18:54:27.459816: step: 644/530, loss: 0.011077985167503357 2023-01-22 18:54:28.550195: step: 648/530, loss: 0.00010280668357154354 2023-01-22 18:54:29.663642: step: 652/530, loss: 0.0008016469073481858 2023-01-22 18:54:30.770586: step: 656/530, loss: 0.005742603912949562 2023-01-22 18:54:31.882617: step: 660/530, loss: 0.008505282923579216 2023-01-22 18:54:32.995626: step: 664/530, loss: 0.00211735931225121 2023-01-22 18:54:34.091753: step: 668/530, loss: 0.0036868590395897627 2023-01-22 18:54:35.202959: step: 672/530, loss: 0.033049263060092926 2023-01-22 18:54:36.312432: step: 676/530, loss: 0.0032268972136080265 2023-01-22 18:54:37.399403: step: 680/530, loss: 0.0022875515278428793 2023-01-22 18:54:38.477801: step: 684/530, loss: 0.0013293405063450336 2023-01-22 18:54:39.582456: step: 688/530, loss: 0.006347678601741791 2023-01-22 18:54:40.689426: step: 692/530, loss: 0.007853042334318161 2023-01-22 18:54:41.796357: step: 696/530, loss: 0.0017268542433157563 2023-01-22 18:54:42.912887: step: 700/530, loss: 0.006198188289999962 2023-01-22 18:54:44.007892: step: 704/530, loss: 0.010438612662255764 2023-01-22 18:54:45.090303: step: 708/530, loss: 0.00693716062232852 2023-01-22 18:54:46.191784: step: 712/530, loss: 0.0028866783250123262 2023-01-22 18:54:47.286760: step: 716/530, loss: 0.00014014098269399256 2023-01-22 18:54:48.388976: step: 720/530, loss: 0.013577362522482872 2023-01-22 18:54:49.479889: step: 724/530, loss: 5.0817641749745235e-05 2023-01-22 18:54:50.586596: step: 728/530, loss: 0.00023314656573347747 2023-01-22 18:54:51.682031: step: 732/530, loss: 0.001911955769173801 2023-01-22 18:54:52.781223: step: 736/530, loss: 0.012397710233926773 2023-01-22 18:54:53.882276: step: 740/530, loss: 0.005772104486823082 2023-01-22 18:54:54.983325: step: 744/530, loss: 0.001831976929679513 2023-01-22 18:54:56.073727: step: 748/530, loss: 0.013668297789990902 2023-01-22 18:54:57.195412: step: 752/530, loss: 0.008609876036643982 2023-01-22 18:54:58.303843: step: 756/530, loss: 0.013752492144703865 2023-01-22 18:54:59.414339: step: 760/530, loss: 0.004622215870767832 2023-01-22 18:55:00.508163: step: 764/530, loss: 0.009318478405475616 2023-01-22 18:55:01.599715: step: 768/530, loss: 0.0001981892273761332 2023-01-22 18:55:02.679524: step: 772/530, loss: 0.005856137257069349 2023-01-22 18:55:03.796532: step: 776/530, loss: 0.0010913341538980603 2023-01-22 18:55:04.882054: step: 780/530, loss: 0.007248550653457642 2023-01-22 18:55:05.974503: step: 784/530, loss: 0.0026998359244316816 2023-01-22 18:55:07.071625: step: 788/530, loss: 0.00705366488546133 2023-01-22 18:55:08.164045: step: 792/530, loss: 0.00720044132322073 2023-01-22 18:55:09.267816: step: 796/530, loss: 0.0012210009153932333 2023-01-22 18:55:10.373006: step: 800/530, loss: 0.002764006843790412 2023-01-22 18:55:11.467636: step: 804/530, loss: 0.00411082711070776 2023-01-22 18:55:12.546412: step: 808/530, loss: 0.006338645238429308 2023-01-22 18:55:13.643194: step: 812/530, loss: 0.001269435859285295 2023-01-22 18:55:14.760903: step: 816/530, loss: 0.010235443711280823 2023-01-22 18:55:15.871682: step: 820/530, loss: 0.0014181012520566583 2023-01-22 18:55:16.978334: step: 824/530, loss: 0.0034648084547370672 2023-01-22 18:55:18.115643: step: 828/530, loss: 0.0005349619896151125 2023-01-22 18:55:19.208978: step: 832/530, loss: 0.025860896334052086 2023-01-22 18:55:20.298579: step: 836/530, loss: 0.009158861823379993 2023-01-22 18:55:21.399818: step: 840/530, loss: 0.012786809355020523 2023-01-22 18:55:22.499777: step: 844/530, loss: 0.0050424253568053246 2023-01-22 18:55:23.586560: step: 848/530, loss: 0.0037137819454073906 2023-01-22 18:55:24.682778: step: 852/530, loss: 0.006844476331025362 2023-01-22 18:55:25.776930: step: 856/530, loss: 0.003874870715662837 2023-01-22 18:55:26.875816: step: 860/530, loss: 0.0028753934893757105 2023-01-22 18:55:27.963742: step: 864/530, loss: 0.0017035690834745765 2023-01-22 18:55:29.048348: step: 868/530, loss: 0.0001334802946075797 2023-01-22 18:55:30.177732: step: 872/530, loss: 0.014125794172286987 2023-01-22 18:55:31.278814: step: 876/530, loss: 0.023393521085381508 2023-01-22 18:55:32.340955: step: 880/530, loss: 0.0006625691312365234 2023-01-22 18:55:33.430251: step: 884/530, loss: 0.012671408243477345 2023-01-22 18:55:34.531744: step: 888/530, loss: 0.002146540442481637 2023-01-22 18:55:35.611868: step: 892/530, loss: 0.007133450359106064 2023-01-22 18:55:36.690857: step: 896/530, loss: 0.004140970762819052 2023-01-22 18:55:37.800314: step: 900/530, loss: 0.0025890804827213287 2023-01-22 18:55:38.899369: step: 904/530, loss: 0.00036826045834459364 2023-01-22 18:55:39.983892: step: 908/530, loss: 0.0014974417863413692 2023-01-22 18:55:41.066985: step: 912/530, loss: 0.004251014441251755 2023-01-22 18:55:42.157217: step: 916/530, loss: 0.010467146523296833 2023-01-22 18:55:43.256482: step: 920/530, loss: 0.0064591895788908005 2023-01-22 18:55:44.380964: step: 924/530, loss: 0.005451238714158535 2023-01-22 18:55:45.504490: step: 928/530, loss: 0.0015243480447679758 2023-01-22 18:55:46.581949: step: 932/530, loss: 0.0034614023752510548 2023-01-22 18:55:47.672223: step: 936/530, loss: 0.00016352557577192783 2023-01-22 18:55:48.780388: step: 940/530, loss: 0.005220635328441858 2023-01-22 18:55:49.905035: step: 944/530, loss: 0.013248939998447895 2023-01-22 18:55:50.984825: step: 948/530, loss: 2.4616736027383013e-06 2023-01-22 18:55:52.093927: step: 952/530, loss: 0.008181281387805939 2023-01-22 18:55:53.184808: step: 956/530, loss: 0.0008815866895020008 2023-01-22 18:55:54.303002: step: 960/530, loss: 0.03313359245657921 2023-01-22 18:55:55.420646: step: 964/530, loss: 0.012474209070205688 2023-01-22 18:55:56.517941: step: 968/530, loss: 0.004883915651589632 2023-01-22 18:55:57.626760: step: 972/530, loss: 0.017077939584851265 2023-01-22 18:55:58.714105: step: 976/530, loss: 0.001611165120266378 2023-01-22 18:55:59.840369: step: 980/530, loss: 0.019696753472089767 2023-01-22 18:56:00.955568: step: 984/530, loss: 0.0008806691621430218 2023-01-22 18:56:02.049646: step: 988/530, loss: 0.012325761839747429 2023-01-22 18:56:03.162938: step: 992/530, loss: 0.009970033541321754 2023-01-22 18:56:04.273909: step: 996/530, loss: 0.0021491264924407005 2023-01-22 18:56:05.356937: step: 1000/530, loss: 0.0018775860080495477 2023-01-22 18:56:06.444123: step: 1004/530, loss: 0.010070179589092731 2023-01-22 18:56:07.550308: step: 1008/530, loss: 0.0173482745885849 2023-01-22 18:56:08.672288: step: 1012/530, loss: 0.004282968118786812 2023-01-22 18:56:09.770877: step: 1016/530, loss: 0.010686510242521763 2023-01-22 18:56:10.867456: step: 1020/530, loss: 0.015376301482319832 2023-01-22 18:56:11.968137: step: 1024/530, loss: 0.003207979490980506 2023-01-22 18:56:13.078440: step: 1028/530, loss: 0.004286313429474831 2023-01-22 18:56:14.165549: step: 1032/530, loss: 0.0025914551224559546 2023-01-22 18:56:15.270478: step: 1036/530, loss: 0.002869923133403063 2023-01-22 18:56:16.361275: step: 1040/530, loss: 0.0005609919899143279 2023-01-22 18:56:17.453478: step: 1044/530, loss: 0.007180202752351761 2023-01-22 18:56:18.557540: step: 1048/530, loss: 0.023522144183516502 2023-01-22 18:56:19.655633: step: 1052/530, loss: 0.004931448958814144 2023-01-22 18:56:20.773919: step: 1056/530, loss: 0.003753190627321601 2023-01-22 18:56:21.906130: step: 1060/530, loss: 0.04350333288311958 2023-01-22 18:56:23.030716: step: 1064/530, loss: 0.006681147031486034 2023-01-22 18:56:24.124739: step: 1068/530, loss: 0.013521349057555199 2023-01-22 18:56:25.222979: step: 1072/530, loss: 0.002822374925017357 2023-01-22 18:56:26.336494: step: 1076/530, loss: 0.002605520188808441 2023-01-22 18:56:27.435650: step: 1080/530, loss: 0.0033892544452100992 2023-01-22 18:56:28.536561: step: 1084/530, loss: 0.014805257320404053 2023-01-22 18:56:29.643566: step: 1088/530, loss: 0.003605550853535533 2023-01-22 18:56:30.744160: step: 1092/530, loss: 0.001872859662398696 2023-01-22 18:56:31.844521: step: 1096/530, loss: 0.01707622967660427 2023-01-22 18:56:32.950009: step: 1100/530, loss: 0.016445960849523544 2023-01-22 18:56:34.024833: step: 1104/530, loss: 0.002510062651708722 2023-01-22 18:56:35.127944: step: 1108/530, loss: 0.006677572149783373 2023-01-22 18:56:36.201365: step: 1112/530, loss: 0.006370050832629204 2023-01-22 18:56:37.339691: step: 1116/530, loss: 0.0012825154699385166 2023-01-22 18:56:38.437741: step: 1120/530, loss: 0.003444019006565213 2023-01-22 18:56:39.534126: step: 1124/530, loss: 0.025100549682974815 2023-01-22 18:56:40.633770: step: 1128/530, loss: 0.0029362936038523912 2023-01-22 18:56:41.734053: step: 1132/530, loss: 0.0027295027393847704 2023-01-22 18:56:42.823167: step: 1136/530, loss: 0.00018789245223160833 2023-01-22 18:56:43.923148: step: 1140/530, loss: 0.0003588128893170506 2023-01-22 18:56:44.989630: step: 1144/530, loss: 0.005856632255017757 2023-01-22 18:56:46.092371: step: 1148/530, loss: 0.020307840779423714 2023-01-22 18:56:47.196150: step: 1152/530, loss: 0.00271012750454247 2023-01-22 18:56:48.300120: step: 1156/530, loss: 0.010237624868750572 2023-01-22 18:56:49.390967: step: 1160/530, loss: 0.005984066519886255 2023-01-22 18:56:50.499287: step: 1164/530, loss: 0.004605032969266176 2023-01-22 18:56:51.567775: step: 1168/530, loss: 0.00023817337932996452 2023-01-22 18:56:52.684063: step: 1172/530, loss: 0.008438789285719395 2023-01-22 18:56:53.787959: step: 1176/530, loss: 0.0009418681729584932 2023-01-22 18:56:54.898454: step: 1180/530, loss: 0.00288075627759099 2023-01-22 18:56:55.981877: step: 1184/530, loss: 0.0006417831173166633 2023-01-22 18:56:57.097787: step: 1188/530, loss: 0.019675668329000473 2023-01-22 18:56:58.209781: step: 1192/530, loss: 0.0006893801037222147 2023-01-22 18:56:59.314818: step: 1196/530, loss: 0.00027176938601769507 2023-01-22 18:57:00.420811: step: 1200/530, loss: 0.0002283220674144104 2023-01-22 18:57:01.525570: step: 1204/530, loss: 0.0033687877003103495 2023-01-22 18:57:02.629830: step: 1208/530, loss: 0.0009588535176590085 2023-01-22 18:57:03.734141: step: 1212/530, loss: 0.007998911663889885 2023-01-22 18:57:04.811535: step: 1216/530, loss: 0.004501916468143463 2023-01-22 18:57:05.914794: step: 1220/530, loss: 0.0006718040094710886 2023-01-22 18:57:07.000638: step: 1224/530, loss: 0.04154327139258385 2023-01-22 18:57:08.101924: step: 1228/530, loss: 0.0036498745903372765 2023-01-22 18:57:09.187979: step: 1232/530, loss: 0.0016898217145353556 2023-01-22 18:57:10.280506: step: 1236/530, loss: 0.0019241824047639966 2023-01-22 18:57:11.382577: step: 1240/530, loss: 0.0027863839641213417 2023-01-22 18:57:12.480785: step: 1244/530, loss: 0.0050810822285711765 2023-01-22 18:57:13.614377: step: 1248/530, loss: 0.0037873501423746347 2023-01-22 18:57:14.726372: step: 1252/530, loss: 0.0018542238976806402 2023-01-22 18:57:15.816841: step: 1256/530, loss: 0.006123093888163567 2023-01-22 18:57:16.936870: step: 1260/530, loss: 0.002410774352028966 2023-01-22 18:57:18.039284: step: 1264/530, loss: 0.0034158991184085608 2023-01-22 18:57:19.138557: step: 1268/530, loss: 0.0017858152277767658 2023-01-22 18:57:20.256833: step: 1272/530, loss: 0.0061688050627708435 2023-01-22 18:57:21.348378: step: 1276/530, loss: 0.00449812738224864 2023-01-22 18:57:22.471532: step: 1280/530, loss: 0.0034192863386124372 2023-01-22 18:57:23.568859: step: 1284/530, loss: 0.0036674761213362217 2023-01-22 18:57:24.676817: step: 1288/530, loss: 0.011822589673101902 2023-01-22 18:57:25.803084: step: 1292/530, loss: 0.016700327396392822 2023-01-22 18:57:26.873742: step: 1296/530, loss: 0.0001120849046856165 2023-01-22 18:57:28.009307: step: 1300/530, loss: 0.005160850007086992 2023-01-22 18:57:29.106620: step: 1304/530, loss: 0.0035220228601247072 2023-01-22 18:57:30.197416: step: 1308/530, loss: 0.009390189312398434 2023-01-22 18:57:31.284318: step: 1312/530, loss: 0.001900652889162302 2023-01-22 18:57:32.403508: step: 1316/530, loss: 0.005975495558232069 2023-01-22 18:57:33.488350: step: 1320/530, loss: 0.00012547499500215054 2023-01-22 18:57:34.588557: step: 1324/530, loss: 0.007042139768600464 2023-01-22 18:57:35.696186: step: 1328/530, loss: 0.013127412647008896 2023-01-22 18:57:36.801861: step: 1332/530, loss: 0.0012310559395700693 2023-01-22 18:57:37.891878: step: 1336/530, loss: 0.00017637229757383466 2023-01-22 18:57:38.991701: step: 1340/530, loss: 0.0002910773328039795 2023-01-22 18:57:40.105713: step: 1344/530, loss: 0.050613563507795334 2023-01-22 18:57:41.189479: step: 1348/530, loss: 8.155624527717009e-05 2023-01-22 18:57:42.302476: step: 1352/530, loss: 0.003610956249758601 2023-01-22 18:57:43.409083: step: 1356/530, loss: 0.011948911473155022 2023-01-22 18:57:44.515176: step: 1360/530, loss: 0.006423926446586847 2023-01-22 18:57:45.623373: step: 1364/530, loss: 0.004793121479451656 2023-01-22 18:57:46.746233: step: 1368/530, loss: 0.027611060068011284 2023-01-22 18:57:47.849268: step: 1372/530, loss: 0.0010081022046506405 2023-01-22 18:57:48.958666: step: 1376/530, loss: 0.007629277650266886 2023-01-22 18:57:50.061087: step: 1380/530, loss: 4.365411768958438e-06 2023-01-22 18:57:51.166473: step: 1384/530, loss: 0.002638371894136071 2023-01-22 18:57:52.252639: step: 1388/530, loss: 0.015869446098804474 2023-01-22 18:57:53.379197: step: 1392/530, loss: 0.00021729881700593978 2023-01-22 18:57:54.488230: step: 1396/530, loss: 0.0028890392277389765 2023-01-22 18:57:55.578333: step: 1400/530, loss: 0.0009449466015212238 2023-01-22 18:57:56.696339: step: 1404/530, loss: 0.000890866038389504 2023-01-22 18:57:57.795334: step: 1408/530, loss: 0.02000340074300766 2023-01-22 18:57:58.893536: step: 1412/530, loss: 0.017198355868458748 2023-01-22 18:58:00.003185: step: 1416/530, loss: 0.0026251724921166897 2023-01-22 18:58:01.101171: step: 1420/530, loss: 0.011111374013125896 2023-01-22 18:58:02.176667: step: 1424/530, loss: 0.0008446262800134718 2023-01-22 18:58:03.294407: step: 1428/530, loss: 0.0004870123811997473 2023-01-22 18:58:04.405304: step: 1432/530, loss: 0.008600347675383091 2023-01-22 18:58:05.499725: step: 1436/530, loss: 0.002035481622442603 2023-01-22 18:58:06.622037: step: 1440/530, loss: 0.007148706819862127 2023-01-22 18:58:07.730943: step: 1444/530, loss: 0.005883886478841305 2023-01-22 18:58:08.838755: step: 1448/530, loss: 0.0025332090444862843 2023-01-22 18:58:09.916612: step: 1452/530, loss: 0.003139760810881853 2023-01-22 18:58:11.008482: step: 1456/530, loss: 0.00416307058185339 2023-01-22 18:58:12.126456: step: 1460/530, loss: 0.005314046982675791 2023-01-22 18:58:13.226662: step: 1464/530, loss: 0.008616367354989052 2023-01-22 18:58:14.313997: step: 1468/530, loss: 0.005100147798657417 2023-01-22 18:58:15.405318: step: 1472/530, loss: 0.0039847660809755325 2023-01-22 18:58:16.512461: step: 1476/530, loss: 0.0003103814960923046 2023-01-22 18:58:17.586666: step: 1480/530, loss: 0.00010832703992491588 2023-01-22 18:58:18.701686: step: 1484/530, loss: 0.019363101571798325 2023-01-22 18:58:19.784076: step: 1488/530, loss: 0.0038264915347099304 2023-01-22 18:58:20.866063: step: 1492/530, loss: 0.005332478322088718 2023-01-22 18:58:21.943358: step: 1496/530, loss: 0.0026007560081779957 2023-01-22 18:58:23.039766: step: 1500/530, loss: 0.006084011867642403 2023-01-22 18:58:24.135580: step: 1504/530, loss: 0.018632173538208008 2023-01-22 18:58:25.270120: step: 1508/530, loss: 0.0025714419316500425 2023-01-22 18:58:26.372787: step: 1512/530, loss: 0.0012076179264113307 2023-01-22 18:58:27.452944: step: 1516/530, loss: 0.0006937332800589502 2023-01-22 18:58:28.553531: step: 1520/530, loss: 0.00013510914868675172 2023-01-22 18:58:29.660375: step: 1524/530, loss: 0.019041750580072403 2023-01-22 18:58:30.760554: step: 1528/530, loss: 0.01660768687725067 2023-01-22 18:58:31.850879: step: 1532/530, loss: 0.0 2023-01-22 18:58:32.947020: step: 1536/530, loss: 0.00801519863307476 2023-01-22 18:58:34.075129: step: 1540/530, loss: 0.0038964995183050632 2023-01-22 18:58:35.170374: step: 1544/530, loss: 0.011827089823782444 2023-01-22 18:58:36.258512: step: 1548/530, loss: 0.0007869135588407516 2023-01-22 18:58:37.367282: step: 1552/530, loss: 0.010387184098362923 2023-01-22 18:58:38.464038: step: 1556/530, loss: 0.021088551729917526 2023-01-22 18:58:39.576978: step: 1560/530, loss: 0.0002866918803192675 2023-01-22 18:58:40.673557: step: 1564/530, loss: 0.004804663360118866 2023-01-22 18:58:41.805028: step: 1568/530, loss: 0.0076960292644798756 2023-01-22 18:58:42.894722: step: 1572/530, loss: 0.00040203926619142294 2023-01-22 18:58:44.005140: step: 1576/530, loss: 0.002767186611890793 2023-01-22 18:58:45.112988: step: 1580/530, loss: 0.0070724464021623135 2023-01-22 18:58:46.214025: step: 1584/530, loss: 0.006301302928477526 2023-01-22 18:58:47.303428: step: 1588/530, loss: 0.0021566362120211124 2023-01-22 18:58:48.419266: step: 1592/530, loss: 0.0001665118761593476 2023-01-22 18:58:49.549496: step: 1596/530, loss: 0.00469922972843051 2023-01-22 18:58:50.658929: step: 1600/530, loss: 0.01255431491881609 2023-01-22 18:58:51.753372: step: 1604/530, loss: 0.008955096825957298 2023-01-22 18:58:52.841944: step: 1608/530, loss: 0.0024435240775346756 2023-01-22 18:58:53.932807: step: 1612/530, loss: 0.0035248163621872663 2023-01-22 18:58:55.010884: step: 1616/530, loss: 0.0060799927450716496 2023-01-22 18:58:56.132506: step: 1620/530, loss: 0.0015154475113376975 2023-01-22 18:58:57.213306: step: 1624/530, loss: 0.002236857544630766 2023-01-22 18:58:58.335096: step: 1628/530, loss: 0.003611978143453598 2023-01-22 18:58:59.447872: step: 1632/530, loss: 0.004215634427964687 2023-01-22 18:59:00.561697: step: 1636/530, loss: 0.0055053094401955605 2023-01-22 18:59:01.682221: step: 1640/530, loss: 0.003384184557944536 2023-01-22 18:59:02.785537: step: 1644/530, loss: 0.007361925207078457 2023-01-22 18:59:03.869807: step: 1648/530, loss: 0.006534917745739222 2023-01-22 18:59:04.956334: step: 1652/530, loss: 0.030968040227890015 2023-01-22 18:59:06.070941: step: 1656/530, loss: 0.003852076129987836 2023-01-22 18:59:07.163750: step: 1660/530, loss: 0.002589681651443243 2023-01-22 18:59:08.269982: step: 1664/530, loss: 0.0044108061119914055 2023-01-22 18:59:09.370073: step: 1668/530, loss: 0.037874381989240646 2023-01-22 18:59:10.477034: step: 1672/530, loss: 0.005340332165360451 2023-01-22 18:59:11.574211: step: 1676/530, loss: 0.001252803485840559 2023-01-22 18:59:12.659061: step: 1680/530, loss: 0.0023055358324199915 2023-01-22 18:59:13.745891: step: 1684/530, loss: 0.005429337732493877 2023-01-22 18:59:14.865739: step: 1688/530, loss: 0.001402071793563664 2023-01-22 18:59:15.970415: step: 1692/530, loss: 0.003628536593168974 2023-01-22 18:59:17.066712: step: 1696/530, loss: 0.0034396806731820107 2023-01-22 18:59:18.162722: step: 1700/530, loss: 0.012472940608859062 2023-01-22 18:59:19.252196: step: 1704/530, loss: 0.017810627818107605 2023-01-22 18:59:20.350190: step: 1708/530, loss: 0.00910043716430664 2023-01-22 18:59:21.422532: step: 1712/530, loss: 0.012113492004573345 2023-01-22 18:59:22.508239: step: 1716/530, loss: 0.027594799175858498 2023-01-22 18:59:23.603145: step: 1720/530, loss: 0.007864712737500668 2023-01-22 18:59:24.698427: step: 1724/530, loss: 0.010359127074480057 2023-01-22 18:59:25.800369: step: 1728/530, loss: 0.004951147828251123 2023-01-22 18:59:26.899262: step: 1732/530, loss: 0.010661778971552849 2023-01-22 18:59:28.013877: step: 1736/530, loss: 0.04660448431968689 2023-01-22 18:59:29.137949: step: 1740/530, loss: 0.023057512938976288 2023-01-22 18:59:30.254467: step: 1744/530, loss: 0.0026987886521965265 2023-01-22 18:59:31.387143: step: 1748/530, loss: 0.008165402337908745 2023-01-22 18:59:32.520111: step: 1752/530, loss: 0.008982207626104355 2023-01-22 18:59:33.616393: step: 1756/530, loss: 0.002726080594584346 2023-01-22 18:59:34.725172: step: 1760/530, loss: 0.003132391953840852 2023-01-22 18:59:35.813132: step: 1764/530, loss: 0.0003318925737403333 2023-01-22 18:59:36.901700: step: 1768/530, loss: 0.0010938697960227728 2023-01-22 18:59:37.996714: step: 1772/530, loss: 0.016663808375597 2023-01-22 18:59:39.104515: step: 1776/530, loss: 0.007776834536343813 2023-01-22 18:59:40.182220: step: 1780/530, loss: 0.001584175624884665 2023-01-22 18:59:41.274781: step: 1784/530, loss: 0.00040965297375805676 2023-01-22 18:59:42.372560: step: 1788/530, loss: 0.009385798126459122 2023-01-22 18:59:43.472355: step: 1792/530, loss: 0.0006889718351885676 2023-01-22 18:59:44.577768: step: 1796/530, loss: 0.018294749781489372 2023-01-22 18:59:45.675065: step: 1800/530, loss: 0.0026774355210363865 2023-01-22 18:59:46.739223: step: 1804/530, loss: 0.015958787873387337 2023-01-22 18:59:47.847157: step: 1808/530, loss: 0.0016962961526587605 2023-01-22 18:59:48.955578: step: 1812/530, loss: 0.005244984291493893 2023-01-22 18:59:50.061208: step: 1816/530, loss: 0.0008689347305335104 2023-01-22 18:59:51.166590: step: 1820/530, loss: 0.003296517301350832 2023-01-22 18:59:52.259402: step: 1824/530, loss: 0.0016393533442169428 2023-01-22 18:59:53.358858: step: 1828/530, loss: 0.0016171283787116408 2023-01-22 18:59:54.454733: step: 1832/530, loss: 0.01213243417441845 2023-01-22 18:59:55.529972: step: 1836/530, loss: 5.0799677410395816e-05 2023-01-22 18:59:56.622978: step: 1840/530, loss: 0.00038332241820171475 2023-01-22 18:59:57.711746: step: 1844/530, loss: 0.008795974776148796 2023-01-22 18:59:58.797870: step: 1848/530, loss: 0.0019124295795336366 2023-01-22 18:59:59.932625: step: 1852/530, loss: 0.006140131037682295 2023-01-22 19:00:01.035342: step: 1856/530, loss: 0.002668975852429867 2023-01-22 19:00:02.142453: step: 1860/530, loss: 0.007928646169602871 2023-01-22 19:00:03.266500: step: 1864/530, loss: 0.005748241674154997 2023-01-22 19:00:04.365902: step: 1868/530, loss: 0.00027306514675728977 2023-01-22 19:00:05.461933: step: 1872/530, loss: 0.001409861957654357 2023-01-22 19:00:06.583192: step: 1876/530, loss: 0.008886498399078846 2023-01-22 19:00:07.675841: step: 1880/530, loss: 0.0022387877106666565 2023-01-22 19:00:08.765095: step: 1884/530, loss: 0.0016016238369047642 2023-01-22 19:00:09.876724: step: 1888/530, loss: 0.001985857030376792 2023-01-22 19:00:11.004727: step: 1892/530, loss: 0.0008222759934142232 2023-01-22 19:00:12.122150: step: 1896/530, loss: 0.002720050048083067 2023-01-22 19:00:13.228106: step: 1900/530, loss: 0.012504915706813335 2023-01-22 19:00:14.326829: step: 1904/530, loss: 0.004875602200627327 2023-01-22 19:00:15.413211: step: 1908/530, loss: 0.0031856712885200977 2023-01-22 19:00:16.514605: step: 1912/530, loss: 0.002739051589742303 2023-01-22 19:00:17.601525: step: 1916/530, loss: 0.022072207182645798 2023-01-22 19:00:18.692050: step: 1920/530, loss: 0.004854911006987095 2023-01-22 19:00:19.776447: step: 1924/530, loss: 0.0002982405130751431 2023-01-22 19:00:20.859433: step: 1928/530, loss: 0.0053671193309128284 2023-01-22 19:00:21.959895: step: 1932/530, loss: 0.007114367559552193 2023-01-22 19:00:23.041042: step: 1936/530, loss: 0.0012457175180315971 2023-01-22 19:00:24.130325: step: 1940/530, loss: 0.006959805730730295 2023-01-22 19:00:25.233457: step: 1944/530, loss: 0.001081329770386219 2023-01-22 19:00:26.357848: step: 1948/530, loss: 0.0066568139009177685 2023-01-22 19:00:27.481498: step: 1952/530, loss: 0.01788986846804619 2023-01-22 19:00:28.561514: step: 1956/530, loss: 0.007602077443152666 2023-01-22 19:00:29.669470: step: 1960/530, loss: 0.011420664377510548 2023-01-22 19:00:30.750002: step: 1964/530, loss: 0.003076155437156558 2023-01-22 19:00:31.837225: step: 1968/530, loss: 0.0017775805899873376 2023-01-22 19:00:32.933760: step: 1972/530, loss: 0.0011716056615114212 2023-01-22 19:00:34.000623: step: 1976/530, loss: 0.0007368326769210398 2023-01-22 19:00:35.101171: step: 1980/530, loss: 0.013338204473257065 2023-01-22 19:00:36.187243: step: 1984/530, loss: 0.00042962783481925726 2023-01-22 19:00:37.279642: step: 1988/530, loss: 0.00039271271089091897 2023-01-22 19:00:38.378423: step: 1992/530, loss: 0.0011719658505171537 2023-01-22 19:00:39.477518: step: 1996/530, loss: 0.003937747795134783 2023-01-22 19:00:40.589278: step: 2000/530, loss: 0.004414998460561037 2023-01-22 19:00:41.681272: step: 2004/530, loss: 0.00075063097756356 2023-01-22 19:00:42.809049: step: 2008/530, loss: 0.007871423847973347 2023-01-22 19:00:43.940203: step: 2012/530, loss: 0.01167930755764246 2023-01-22 19:00:45.043690: step: 2016/530, loss: 0.009887666441500187 2023-01-22 19:00:46.146555: step: 2020/530, loss: 0.0049647558480501175 2023-01-22 19:00:47.251721: step: 2024/530, loss: 0.0007859620964154601 2023-01-22 19:00:48.348279: step: 2028/530, loss: 0.014205127954483032 2023-01-22 19:00:49.432527: step: 2032/530, loss: 0.004115665331482887 2023-01-22 19:00:50.541681: step: 2036/530, loss: 0.0032271044328808784 2023-01-22 19:00:51.628404: step: 2040/530, loss: 0.004548276774585247 2023-01-22 19:00:52.731351: step: 2044/530, loss: 0.004282260313630104 2023-01-22 19:00:53.824094: step: 2048/530, loss: 0.0037071609403938055 2023-01-22 19:00:54.905498: step: 2052/530, loss: 0.0003640760842245072 2023-01-22 19:00:56.017968: step: 2056/530, loss: 0.0005618956638500094 2023-01-22 19:00:57.151803: step: 2060/530, loss: 0.0018802088452503085 2023-01-22 19:00:58.245124: step: 2064/530, loss: 0.0008161062141880393 2023-01-22 19:00:59.314439: step: 2068/530, loss: 0.0023067700676620007 2023-01-22 19:01:00.403480: step: 2072/530, loss: 0.005230557173490524 2023-01-22 19:01:01.490185: step: 2076/530, loss: 0.009671683423221111 2023-01-22 19:01:02.595733: step: 2080/530, loss: 0.00613103061914444 2023-01-22 19:01:03.682648: step: 2084/530, loss: 0.011765551753342152 2023-01-22 19:01:04.796101: step: 2088/530, loss: 0.0006902336026541889 2023-01-22 19:01:05.880965: step: 2092/530, loss: 0.009412631392478943 2023-01-22 19:01:06.983806: step: 2096/530, loss: 0.0038881096988916397 2023-01-22 19:01:08.108397: step: 2100/530, loss: 0.005062987562268972 2023-01-22 19:01:09.216260: step: 2104/530, loss: 0.005288320127874613 2023-01-22 19:01:10.322693: step: 2108/530, loss: 0.001456351368688047 2023-01-22 19:01:11.418263: step: 2112/530, loss: 0.006281753536313772 2023-01-22 19:01:12.535101: step: 2116/530, loss: 0.03574305772781372 2023-01-22 19:01:13.616189: step: 2120/530, loss: 0.001871609129011631 ================================================== Loss: 0.006 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33460531297324586, 'r': 0.3593673759826511, 'f1': 0.3465445693373415}, 'combined': 0.2553486300380411, 'stategy': 1, 'epoch': 9} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33482382929590704, 'r': 0.2868026074878887, 'f1': 0.30895837631353806}, 'combined': 0.19187941265788155, 'stategy': 1, 'epoch': 9} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3463071521960457, 'r': 0.3436786349118252, 'f1': 0.3449878868543464}, 'combined': 0.2542016008400447, 'stategy': 1, 'epoch': 9} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.32384618181262975, 'r': 0.2895716600975443, 'f1': 0.30575138209777264}, 'combined': 0.18988770046072198, 'stategy': 1, 'epoch': 9} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33781331386195423, 'r': 0.3275571221697507, 'f1': 0.3326061722224636}, 'combined': 0.24507823216392052, 'stategy': 1, 'epoch': 9} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34849030703267064, 'r': 0.2958555420020698, 'f1': 0.3200231329931626}, 'combined': 0.1987512089115431, 'stategy': 1, 'epoch': 9} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3138888888888889, 'r': 0.4035714285714286, 'f1': 0.35312499999999997}, 'combined': 0.23541666666666664, 'stategy': 1, 'epoch': 9} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.35294117647058826, 'r': 0.5217391304347826, 'f1': 0.4210526315789474}, 'combined': 0.2105263157894737, 'stategy': 1, 'epoch': 9} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 9} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 10 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 19:03:42.929405: step: 4/530, loss: 0.0034415009431540966 2023-01-22 19:03:44.036447: step: 8/530, loss: 0.0018855099333450198 2023-01-22 19:03:45.121524: step: 12/530, loss: 0.0025820701848715544 2023-01-22 19:03:46.213949: step: 16/530, loss: 0.005389011465013027 2023-01-22 19:03:47.286657: step: 20/530, loss: 0.0017314772121608257 2023-01-22 19:03:48.377540: step: 24/530, loss: 0.001437419094145298 2023-01-22 19:03:49.434708: step: 28/530, loss: 0.004753878340125084 2023-01-22 19:03:50.523041: step: 32/530, loss: 0.0023134828079491854 2023-01-22 19:03:51.605665: step: 36/530, loss: 0.0013290735660120845 2023-01-22 19:03:52.697941: step: 40/530, loss: 0.0027263276278972626 2023-01-22 19:03:53.793757: step: 44/530, loss: 0.009244153276085854 2023-01-22 19:03:54.888213: step: 48/530, loss: 0.0011075136717408895 2023-01-22 19:03:55.966448: step: 52/530, loss: 0.0011879028752446175 2023-01-22 19:03:57.044234: step: 56/530, loss: 0.011863050051033497 2023-01-22 19:03:58.123534: step: 60/530, loss: 0.0016303241718560457 2023-01-22 19:03:59.216665: step: 64/530, loss: 0.002244720235466957 2023-01-22 19:04:00.308007: step: 68/530, loss: 0.00011352369619999081 2023-01-22 19:04:01.386460: step: 72/530, loss: 0.00046751886839047074 2023-01-22 19:04:02.466169: step: 76/530, loss: 0.004899282474070787 2023-01-22 19:04:03.535271: step: 80/530, loss: 0.0033934323582798243 2023-01-22 19:04:04.642577: step: 84/530, loss: 0.005008421838283539 2023-01-22 19:04:05.710466: step: 88/530, loss: 0.0002878271334338933 2023-01-22 19:04:06.804993: step: 92/530, loss: 0.00558737525716424 2023-01-22 19:04:07.906578: step: 96/530, loss: 0.0093363206833601 2023-01-22 19:04:09.017536: step: 100/530, loss: 0.0032868129201233387 2023-01-22 19:04:10.079771: step: 104/530, loss: 0.004269672092050314 2023-01-22 19:04:11.166749: step: 108/530, loss: 0.012570032849907875 2023-01-22 19:04:12.284389: step: 112/530, loss: 0.0158297847956419 2023-01-22 19:04:13.391763: step: 116/530, loss: 0.0010067452676594257 2023-01-22 19:04:14.476326: step: 120/530, loss: 0.0024046064354479313 2023-01-22 19:04:15.557296: step: 124/530, loss: 0.00044459145283326507 2023-01-22 19:04:16.648410: step: 128/530, loss: 0.010600504465401173 2023-01-22 19:04:17.737925: step: 132/530, loss: 0.00039859768003225327 2023-01-22 19:04:18.842752: step: 136/530, loss: 0.003415749641135335 2023-01-22 19:04:19.945401: step: 140/530, loss: 0.028947310522198677 2023-01-22 19:04:21.025594: step: 144/530, loss: 0.0018326163990423083 2023-01-22 19:04:22.123701: step: 148/530, loss: 0.004080368671566248 2023-01-22 19:04:23.206229: step: 152/530, loss: 0.0005264051724225283 2023-01-22 19:04:24.289217: step: 156/530, loss: 0.0029352109413594007 2023-01-22 19:04:25.389647: step: 160/530, loss: 0.008986947126686573 2023-01-22 19:04:26.477640: step: 164/530, loss: 0.0053579979576170444 2023-01-22 19:04:27.597352: step: 168/530, loss: 0.0034974587615579367 2023-01-22 19:04:28.694047: step: 172/530, loss: 0.009433495812118053 2023-01-22 19:04:29.778559: step: 176/530, loss: 0.0007090445724315941 2023-01-22 19:04:30.880717: step: 180/530, loss: 0.00040775485103949904 2023-01-22 19:04:31.966969: step: 184/530, loss: 0.0025965918321162462 2023-01-22 19:04:33.065641: step: 188/530, loss: 0.0002931267081294209 2023-01-22 19:04:34.168476: step: 192/530, loss: 0.005676877684891224 2023-01-22 19:04:35.278570: step: 196/530, loss: 0.010167280212044716 2023-01-22 19:04:36.372417: step: 200/530, loss: 0.0068588582798838615 2023-01-22 19:04:37.450088: step: 204/530, loss: 0.0009279776131734252 2023-01-22 19:04:38.534040: step: 208/530, loss: 0.003876051167026162 2023-01-22 19:04:39.617525: step: 212/530, loss: 0.0012742475373670459 2023-01-22 19:04:40.724073: step: 216/530, loss: 0.007744040340185165 2023-01-22 19:04:41.833163: step: 220/530, loss: 0.006425646599382162 2023-01-22 19:04:42.940059: step: 224/530, loss: 0.00498602818697691 2023-01-22 19:04:44.044219: step: 228/530, loss: 0.0026386925019323826 2023-01-22 19:04:45.158766: step: 232/530, loss: 0.007540892343968153 2023-01-22 19:04:46.241651: step: 236/530, loss: 0.011274152435362339 2023-01-22 19:04:47.318227: step: 240/530, loss: 0.028672195971012115 2023-01-22 19:04:48.410865: step: 244/530, loss: 0.01065274141728878 2023-01-22 19:04:49.505280: step: 248/530, loss: 0.002114612376317382 2023-01-22 19:04:50.610257: step: 252/530, loss: 0.0017169505590572953 2023-01-22 19:04:51.706875: step: 256/530, loss: 0.006198923569172621 2023-01-22 19:04:52.787466: step: 260/530, loss: 0.0001791394461179152 2023-01-22 19:04:53.852330: step: 264/530, loss: 0.011137833818793297 2023-01-22 19:04:54.945693: step: 268/530, loss: 0.0015613245777785778 2023-01-22 19:04:56.024716: step: 272/530, loss: 0.0019488499965518713 2023-01-22 19:04:57.123894: step: 276/530, loss: 0.0012817097594961524 2023-01-22 19:04:58.221919: step: 280/530, loss: 0.0018022364238277078 2023-01-22 19:04:59.310504: step: 284/530, loss: 0.0019409205997362733 2023-01-22 19:05:00.401658: step: 288/530, loss: 0.002587040653452277 2023-01-22 19:05:01.518481: step: 292/530, loss: 0.004167493898421526 2023-01-22 19:05:02.617196: step: 296/530, loss: 0.004530603066086769 2023-01-22 19:05:03.701139: step: 300/530, loss: 0.000620887556578964 2023-01-22 19:05:04.820567: step: 304/530, loss: 0.0154774384573102 2023-01-22 19:05:05.921634: step: 308/530, loss: 0.00944730918854475 2023-01-22 19:05:07.031953: step: 312/530, loss: 0.0012708025751635432 2023-01-22 19:05:08.148351: step: 316/530, loss: 0.008497222326695919 2023-01-22 19:05:09.221898: step: 320/530, loss: 0.014150462113320827 2023-01-22 19:05:10.303166: step: 324/530, loss: 0.0027164421044290066 2023-01-22 19:05:11.392134: step: 328/530, loss: 0.008109225891530514 2023-01-22 19:05:12.487240: step: 332/530, loss: 0.0010222382843494415 2023-01-22 19:05:13.568862: step: 336/530, loss: 0.004857663996517658 2023-01-22 19:05:14.662591: step: 340/530, loss: 0.005858488846570253 2023-01-22 19:05:15.750975: step: 344/530, loss: 0.003807384055107832 2023-01-22 19:05:16.842464: step: 348/530, loss: 0.0032293195836246014 2023-01-22 19:05:17.923777: step: 352/530, loss: 0.003018673975020647 2023-01-22 19:05:19.011447: step: 356/530, loss: 0.029335839673876762 2023-01-22 19:05:20.110328: step: 360/530, loss: 0.01103054266422987 2023-01-22 19:05:21.194925: step: 364/530, loss: 0.0027374725323170424 2023-01-22 19:05:22.288237: step: 368/530, loss: 0.0012658733176067472 2023-01-22 19:05:23.383267: step: 372/530, loss: 0.004912860691547394 2023-01-22 19:05:24.476794: step: 376/530, loss: 0.002985097002238035 2023-01-22 19:05:25.578617: step: 380/530, loss: 0.005533963441848755 2023-01-22 19:05:26.682388: step: 384/530, loss: 0.0036693972069770098 2023-01-22 19:05:27.758268: step: 388/530, loss: 0.0030343160033226013 2023-01-22 19:05:28.842317: step: 392/530, loss: 0.0002340084611205384 2023-01-22 19:05:29.953484: step: 396/530, loss: 0.002366960048675537 2023-01-22 19:05:31.044353: step: 400/530, loss: 0.0045024738647043705 2023-01-22 19:05:32.127283: step: 404/530, loss: 0.0006814567022956908 2023-01-22 19:05:33.224770: step: 408/530, loss: 0.001246783067472279 2023-01-22 19:05:34.298967: step: 412/530, loss: 0.0031921551562845707 2023-01-22 19:05:35.400524: step: 416/530, loss: 0.0038193792570382357 2023-01-22 19:05:36.505472: step: 420/530, loss: 0.0016046573873609304 2023-01-22 19:05:37.613538: step: 424/530, loss: 0.004700668156147003 2023-01-22 19:05:38.726322: step: 428/530, loss: 0.008702094666659832 2023-01-22 19:05:39.826201: step: 432/530, loss: 0.01003299094736576 2023-01-22 19:05:40.932025: step: 436/530, loss: 0.018044637516140938 2023-01-22 19:05:42.039910: step: 440/530, loss: 9.396607492817566e-05 2023-01-22 19:05:43.143897: step: 444/530, loss: 0.012194762006402016 2023-01-22 19:05:44.225682: step: 448/530, loss: 0.00013641318946611136 2023-01-22 19:05:45.340882: step: 452/530, loss: 0.004846340976655483 2023-01-22 19:05:46.435902: step: 456/530, loss: 9.918484283844009e-05 2023-01-22 19:05:47.523046: step: 460/530, loss: 0.00012301348033361137 2023-01-22 19:05:48.619912: step: 464/530, loss: 0.0019925881642848253 2023-01-22 19:05:49.701613: step: 468/530, loss: 0.004436699207872152 2023-01-22 19:05:50.786391: step: 472/530, loss: 0.0027862873394042253 2023-01-22 19:05:51.895593: step: 476/530, loss: 0.008916843682527542 2023-01-22 19:05:52.987658: step: 480/530, loss: 0.002100105630233884 2023-01-22 19:05:54.091748: step: 484/530, loss: 0.003695284016430378 2023-01-22 19:05:55.191110: step: 488/530, loss: 0.00017014855984598398 2023-01-22 19:05:56.307422: step: 492/530, loss: 0.0018134398851543665 2023-01-22 19:05:57.422514: step: 496/530, loss: 0.0025519183836877346 2023-01-22 19:05:58.510159: step: 500/530, loss: 0.00042375936754979193 2023-01-22 19:05:59.635164: step: 504/530, loss: 0.01567401923239231 2023-01-22 19:06:00.727348: step: 508/530, loss: 0.0005772035801783204 2023-01-22 19:06:01.833263: step: 512/530, loss: 0.0016135585028678179 2023-01-22 19:06:02.924038: step: 516/530, loss: 0.002485134871676564 2023-01-22 19:06:04.033251: step: 520/530, loss: 0.012817529030144215 2023-01-22 19:06:05.126539: step: 524/530, loss: 0.004903607070446014 2023-01-22 19:06:06.223314: step: 528/530, loss: 0.007648189552128315 2023-01-22 19:06:07.340079: step: 532/530, loss: 0.003112268866971135 2023-01-22 19:06:08.463191: step: 536/530, loss: 0.017006365582346916 2023-01-22 19:06:09.554491: step: 540/530, loss: 0.00040519481990486383 2023-01-22 19:06:10.639498: step: 544/530, loss: 0.004090775735676289 2023-01-22 19:06:11.742834: step: 548/530, loss: 0.0016456767916679382 2023-01-22 19:06:12.822444: step: 552/530, loss: 0.01644858345389366 2023-01-22 19:06:13.918464: step: 556/530, loss: 0.002307191025465727 2023-01-22 19:06:15.006997: step: 560/530, loss: 0.006284062750637531 2023-01-22 19:06:16.104921: step: 564/530, loss: 0.0027016112580895424 2023-01-22 19:06:17.200369: step: 568/530, loss: 0.005701027810573578 2023-01-22 19:06:18.308780: step: 572/530, loss: 0.00931558758020401 2023-01-22 19:06:19.400795: step: 576/530, loss: 0.0020256154239177704 2023-01-22 19:06:20.493048: step: 580/530, loss: 0.023163888603448868 2023-01-22 19:06:21.567485: step: 584/530, loss: 0.0002538264961913228 2023-01-22 19:06:22.661167: step: 588/530, loss: 0.008892915211617947 2023-01-22 19:06:23.749662: step: 592/530, loss: 0.007267594803124666 2023-01-22 19:06:24.841521: step: 596/530, loss: 0.000707216328009963 2023-01-22 19:06:25.936943: step: 600/530, loss: 0.0036801721435040236 2023-01-22 19:06:27.033000: step: 604/530, loss: 0.004926749505102634 2023-01-22 19:06:28.150768: step: 608/530, loss: 0.0033411975018680096 2023-01-22 19:06:29.244573: step: 612/530, loss: 0.0029005182441323996 2023-01-22 19:06:30.343051: step: 616/530, loss: 0.0014471672475337982 2023-01-22 19:06:31.441069: step: 620/530, loss: 0.00519148726016283 2023-01-22 19:06:32.552082: step: 624/530, loss: 0.004915914963930845 2023-01-22 19:06:33.681380: step: 628/530, loss: 0.0110006770119071 2023-01-22 19:06:34.777390: step: 632/530, loss: 0.0012852144427597523 2023-01-22 19:06:35.862254: step: 636/530, loss: 0.00438058702275157 2023-01-22 19:06:36.943202: step: 640/530, loss: 0.00918579287827015 2023-01-22 19:06:38.056530: step: 644/530, loss: 0.0017917025834321976 2023-01-22 19:06:39.166001: step: 648/530, loss: 0.001813714043237269 2023-01-22 19:06:40.259696: step: 652/530, loss: 0.0052543762139976025 2023-01-22 19:06:41.367736: step: 656/530, loss: 0.0009003058657981455 2023-01-22 19:06:42.467500: step: 660/530, loss: 0.004665522836148739 2023-01-22 19:06:43.565036: step: 664/530, loss: 0.0020169091876596212 2023-01-22 19:06:44.656992: step: 668/530, loss: 0.0054077086970210075 2023-01-22 19:06:45.751189: step: 672/530, loss: 0.0017569754272699356 2023-01-22 19:06:46.842219: step: 676/530, loss: 0.0008131520007736981 2023-01-22 19:06:47.928736: step: 680/530, loss: 0.00010416947770863771 2023-01-22 19:06:49.025810: step: 684/530, loss: 0.0018142632907256484 2023-01-22 19:06:50.148027: step: 688/530, loss: 0.006656542420387268 2023-01-22 19:06:51.263974: step: 692/530, loss: 0.0005797837511636317 2023-01-22 19:06:52.354168: step: 696/530, loss: 0.0007885689847171307 2023-01-22 19:06:53.465413: step: 700/530, loss: 0.052023597061634064 2023-01-22 19:06:54.550277: step: 704/530, loss: 0.005453550722450018 2023-01-22 19:06:55.656247: step: 708/530, loss: 0.007839587517082691 2023-01-22 19:06:56.736167: step: 712/530, loss: 0.0009000131394714117 2023-01-22 19:06:57.811155: step: 716/530, loss: 0.00037429857184179127 2023-01-22 19:06:58.905106: step: 720/530, loss: 0.004768033046275377 2023-01-22 19:07:00.026529: step: 724/530, loss: 0.0070826830342411995 2023-01-22 19:07:01.129542: step: 728/530, loss: 0.0048217205330729485 2023-01-22 19:07:02.241619: step: 732/530, loss: 0.0013208432355895638 2023-01-22 19:07:03.337950: step: 736/530, loss: 0.00471006752923131 2023-01-22 19:07:04.444457: step: 740/530, loss: 0.0016549668507650495 2023-01-22 19:07:05.540900: step: 744/530, loss: 0.004077339079231024 2023-01-22 19:07:06.629528: step: 748/530, loss: 0.003988637588918209 2023-01-22 19:07:07.710649: step: 752/530, loss: 0.002860607346519828 2023-01-22 19:07:08.792615: step: 756/530, loss: 0.00011697473382810131 2023-01-22 19:07:09.890707: step: 760/530, loss: 0.0002914362703450024 2023-01-22 19:07:11.009018: step: 764/530, loss: 0.005991601850837469 2023-01-22 19:07:12.117105: step: 768/530, loss: 0.0004237417597323656 2023-01-22 19:07:13.190577: step: 772/530, loss: 0.0021470848005264997 2023-01-22 19:07:14.265039: step: 776/530, loss: 0.002884796354919672 2023-01-22 19:07:15.351625: step: 780/530, loss: 0.004891611635684967 2023-01-22 19:07:16.437967: step: 784/530, loss: 0.01020373497158289 2023-01-22 19:07:17.555212: step: 788/530, loss: 0.004425450228154659 2023-01-22 19:07:18.652828: step: 792/530, loss: 0.007049204781651497 2023-01-22 19:07:19.739327: step: 796/530, loss: 0.010170838795602322 2023-01-22 19:07:20.840739: step: 800/530, loss: 0.0035678057465702295 2023-01-22 19:07:21.945929: step: 804/530, loss: 0.010326921939849854 2023-01-22 19:07:23.020692: step: 808/530, loss: 0.04217381402850151 2023-01-22 19:07:24.112330: step: 812/530, loss: 0.0013110467698425055 2023-01-22 19:07:25.216877: step: 816/530, loss: 0.014697118662297726 2023-01-22 19:07:26.314217: step: 820/530, loss: 0.0015910804504528642 2023-01-22 19:07:27.406781: step: 824/530, loss: 0.006394257768988609 2023-01-22 19:07:28.515049: step: 828/530, loss: 0.004869935568422079 2023-01-22 19:07:29.596237: step: 832/530, loss: 0.01354996394366026 2023-01-22 19:07:30.697591: step: 836/530, loss: 0.01052496675401926 2023-01-22 19:07:31.788196: step: 840/530, loss: 0.003269155975431204 2023-01-22 19:07:32.897110: step: 844/530, loss: 0.018886715173721313 2023-01-22 19:07:34.003619: step: 848/530, loss: 0.00438551465049386 2023-01-22 19:07:35.101008: step: 852/530, loss: 0.006867893505841494 2023-01-22 19:07:36.195650: step: 856/530, loss: 0.001360465888865292 2023-01-22 19:07:37.298826: step: 860/530, loss: 0.007910734042525291 2023-01-22 19:07:38.395898: step: 864/530, loss: 7.721110159764066e-05 2023-01-22 19:07:39.494950: step: 868/530, loss: 0.0023887630086392164 2023-01-22 19:07:40.602816: step: 872/530, loss: 0.00022753450321033597 2023-01-22 19:07:41.706137: step: 876/530, loss: 0.006508971098810434 2023-01-22 19:07:42.803086: step: 880/530, loss: 0.0015781933907419443 2023-01-22 19:07:43.904766: step: 884/530, loss: 0.009550977498292923 2023-01-22 19:07:44.992783: step: 888/530, loss: 0.0021734812762588263 2023-01-22 19:07:46.073475: step: 892/530, loss: 0.006952111143618822 2023-01-22 19:07:47.168453: step: 896/530, loss: 0.0006070664385333657 2023-01-22 19:07:48.266071: step: 900/530, loss: 0.001960593508556485 2023-01-22 19:07:49.361053: step: 904/530, loss: 0.00942571833729744 2023-01-22 19:07:50.464958: step: 908/530, loss: 0.004294681828469038 2023-01-22 19:07:51.542626: step: 912/530, loss: 0.007583240978419781 2023-01-22 19:07:52.625974: step: 916/530, loss: 0.0031840302981436253 2023-01-22 19:07:53.726078: step: 920/530, loss: 0.0025073098950088024 2023-01-22 19:07:54.816187: step: 924/530, loss: 0.0033496415708214045 2023-01-22 19:07:55.916587: step: 928/530, loss: 0.004370107315480709 2023-01-22 19:07:57.018159: step: 932/530, loss: 0.000515086343511939 2023-01-22 19:07:58.138601: step: 936/530, loss: 0.010644691064953804 2023-01-22 19:07:59.217728: step: 940/530, loss: 0.0015098314033821225 2023-01-22 19:08:00.321508: step: 944/530, loss: 0.00036256806924939156 2023-01-22 19:08:01.419654: step: 948/530, loss: 0.005524048116058111 2023-01-22 19:08:02.510187: step: 952/530, loss: 0.0008494430803693831 2023-01-22 19:08:03.631098: step: 956/530, loss: 0.006233882158994675 2023-01-22 19:08:04.711268: step: 960/530, loss: 0.003864891128614545 2023-01-22 19:08:05.791229: step: 964/530, loss: 0.0045983027666807175 2023-01-22 19:08:06.877079: step: 968/530, loss: 0.0032973329070955515 2023-01-22 19:08:07.985765: step: 972/530, loss: 0.0009336351067759097 2023-01-22 19:08:09.100138: step: 976/530, loss: 0.002526262542232871 2023-01-22 19:08:10.174116: step: 980/530, loss: 0.006512057967483997 2023-01-22 19:08:11.287115: step: 984/530, loss: 7.263862789841369e-05 2023-01-22 19:08:12.386046: step: 988/530, loss: 0.004556652624160051 2023-01-22 19:08:13.465273: step: 992/530, loss: 0.003534437622874975 2023-01-22 19:08:14.590534: step: 996/530, loss: 0.004351919516921043 2023-01-22 19:08:15.657885: step: 1000/530, loss: 0.0018057613633573055 2023-01-22 19:08:16.725427: step: 1004/530, loss: 0.003542422316968441 2023-01-22 19:08:17.837363: step: 1008/530, loss: 0.0035890303552150726 2023-01-22 19:08:18.927047: step: 1012/530, loss: 0.005569561384618282 2023-01-22 19:08:20.024208: step: 1016/530, loss: 0.0074818190187215805 2023-01-22 19:08:21.087719: step: 1020/530, loss: 0.0006150158005766571 2023-01-22 19:08:22.209153: step: 1024/530, loss: 0.00553083885461092 2023-01-22 19:08:23.316306: step: 1028/530, loss: 0.00024989820667542517 2023-01-22 19:08:24.424570: step: 1032/530, loss: 0.00281052989885211 2023-01-22 19:08:25.525106: step: 1036/530, loss: 0.006160425953567028 2023-01-22 19:08:26.624852: step: 1040/530, loss: 0.006961078383028507 2023-01-22 19:08:27.712455: step: 1044/530, loss: 0.022290097549557686 2023-01-22 19:08:28.786333: step: 1048/530, loss: 0.0015631720889359713 2023-01-22 19:08:29.885049: step: 1052/530, loss: 0.00197742972522974 2023-01-22 19:08:30.975697: step: 1056/530, loss: 0.0014348529512062669 2023-01-22 19:08:32.073971: step: 1060/530, loss: 0.004474959336221218 2023-01-22 19:08:33.177638: step: 1064/530, loss: 0.00034423902980051935 2023-01-22 19:08:34.266114: step: 1068/530, loss: 0.0015322730178013444 2023-01-22 19:08:35.369928: step: 1072/530, loss: 0.002828197320923209 2023-01-22 19:08:36.451662: step: 1076/530, loss: 0.006610402371734381 2023-01-22 19:08:37.588678: step: 1080/530, loss: 0.0006098880548961461 2023-01-22 19:08:38.718096: step: 1084/530, loss: 0.0016893999418243766 2023-01-22 19:08:39.820784: step: 1088/530, loss: 0.015406097285449505 2023-01-22 19:08:40.898038: step: 1092/530, loss: 0.0007497449987567961 2023-01-22 19:08:41.967226: step: 1096/530, loss: 0.0034004985354840755 2023-01-22 19:08:43.045889: step: 1100/530, loss: 0.006882116198539734 2023-01-22 19:08:44.139261: step: 1104/530, loss: 0.00790882483124733 2023-01-22 19:08:45.266248: step: 1108/530, loss: 0.005721793510019779 2023-01-22 19:08:46.353637: step: 1112/530, loss: 0.011735101230442524 2023-01-22 19:08:47.446334: step: 1116/530, loss: 0.0008561141439713538 2023-01-22 19:08:48.564118: step: 1120/530, loss: 0.006097300909459591 2023-01-22 19:08:49.699094: step: 1124/530, loss: 0.006091817282140255 2023-01-22 19:08:50.800791: step: 1128/530, loss: 0.00031029951060190797 2023-01-22 19:08:51.913776: step: 1132/530, loss: 0.0028116947505623102 2023-01-22 19:08:53.029243: step: 1136/530, loss: 0.0028461655601859093 2023-01-22 19:08:54.130132: step: 1140/530, loss: 0.0017151185311377048 2023-01-22 19:08:55.210942: step: 1144/530, loss: 0.0021916173864156008 2023-01-22 19:08:56.296752: step: 1148/530, loss: 0.0028402898460626602 2023-01-22 19:08:57.384705: step: 1152/530, loss: 0.008344939909875393 2023-01-22 19:08:58.486434: step: 1156/530, loss: 0.0025396314449608326 2023-01-22 19:08:59.572004: step: 1160/530, loss: 0.0022760778665542603 2023-01-22 19:09:00.681642: step: 1164/530, loss: 0.0015138674061745405 2023-01-22 19:09:01.786438: step: 1168/530, loss: 0.0048512788489460945 2023-01-22 19:09:02.910018: step: 1172/530, loss: 0.0025135655887424946 2023-01-22 19:09:04.000980: step: 1176/530, loss: 0.0012192686554044485 2023-01-22 19:09:05.069298: step: 1180/530, loss: 0.003668656339868903 2023-01-22 19:09:06.157776: step: 1184/530, loss: 0.0010577113134786487 2023-01-22 19:09:07.240345: step: 1188/530, loss: 0.0037559799384325743 2023-01-22 19:09:08.331753: step: 1192/530, loss: 0.006520634517073631 2023-01-22 19:09:09.439071: step: 1196/530, loss: 0.005236170720309019 2023-01-22 19:09:10.549423: step: 1200/530, loss: 0.0003623549418989569 2023-01-22 19:09:11.635524: step: 1204/530, loss: 0.0013735555112361908 2023-01-22 19:09:12.731054: step: 1208/530, loss: 0.0009886849438771605 2023-01-22 19:09:13.809047: step: 1212/530, loss: 0.0024561192840337753 2023-01-22 19:09:14.951286: step: 1216/530, loss: 0.004731297492980957 2023-01-22 19:09:16.077289: step: 1220/530, loss: 0.0025116626638919115 2023-01-22 19:09:17.148102: step: 1224/530, loss: 0.003190577495843172 2023-01-22 19:09:18.246177: step: 1228/530, loss: 0.009936847724020481 2023-01-22 19:09:19.338455: step: 1232/530, loss: 0.0006460713921114802 2023-01-22 19:09:20.422765: step: 1236/530, loss: 0.00035688711795955896 2023-01-22 19:09:21.503547: step: 1240/530, loss: 0.002589360112324357 2023-01-22 19:09:22.615067: step: 1244/530, loss: 0.002872176468372345 2023-01-22 19:09:23.706767: step: 1248/530, loss: 0.005783560685813427 2023-01-22 19:09:24.799648: step: 1252/530, loss: 0.009352799504995346 2023-01-22 19:09:25.894722: step: 1256/530, loss: 0.0019772867672145367 2023-01-22 19:09:26.984098: step: 1260/530, loss: 0.01452991459518671 2023-01-22 19:09:28.092630: step: 1264/530, loss: 0.0008392550516873598 2023-01-22 19:09:29.194730: step: 1268/530, loss: 0.002110585570335388 2023-01-22 19:09:30.288227: step: 1272/530, loss: 0.0 2023-01-22 19:09:31.399508: step: 1276/530, loss: 0.0009411110077053308 2023-01-22 19:09:32.500545: step: 1280/530, loss: 0.0019496346358209848 2023-01-22 19:09:33.581032: step: 1284/530, loss: 0.0007129334844648838 2023-01-22 19:09:34.682808: step: 1288/530, loss: 5.188986961002229e-06 2023-01-22 19:09:35.786794: step: 1292/530, loss: 3.364436634001322e-05 2023-01-22 19:09:36.871636: step: 1296/530, loss: 3.258133074268699e-05 2023-01-22 19:09:37.953061: step: 1300/530, loss: 0.014258338138461113 2023-01-22 19:09:39.058807: step: 1304/530, loss: 0.008571045473217964 2023-01-22 19:09:40.175231: step: 1308/530, loss: 0.0028334816452115774 2023-01-22 19:09:41.274062: step: 1312/530, loss: 0.0011947295861318707 2023-01-22 19:09:42.362270: step: 1316/530, loss: 0.01433481927961111 2023-01-22 19:09:43.467788: step: 1320/530, loss: 0.01468334998935461 2023-01-22 19:09:44.570570: step: 1324/530, loss: 0.004220316186547279 2023-01-22 19:09:45.668325: step: 1328/530, loss: 0.0023487682919949293 2023-01-22 19:09:46.778549: step: 1332/530, loss: 0.0037937385495752096 2023-01-22 19:09:47.868023: step: 1336/530, loss: 0.005685847718268633 2023-01-22 19:09:48.962783: step: 1340/530, loss: 0.0036236243322491646 2023-01-22 19:09:50.063640: step: 1344/530, loss: 0.0037714182399213314 2023-01-22 19:09:51.154517: step: 1348/530, loss: 0.0027703167870640755 2023-01-22 19:09:52.253773: step: 1352/530, loss: 0.0034639134537428617 2023-01-22 19:09:53.358513: step: 1356/530, loss: 0.0013512304285541177 2023-01-22 19:09:54.454502: step: 1360/530, loss: 0.0038040808867663145 2023-01-22 19:09:55.542542: step: 1364/530, loss: 0.003248954890295863 2023-01-22 19:09:56.642830: step: 1368/530, loss: 0.0013664424186572433 2023-01-22 19:09:57.716985: step: 1372/530, loss: 0.0016001887852326035 2023-01-22 19:09:58.823730: step: 1376/530, loss: 0.0051473951898515224 2023-01-22 19:09:59.921293: step: 1380/530, loss: 0.029464716091752052 2023-01-22 19:10:01.028448: step: 1384/530, loss: 0.00023289750970434397 2023-01-22 19:10:02.139857: step: 1388/530, loss: 0.04877311363816261 2023-01-22 19:10:03.249516: step: 1392/530, loss: 0.005440156906843185 2023-01-22 19:10:04.336125: step: 1396/530, loss: 0.0007012205896899104 2023-01-22 19:10:05.434366: step: 1400/530, loss: 0.0007147606229409575 2023-01-22 19:10:06.517929: step: 1404/530, loss: 0.0024747319985181093 2023-01-22 19:10:07.625035: step: 1408/530, loss: 0.0021012744400650263 2023-01-22 19:10:08.734315: step: 1412/530, loss: 0.003056436777114868 2023-01-22 19:10:09.843633: step: 1416/530, loss: 0.007285845000296831 2023-01-22 19:10:10.941568: step: 1420/530, loss: 0.006533654872328043 2023-01-22 19:10:12.043689: step: 1424/530, loss: 0.0011564880842342973 2023-01-22 19:10:13.159791: step: 1428/530, loss: 0.0038760975003242493 2023-01-22 19:10:14.267932: step: 1432/530, loss: 0.00046560607734136283 2023-01-22 19:10:15.382395: step: 1436/530, loss: 0.007719695568084717 2023-01-22 19:10:16.490292: step: 1440/530, loss: 0.000948564033024013 2023-01-22 19:10:17.564176: step: 1444/530, loss: 0.012988336384296417 2023-01-22 19:10:18.668581: step: 1448/530, loss: 0.0023189648054540157 2023-01-22 19:10:19.757293: step: 1452/530, loss: 0.0009147964883595705 2023-01-22 19:10:20.844930: step: 1456/530, loss: 0.0035243304446339607 2023-01-22 19:10:21.936675: step: 1460/530, loss: 0.003154285717755556 2023-01-22 19:10:23.036241: step: 1464/530, loss: 0.017779337242245674 2023-01-22 19:10:24.117153: step: 1468/530, loss: 0.002096073003485799 2023-01-22 19:10:25.214303: step: 1472/530, loss: 0.011108839884400368 2023-01-22 19:10:26.304563: step: 1476/530, loss: 0.000411507033277303 2023-01-22 19:10:27.423067: step: 1480/530, loss: 0.0070840464904904366 2023-01-22 19:10:28.521436: step: 1484/530, loss: 0.0040029967203736305 2023-01-22 19:10:29.620293: step: 1488/530, loss: 0.018261317163705826 2023-01-22 19:10:30.706335: step: 1492/530, loss: 0.022633962333202362 2023-01-22 19:10:31.783524: step: 1496/530, loss: 0.0007916140602901578 2023-01-22 19:10:32.873725: step: 1500/530, loss: 0.001371148508042097 2023-01-22 19:10:34.009337: step: 1504/530, loss: 0.020567800849676132 2023-01-22 19:10:35.094949: step: 1508/530, loss: 0.008351309224963188 2023-01-22 19:10:36.182820: step: 1512/530, loss: 0.0036118722055107355 2023-01-22 19:10:37.281129: step: 1516/530, loss: 0.024894297122955322 2023-01-22 19:10:38.344417: step: 1520/530, loss: 0.00034612778108567 2023-01-22 19:10:39.428291: step: 1524/530, loss: 0.0061981286853551865 2023-01-22 19:10:40.535178: step: 1528/530, loss: 0.016763020306825638 2023-01-22 19:10:41.604143: step: 1532/530, loss: 0.0008295041043311357 2023-01-22 19:10:42.686561: step: 1536/530, loss: 0.010216237045824528 2023-01-22 19:10:43.791908: step: 1540/530, loss: 0.0017834630561992526 2023-01-22 19:10:44.892340: step: 1544/530, loss: 0.012036183848977089 2023-01-22 19:10:45.967860: step: 1548/530, loss: 0.0027237434405833483 2023-01-22 19:10:47.058894: step: 1552/530, loss: 0.007208657916635275 2023-01-22 19:10:48.175888: step: 1556/530, loss: 0.009769456461071968 2023-01-22 19:10:49.257139: step: 1560/530, loss: 0.0007078879280015826 2023-01-22 19:10:50.348179: step: 1564/530, loss: 0.002872936427593231 2023-01-22 19:10:51.436172: step: 1568/530, loss: 0.005300926975905895 2023-01-22 19:10:52.518085: step: 1572/530, loss: 0.0014098727842792869 2023-01-22 19:10:53.613768: step: 1576/530, loss: 0.006817088462412357 2023-01-22 19:10:54.718659: step: 1580/530, loss: 0.0013497865293174982 2023-01-22 19:10:55.815067: step: 1584/530, loss: 0.00028876421856693923 2023-01-22 19:10:56.936673: step: 1588/530, loss: 0.004325491841882467 2023-01-22 19:10:58.030077: step: 1592/530, loss: 0.011348665691912174 2023-01-22 19:10:59.125052: step: 1596/530, loss: 0.0035355770960450172 2023-01-22 19:11:00.198933: step: 1600/530, loss: 0.00013748608762398362 2023-01-22 19:11:01.301563: step: 1604/530, loss: 0.002196061657741666 2023-01-22 19:11:02.389189: step: 1608/530, loss: 0.0021907149348407984 2023-01-22 19:11:03.491333: step: 1612/530, loss: 0.0043025934137403965 2023-01-22 19:11:04.589461: step: 1616/530, loss: 0.004991177003830671 2023-01-22 19:11:05.680344: step: 1620/530, loss: 0.0009854704840108752 2023-01-22 19:11:06.771391: step: 1624/530, loss: 0.0009910885710269213 2023-01-22 19:11:07.893114: step: 1628/530, loss: 0.013235753402113914 2023-01-22 19:11:08.984111: step: 1632/530, loss: 0.002808724297210574 2023-01-22 19:11:10.084383: step: 1636/530, loss: 0.002283906564116478 2023-01-22 19:11:11.176699: step: 1640/530, loss: 0.005316497758030891 2023-01-22 19:11:12.290886: step: 1644/530, loss: 0.004256706219166517 2023-01-22 19:11:13.397918: step: 1648/530, loss: 0.0075982981361448765 2023-01-22 19:11:14.510617: step: 1652/530, loss: 0.006811073049902916 2023-01-22 19:11:15.603651: step: 1656/530, loss: 0.0011994980741292238 2023-01-22 19:11:16.689552: step: 1660/530, loss: 0.001670225989073515 2023-01-22 19:11:17.769419: step: 1664/530, loss: 0.0027181445620954037 2023-01-22 19:11:18.875563: step: 1668/530, loss: 0.0022412072867155075 2023-01-22 19:11:19.962000: step: 1672/530, loss: 0.002797999419271946 2023-01-22 19:11:21.073130: step: 1676/530, loss: 0.00272500142455101 2023-01-22 19:11:22.165031: step: 1680/530, loss: 0.0052646188996732235 2023-01-22 19:11:23.255458: step: 1684/530, loss: 2.53915750363376e-05 2023-01-22 19:11:24.348708: step: 1688/530, loss: 0.00134277471806854 2023-01-22 19:11:25.458643: step: 1692/530, loss: 0.013469576835632324 2023-01-22 19:11:26.550962: step: 1696/530, loss: 0.008590266108512878 2023-01-22 19:11:27.651916: step: 1700/530, loss: 0.0021843782160431147 2023-01-22 19:11:28.751748: step: 1704/530, loss: 0.007513238582760096 2023-01-22 19:11:29.844586: step: 1708/530, loss: 0.0145924286916852 2023-01-22 19:11:30.947065: step: 1712/530, loss: 0.002340807346627116 2023-01-22 19:11:32.048274: step: 1716/530, loss: 0.01064359862357378 2023-01-22 19:11:33.140120: step: 1720/530, loss: 0.007667229976505041 2023-01-22 19:11:34.225039: step: 1724/530, loss: 0.006118538789451122 2023-01-22 19:11:35.314304: step: 1728/530, loss: 0.004504764452576637 2023-01-22 19:11:36.411003: step: 1732/530, loss: 0.006519198417663574 2023-01-22 19:11:37.510277: step: 1736/530, loss: 0.0039019996766000986 2023-01-22 19:11:38.604144: step: 1740/530, loss: 0.003268276108428836 2023-01-22 19:11:39.698602: step: 1744/530, loss: 0.0038736071437597275 2023-01-22 19:11:40.803401: step: 1748/530, loss: 0.010874832980334759 2023-01-22 19:11:41.894768: step: 1752/530, loss: 0.003607241902500391 2023-01-22 19:11:42.982265: step: 1756/530, loss: 0.0023108585737645626 2023-01-22 19:11:44.059938: step: 1760/530, loss: 0.0 2023-01-22 19:11:45.148964: step: 1764/530, loss: 0.003200850449502468 2023-01-22 19:11:46.248251: step: 1768/530, loss: 0.009596412070095539 2023-01-22 19:11:47.335317: step: 1772/530, loss: 0.002132405759766698 2023-01-22 19:11:48.415956: step: 1776/530, loss: 0.00011658322910079733 2023-01-22 19:11:49.515175: step: 1780/530, loss: 0.001403294038027525 2023-01-22 19:11:50.612839: step: 1784/530, loss: 0.0010689322371035814 2023-01-22 19:11:51.704487: step: 1788/530, loss: 0.00023162271827459335 2023-01-22 19:11:52.793385: step: 1792/530, loss: 0.00031199815566651523 2023-01-22 19:11:53.880610: step: 1796/530, loss: 0.011649326421320438 2023-01-22 19:11:54.953511: step: 1800/530, loss: 0.0030095886904746294 2023-01-22 19:11:56.072955: step: 1804/530, loss: 0.0045340885408222675 2023-01-22 19:11:57.161486: step: 1808/530, loss: 0.004164821468293667 2023-01-22 19:11:58.246700: step: 1812/530, loss: 0.0030954324174672365 2023-01-22 19:11:59.339257: step: 1816/530, loss: 0.004995994735509157 2023-01-22 19:12:00.448894: step: 1820/530, loss: 0.00032775578438304365 2023-01-22 19:12:01.558581: step: 1824/530, loss: 0.0033056489191949368 2023-01-22 19:12:02.667606: step: 1828/530, loss: 0.0016626243013888597 2023-01-22 19:12:03.760411: step: 1832/530, loss: 1.0593716979201417e-05 2023-01-22 19:12:04.846573: step: 1836/530, loss: 0.006667034700512886 2023-01-22 19:12:05.953761: step: 1840/530, loss: 0.009982477873563766 2023-01-22 19:12:07.052494: step: 1844/530, loss: 0.01013704389333725 2023-01-22 19:12:08.182401: step: 1848/530, loss: 0.00021069031208753586 2023-01-22 19:12:09.257584: step: 1852/530, loss: 0.002714292611926794 2023-01-22 19:12:10.351803: step: 1856/530, loss: 0.0003858456911984831 2023-01-22 19:12:11.445919: step: 1860/530, loss: 0.014455663971602917 2023-01-22 19:12:12.547046: step: 1864/530, loss: 0.003604452358558774 2023-01-22 19:12:13.652881: step: 1868/530, loss: 0.012609553523361683 2023-01-22 19:12:14.740438: step: 1872/530, loss: 0.0004549937439151108 2023-01-22 19:12:15.810469: step: 1876/530, loss: 0.0034798739943653345 2023-01-22 19:12:16.909736: step: 1880/530, loss: 0.005634340923279524 2023-01-22 19:12:18.007716: step: 1884/530, loss: 8.543483272660524e-05 2023-01-22 19:12:19.094025: step: 1888/530, loss: 0.008969456888735294 2023-01-22 19:12:20.175486: step: 1892/530, loss: 0.008344369940459728 2023-01-22 19:12:21.295700: step: 1896/530, loss: 0.0026686647906899452 2023-01-22 19:12:22.383124: step: 1900/530, loss: 0.01765001378953457 2023-01-22 19:12:23.478300: step: 1904/530, loss: 0.00037060148315504193 2023-01-22 19:12:24.561464: step: 1908/530, loss: 0.003669881261885166 2023-01-22 19:12:25.671636: step: 1912/530, loss: 0.0032493583858013153 2023-01-22 19:12:26.773479: step: 1916/530, loss: 0.005560439079999924 2023-01-22 19:12:27.872929: step: 1920/530, loss: 0.015126613900065422 2023-01-22 19:12:29.001262: step: 1924/530, loss: 0.03719492256641388 2023-01-22 19:12:30.099058: step: 1928/530, loss: 0.0004608245217241347 2023-01-22 19:12:31.190899: step: 1932/530, loss: 0.0004902182263322175 2023-01-22 19:12:32.284147: step: 1936/530, loss: 0.00780758960172534 2023-01-22 19:12:33.379122: step: 1940/530, loss: 0.0021297961939126253 2023-01-22 19:12:34.470520: step: 1944/530, loss: 0.010691937990486622 2023-01-22 19:12:35.554499: step: 1948/530, loss: 0.004143524449318647 2023-01-22 19:12:36.636569: step: 1952/530, loss: 0.005331322085112333 2023-01-22 19:12:37.740997: step: 1956/530, loss: 0.03961164876818657 2023-01-22 19:12:38.830217: step: 1960/530, loss: 0.008898531086742878 2023-01-22 19:12:39.925009: step: 1964/530, loss: 0.002609647111967206 2023-01-22 19:12:41.044754: step: 1968/530, loss: 0.004613959696143866 2023-01-22 19:12:42.133888: step: 1972/530, loss: 0.002736974973231554 2023-01-22 19:12:43.225176: step: 1976/530, loss: 0.0058308071456849575 2023-01-22 19:12:44.330598: step: 1980/530, loss: 0.008194469846785069 2023-01-22 19:12:45.439280: step: 1984/530, loss: 0.001225427258759737 2023-01-22 19:12:46.518939: step: 1988/530, loss: 0.00017375429160892963 2023-01-22 19:12:47.608990: step: 1992/530, loss: 0.004000471904873848 2023-01-22 19:12:48.697929: step: 1996/530, loss: 0.0037554746959358454 2023-01-22 19:12:49.835208: step: 2000/530, loss: 0.0032068383879959583 2023-01-22 19:12:50.925617: step: 2004/530, loss: 0.007411566097289324 2023-01-22 19:12:52.035683: step: 2008/530, loss: 0.015719568356871605 2023-01-22 19:12:53.124177: step: 2012/530, loss: 0.004038520157337189 2023-01-22 19:12:54.225539: step: 2016/530, loss: 0.0015511835226789117 2023-01-22 19:12:55.304863: step: 2020/530, loss: 0.001353686093352735 2023-01-22 19:12:56.441338: step: 2024/530, loss: 0.0034951341804116964 2023-01-22 19:12:57.535594: step: 2028/530, loss: 0.0031962350476533175 2023-01-22 19:12:58.622799: step: 2032/530, loss: 0.003692465601488948 2023-01-22 19:12:59.723710: step: 2036/530, loss: 0.0018718288047239184 2023-01-22 19:13:00.817035: step: 2040/530, loss: 0.0010259640403091908 2023-01-22 19:13:01.908467: step: 2044/530, loss: 0.011069604195654392 2023-01-22 19:13:03.011517: step: 2048/530, loss: 0.009898328222334385 2023-01-22 19:13:04.113754: step: 2052/530, loss: 0.002545662224292755 2023-01-22 19:13:05.208363: step: 2056/530, loss: 0.004568136762827635 2023-01-22 19:13:06.319563: step: 2060/530, loss: 0.004701043479144573 2023-01-22 19:13:07.390911: step: 2064/530, loss: 0.005160473752766848 2023-01-22 19:13:08.477543: step: 2068/530, loss: 0.0006103627383708954 2023-01-22 19:13:09.560483: step: 2072/530, loss: 8.681625331519172e-05 2023-01-22 19:13:10.659102: step: 2076/530, loss: 0.0011636678827926517 2023-01-22 19:13:11.800921: step: 2080/530, loss: 0.002393764676526189 2023-01-22 19:13:12.883075: step: 2084/530, loss: 0.0002670777903404087 2023-01-22 19:13:13.959999: step: 2088/530, loss: 0.0063750711269676685 2023-01-22 19:13:15.050563: step: 2092/530, loss: 0.00611089589074254 2023-01-22 19:13:16.136886: step: 2096/530, loss: 0.013167677447199821 2023-01-22 19:13:17.221658: step: 2100/530, loss: 0.007116015534847975 2023-01-22 19:13:18.310598: step: 2104/530, loss: 0.002222956158220768 2023-01-22 19:13:19.397748: step: 2108/530, loss: 0.006987978704273701 2023-01-22 19:13:20.501356: step: 2112/530, loss: 0.002270687837153673 2023-01-22 19:13:21.605085: step: 2116/530, loss: 0.02031017281115055 2023-01-22 19:13:22.702542: step: 2120/530, loss: 0.002151333726942539 ================================================== Loss: 0.005 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3383481344237158, 'r': 0.3588929926809433, 'f1': 0.34831787687450666}, 'combined': 0.2566552776970049, 'stategy': 1, 'epoch': 10} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.333764327385087, 'r': 0.2865553275670183, 'f1': 0.3083634232786115}, 'combined': 0.1915099155098745, 'stategy': 1, 'epoch': 10} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3443320163470188, 'r': 0.3436786349118252, 'f1': 0.344005015381827}, 'combined': 0.2534773797550304, 'stategy': 1, 'epoch': 10} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.31718826911741993, 'r': 0.28487334160100625, 'f1': 0.30016357306786584}, 'combined': 0.18641737695793775, 'stategy': 1, 'epoch': 10} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3459025707760525, 'r': 0.3327753384885363, 'f1': 0.3392119988074635}, 'combined': 0.2499456833318152, 'stategy': 1, 'epoch': 10} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3443108757817616, 'r': 0.2926472498006878, 'f1': 0.31638384636936684}, 'combined': 0.1964910203767647, 'stategy': 1, 'epoch': 10} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 10} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3870967741935484, 'r': 0.5217391304347826, 'f1': 0.4444444444444444}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 10} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5208333333333334, 'r': 0.3232758620689655, 'f1': 0.39893617021276595}, 'combined': 0.26595744680851063, 'stategy': 1, 'epoch': 10} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 11 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 19:15:50.316566: step: 4/530, loss: 0.00239155744202435 2023-01-22 19:15:51.404871: step: 8/530, loss: 0.0024033032823354006 2023-01-22 19:15:52.508281: step: 12/530, loss: 0.00449529429897666 2023-01-22 19:15:53.615469: step: 16/530, loss: 0.0058736661449074745 2023-01-22 19:15:54.739003: step: 20/530, loss: 0.00034863376640714705 2023-01-22 19:15:55.826321: step: 24/530, loss: 0.015756824985146523 2023-01-22 19:15:56.904578: step: 28/530, loss: 0.00029133513453416526 2023-01-22 19:15:57.995464: step: 32/530, loss: 0.0010171124013140798 2023-01-22 19:15:59.084778: step: 36/530, loss: 0.005919092800468206 2023-01-22 19:16:00.169227: step: 40/530, loss: 0.0014844770776107907 2023-01-22 19:16:01.251967: step: 44/530, loss: 0.0005742798093706369 2023-01-22 19:16:02.337838: step: 48/530, loss: 0.001526810578070581 2023-01-22 19:16:03.426159: step: 52/530, loss: 0.017103327438235283 2023-01-22 19:16:04.520744: step: 56/530, loss: 0.004896756261587143 2023-01-22 19:16:05.609639: step: 60/530, loss: 0.003529720474034548 2023-01-22 19:16:06.718386: step: 64/530, loss: 0.003721288638189435 2023-01-22 19:16:07.806061: step: 68/530, loss: 0.013919164426624775 2023-01-22 19:16:08.917734: step: 72/530, loss: 0.009428983554244041 2023-01-22 19:16:09.997097: step: 76/530, loss: 0.0020549967885017395 2023-01-22 19:16:11.082933: step: 80/530, loss: 0.0005727734533138573 2023-01-22 19:16:12.175975: step: 84/530, loss: 0.029020557180047035 2023-01-22 19:16:13.287653: step: 88/530, loss: 0.0009710404556244612 2023-01-22 19:16:14.366612: step: 92/530, loss: 0.0140199214220047 2023-01-22 19:16:15.452492: step: 96/530, loss: 0.0027598401065915823 2023-01-22 19:16:16.573154: step: 100/530, loss: 0.002796739572659135 2023-01-22 19:16:17.643076: step: 104/530, loss: 0.0011954504298046231 2023-01-22 19:16:18.746690: step: 108/530, loss: 0.024249127134680748 2023-01-22 19:16:19.875829: step: 112/530, loss: 0.005792188923805952 2023-01-22 19:16:20.946053: step: 116/530, loss: 0.006264966446906328 2023-01-22 19:16:22.024152: step: 120/530, loss: 0.003406588453799486 2023-01-22 19:16:23.105365: step: 124/530, loss: 0.0008385282126255333 2023-01-22 19:16:24.179906: step: 128/530, loss: 0.006097255740314722 2023-01-22 19:16:25.284151: step: 132/530, loss: 0.004822678864002228 2023-01-22 19:16:26.360874: step: 136/530, loss: 0.009024323895573616 2023-01-22 19:16:27.450447: step: 140/530, loss: 0.004446942359209061 2023-01-22 19:16:28.528081: step: 144/530, loss: 0.006993423216044903 2023-01-22 19:16:29.629777: step: 148/530, loss: 0.0014891955070197582 2023-01-22 19:16:30.723302: step: 152/530, loss: 0.0013069381238892674 2023-01-22 19:16:31.829394: step: 156/530, loss: 0.007261795457452536 2023-01-22 19:16:32.896630: step: 160/530, loss: 0.003443314926698804 2023-01-22 19:16:34.018932: step: 164/530, loss: 0.027477990835905075 2023-01-22 19:16:35.112428: step: 168/530, loss: 0.015958357602357864 2023-01-22 19:16:36.212812: step: 172/530, loss: 6.025932634656783e-06 2023-01-22 19:16:37.302867: step: 176/530, loss: 0.0012165606021881104 2023-01-22 19:16:38.393263: step: 180/530, loss: 0.006017171777784824 2023-01-22 19:16:39.458585: step: 184/530, loss: 0.0029329550452530384 2023-01-22 19:16:40.564615: step: 188/530, loss: 0.006054393015801907 2023-01-22 19:16:41.660496: step: 192/530, loss: 0.00127957493532449 2023-01-22 19:16:42.759761: step: 196/530, loss: 0.008293425664305687 2023-01-22 19:16:43.900829: step: 200/530, loss: 0.00937639269977808 2023-01-22 19:16:44.997775: step: 204/530, loss: 0.0019085989333689213 2023-01-22 19:16:46.085092: step: 208/530, loss: 0.001609591068699956 2023-01-22 19:16:47.151626: step: 212/530, loss: 0.0010371814714744687 2023-01-22 19:16:48.237183: step: 216/530, loss: 0.0026844250969588757 2023-01-22 19:16:49.335989: step: 220/530, loss: 0.0048226360231637955 2023-01-22 19:16:50.435442: step: 224/530, loss: 0.04717119038105011 2023-01-22 19:16:51.523322: step: 228/530, loss: 0.007930617779493332 2023-01-22 19:16:52.625823: step: 232/530, loss: 0.00222823116928339 2023-01-22 19:16:53.716671: step: 236/530, loss: 0.004855830688029528 2023-01-22 19:16:54.821839: step: 240/530, loss: 0.023386413231492043 2023-01-22 19:16:55.911796: step: 244/530, loss: 0.008373802527785301 2023-01-22 19:16:57.012620: step: 248/530, loss: 0.00043708784505724907 2023-01-22 19:16:58.089163: step: 252/530, loss: 0.01068387646228075 2023-01-22 19:16:59.173312: step: 256/530, loss: 0.0005089847836643457 2023-01-22 19:17:00.256848: step: 260/530, loss: 0.0026610034983605146 2023-01-22 19:17:01.375219: step: 264/530, loss: 0.00679350271821022 2023-01-22 19:17:02.455460: step: 268/530, loss: 0.00031216413481161 2023-01-22 19:17:03.554894: step: 272/530, loss: 1.621147930563893e-05 2023-01-22 19:17:04.645136: step: 276/530, loss: 0.037259966135025024 2023-01-22 19:17:05.722081: step: 280/530, loss: 0.0030288512352854013 2023-01-22 19:17:06.825325: step: 284/530, loss: 0.003950710874050856 2023-01-22 19:17:07.917095: step: 288/530, loss: 0.006789867766201496 2023-01-22 19:17:09.008219: step: 292/530, loss: 0.009791080839931965 2023-01-22 19:17:10.121361: step: 296/530, loss: 0.010872495360672474 2023-01-22 19:17:11.214638: step: 300/530, loss: 0.0014845393598079681 2023-01-22 19:17:12.289903: step: 304/530, loss: 0.0048056114464998245 2023-01-22 19:17:13.376829: step: 308/530, loss: 0.02465643733739853 2023-01-22 19:17:14.459583: step: 312/530, loss: 0.0028367226477712393 2023-01-22 19:17:15.544547: step: 316/530, loss: 0.0005825771950185299 2023-01-22 19:17:16.643296: step: 320/530, loss: 0.010419790633022785 2023-01-22 19:17:17.741026: step: 324/530, loss: 0.0012331544421613216 2023-01-22 19:17:18.824728: step: 328/530, loss: 0.008323131129145622 2023-01-22 19:17:19.921055: step: 332/530, loss: 0.022704927250742912 2023-01-22 19:17:21.032961: step: 336/530, loss: 0.02240392379462719 2023-01-22 19:17:22.142205: step: 340/530, loss: 0.021398130804300308 2023-01-22 19:17:23.236422: step: 344/530, loss: 0.0019201998366042972 2023-01-22 19:17:24.315839: step: 348/530, loss: 7.556645141448826e-05 2023-01-22 19:17:25.413278: step: 352/530, loss: 0.0010268030455335975 2023-01-22 19:17:26.503651: step: 356/530, loss: 0.001753143034875393 2023-01-22 19:17:27.599371: step: 360/530, loss: 0.001639651134610176 2023-01-22 19:17:28.707199: step: 364/530, loss: 0.0070901173166930676 2023-01-22 19:17:29.799881: step: 368/530, loss: 0.0034733866341412067 2023-01-22 19:17:30.906267: step: 372/530, loss: 0.005018951371312141 2023-01-22 19:17:32.004914: step: 376/530, loss: 0.006167082116007805 2023-01-22 19:17:33.098448: step: 380/530, loss: 0.0006437755655497313 2023-01-22 19:17:34.197236: step: 384/530, loss: 0.01264442503452301 2023-01-22 19:17:35.305321: step: 388/530, loss: 0.004485584329813719 2023-01-22 19:17:36.403249: step: 392/530, loss: 0.0028374779503792524 2023-01-22 19:17:37.504210: step: 396/530, loss: 0.008006450720131397 2023-01-22 19:17:38.609369: step: 400/530, loss: 0.0039567346684634686 2023-01-22 19:17:39.695602: step: 404/530, loss: 0.003176835598424077 2023-01-22 19:17:40.809132: step: 408/530, loss: 0.009895380586385727 2023-01-22 19:17:41.919555: step: 412/530, loss: 0.004642541985958815 2023-01-22 19:17:43.026408: step: 416/530, loss: 0.0030829578172415495 2023-01-22 19:17:44.161798: step: 420/530, loss: 0.0018799740355461836 2023-01-22 19:17:45.252695: step: 424/530, loss: 0.001895493478514254 2023-01-22 19:17:46.344046: step: 428/530, loss: 0.0014667012728750706 2023-01-22 19:17:47.422521: step: 432/530, loss: 0.004194389097392559 2023-01-22 19:17:48.516495: step: 436/530, loss: 0.003689173609018326 2023-01-22 19:17:49.632113: step: 440/530, loss: 0.0014013617765158415 2023-01-22 19:17:50.709341: step: 444/530, loss: 0.00045999078429304063 2023-01-22 19:17:51.806334: step: 448/530, loss: 0.004100313875824213 2023-01-22 19:17:52.898044: step: 452/530, loss: 0.0009114727145060897 2023-01-22 19:17:54.005416: step: 456/530, loss: 0.00012237658665981144 2023-01-22 19:17:55.086119: step: 460/530, loss: 6.0865801060572267e-05 2023-01-22 19:17:56.191328: step: 464/530, loss: 0.0012575997970998287 2023-01-22 19:17:57.303331: step: 468/530, loss: 0.0057510011829435825 2023-01-22 19:17:58.422113: step: 472/530, loss: 0.003288004081696272 2023-01-22 19:17:59.542741: step: 476/530, loss: 0.0033185333013534546 2023-01-22 19:18:00.625530: step: 480/530, loss: 0.015662487596273422 2023-01-22 19:18:01.711410: step: 484/530, loss: 0.043038032948970795 2023-01-22 19:18:02.809229: step: 488/530, loss: 2.1868934709345922e-05 2023-01-22 19:18:03.911120: step: 492/530, loss: 0.004520669113844633 2023-01-22 19:18:04.999157: step: 496/530, loss: 0.016593074426054955 2023-01-22 19:18:06.106276: step: 500/530, loss: 0.007728383876383305 2023-01-22 19:18:07.191228: step: 504/530, loss: 0.003346404992043972 2023-01-22 19:18:08.277509: step: 508/530, loss: 0.003778420854359865 2023-01-22 19:18:09.365941: step: 512/530, loss: 0.0028398719150573015 2023-01-22 19:18:10.457930: step: 516/530, loss: 0.005659664981067181 2023-01-22 19:18:11.571454: step: 520/530, loss: 0.006070531904697418 2023-01-22 19:18:12.669098: step: 524/530, loss: 0.02036793902516365 2023-01-22 19:18:13.754913: step: 528/530, loss: 0.004326016176491976 2023-01-22 19:18:14.830722: step: 532/530, loss: 0.0004810047394130379 2023-01-22 19:18:15.935843: step: 536/530, loss: 0.0028727876488119364 2023-01-22 19:18:16.998512: step: 540/530, loss: 0.0032594348303973675 2023-01-22 19:18:18.077376: step: 544/530, loss: 0.0006257977220229805 2023-01-22 19:18:19.166327: step: 548/530, loss: 0.00021563086193054914 2023-01-22 19:18:20.262495: step: 552/530, loss: 0.013127956539392471 2023-01-22 19:18:21.373055: step: 556/530, loss: 0.008440916426479816 2023-01-22 19:18:22.464139: step: 560/530, loss: 0.005489332601428032 2023-01-22 19:18:23.572724: step: 564/530, loss: 0.0028305230662226677 2023-01-22 19:18:24.649749: step: 568/530, loss: 0.0012131185503676534 2023-01-22 19:18:25.772032: step: 572/530, loss: 0.010537172667682171 2023-01-22 19:18:26.889507: step: 576/530, loss: 0.01680556684732437 2023-01-22 19:18:27.989942: step: 580/530, loss: 0.006243174895644188 2023-01-22 19:18:29.075461: step: 584/530, loss: 4.402376362122595e-05 2023-01-22 19:18:30.188715: step: 588/530, loss: 0.005905324127525091 2023-01-22 19:18:31.290393: step: 592/530, loss: 0.008308203890919685 2023-01-22 19:18:32.395457: step: 596/530, loss: 0.00039306472172029316 2023-01-22 19:18:33.499243: step: 600/530, loss: 0.00035865072277374566 2023-01-22 19:18:34.600506: step: 604/530, loss: 0.006062301807105541 2023-01-22 19:18:35.700378: step: 608/530, loss: 0.0010942736407741904 2023-01-22 19:18:36.804889: step: 612/530, loss: 0.009786644019186497 2023-01-22 19:18:37.896694: step: 616/530, loss: 0.0025595512706786394 2023-01-22 19:18:38.984913: step: 620/530, loss: 0.0029115111101418734 2023-01-22 19:18:40.098074: step: 624/530, loss: 0.018040794879198074 2023-01-22 19:18:41.217969: step: 628/530, loss: 0.003304567653685808 2023-01-22 19:18:42.313475: step: 632/530, loss: 0.001293787150643766 2023-01-22 19:18:43.407720: step: 636/530, loss: 0.06879562884569168 2023-01-22 19:18:44.517472: step: 640/530, loss: 0.013498660176992416 2023-01-22 19:18:45.630747: step: 644/530, loss: 0.010204283520579338 2023-01-22 19:18:46.744253: step: 648/530, loss: 0.0028150181751698256 2023-01-22 19:18:47.832278: step: 652/530, loss: 0.004815452732145786 2023-01-22 19:18:48.960193: step: 656/530, loss: 0.00303437327966094 2023-01-22 19:18:50.058922: step: 660/530, loss: 0.0077403211034834385 2023-01-22 19:18:51.161627: step: 664/530, loss: 0.0003952081024181098 2023-01-22 19:18:52.268443: step: 668/530, loss: 0.017567165195941925 2023-01-22 19:18:53.366179: step: 672/530, loss: 0.0014099651016294956 2023-01-22 19:18:54.487904: step: 676/530, loss: 0.03357509896159172 2023-01-22 19:18:55.602892: step: 680/530, loss: 0.013304296880960464 2023-01-22 19:18:56.713540: step: 684/530, loss: 0.005183124914765358 2023-01-22 19:18:57.828706: step: 688/530, loss: 7.820197060937062e-05 2023-01-22 19:18:58.926132: step: 692/530, loss: 0.009638318791985512 2023-01-22 19:19:00.024531: step: 696/530, loss: 0.0012962538748979568 2023-01-22 19:19:01.096936: step: 700/530, loss: 0.0040832869708538055 2023-01-22 19:19:02.185001: step: 704/530, loss: 0.004653675947338343 2023-01-22 19:19:03.274129: step: 708/530, loss: 0.029797863215208054 2023-01-22 19:19:04.352576: step: 712/530, loss: 0.0036987420171499252 2023-01-22 19:19:05.420048: step: 716/530, loss: 0.003255095798522234 2023-01-22 19:19:06.506606: step: 720/530, loss: 0.0021511369850486517 2023-01-22 19:19:07.564857: step: 724/530, loss: 3.745911817532033e-05 2023-01-22 19:19:08.674246: step: 728/530, loss: 0.00893073808401823 2023-01-22 19:19:09.787138: step: 732/530, loss: 0.004155294504016638 2023-01-22 19:19:10.900869: step: 736/530, loss: 0.004102346021682024 2023-01-22 19:19:12.008341: step: 740/530, loss: 0.013285879977047443 2023-01-22 19:19:13.121361: step: 744/530, loss: 0.0017888894071802497 2023-01-22 19:19:14.195998: step: 748/530, loss: 1.5603556676069275e-05 2023-01-22 19:19:15.276986: step: 752/530, loss: 0.009007218293845654 2023-01-22 19:19:16.412447: step: 756/530, loss: 0.0008521409472450614 2023-01-22 19:19:17.510700: step: 760/530, loss: 0.006173994857817888 2023-01-22 19:19:18.597660: step: 764/530, loss: 0.024529192596673965 2023-01-22 19:19:19.677256: step: 768/530, loss: 0.0004677910765167326 2023-01-22 19:19:20.759522: step: 772/530, loss: 0.014223648235201836 2023-01-22 19:19:21.857478: step: 776/530, loss: 0.03586577996611595 2023-01-22 19:19:22.963476: step: 780/530, loss: 0.005227996036410332 2023-01-22 19:19:24.078542: step: 784/530, loss: 0.005863068159669638 2023-01-22 19:19:25.175050: step: 788/530, loss: 0.010787401348352432 2023-01-22 19:19:26.290665: step: 792/530, loss: 0.0038701503071933985 2023-01-22 19:19:27.390221: step: 796/530, loss: 0.0016628074226900935 2023-01-22 19:19:28.473663: step: 800/530, loss: 5.918848910368979e-05 2023-01-22 19:19:29.607634: step: 804/530, loss: 0.012087317183613777 2023-01-22 19:19:30.697699: step: 808/530, loss: 2.4346105419681408e-05 2023-01-22 19:19:31.781735: step: 812/530, loss: 0.01186387799680233 2023-01-22 19:19:32.889625: step: 816/530, loss: 0.0028141469229012728 2023-01-22 19:19:33.993677: step: 820/530, loss: 0.0012036864645779133 2023-01-22 19:19:35.139593: step: 824/530, loss: 0.006622304208576679 2023-01-22 19:19:36.234552: step: 828/530, loss: 0.0068290564231574535 2023-01-22 19:19:37.335721: step: 832/530, loss: 0.006145627237856388 2023-01-22 19:19:38.401339: step: 836/530, loss: 0.0054101282730698586 2023-01-22 19:19:39.508382: step: 840/530, loss: 0.0026045117992907763 2023-01-22 19:19:40.582673: step: 844/530, loss: 0.0038952401373535395 2023-01-22 19:19:41.682049: step: 848/530, loss: 0.010366232134401798 2023-01-22 19:19:42.788519: step: 852/530, loss: 9.185209637507796e-05 2023-01-22 19:19:43.858454: step: 856/530, loss: 0.009231075644493103 2023-01-22 19:19:44.948547: step: 860/530, loss: 0.004903125576674938 2023-01-22 19:19:46.048208: step: 864/530, loss: 0.006773474160581827 2023-01-22 19:19:47.120944: step: 868/530, loss: 0.0013201372930780053 2023-01-22 19:19:48.237310: step: 872/530, loss: 0.006256154738366604 2023-01-22 19:19:49.337035: step: 876/530, loss: 0.0016541752265766263 2023-01-22 19:19:50.412275: step: 880/530, loss: 6.33298791186121e-09 2023-01-22 19:19:51.503845: step: 884/530, loss: 0.00031882431358098984 2023-01-22 19:19:52.601991: step: 888/530, loss: 0.00876542367041111 2023-01-22 19:19:53.692788: step: 892/530, loss: 0.001780482823960483 2023-01-22 19:19:54.790418: step: 896/530, loss: 0.0004626884183380753 2023-01-22 19:19:55.872467: step: 900/530, loss: 0.003102170303463936 2023-01-22 19:19:56.972356: step: 904/530, loss: 0.012953349389135838 2023-01-22 19:19:58.065165: step: 908/530, loss: 0.0037548686377704144 2023-01-22 19:19:59.170899: step: 912/530, loss: 0.00599473062902689 2023-01-22 19:20:00.256752: step: 916/530, loss: 0.008263442665338516 2023-01-22 19:20:01.376127: step: 920/530, loss: 0.009791245684027672 2023-01-22 19:20:02.483392: step: 924/530, loss: 0.0007159954402595758 2023-01-22 19:20:03.607716: step: 928/530, loss: 0.0031552892178297043 2023-01-22 19:20:04.704495: step: 932/530, loss: 0.010926619172096252 2023-01-22 19:20:05.797567: step: 936/530, loss: 0.00016466010129079223 2023-01-22 19:20:06.875378: step: 940/530, loss: 0.004548830445855856 2023-01-22 19:20:07.956342: step: 944/530, loss: 1.2120547580707353e-05 2023-01-22 19:20:09.047104: step: 948/530, loss: 0.00046599801862612367 2023-01-22 19:20:10.134694: step: 952/530, loss: 0.02845151536166668 2023-01-22 19:20:11.212286: step: 956/530, loss: 0.005994254723191261 2023-01-22 19:20:12.290932: step: 960/530, loss: 0.006463390309363604 2023-01-22 19:20:13.413899: step: 964/530, loss: 8.653848453832325e-06 2023-01-22 19:20:14.512797: step: 968/530, loss: 0.004255854059010744 2023-01-22 19:20:15.644827: step: 972/530, loss: 0.00019908220565412194 2023-01-22 19:20:16.745201: step: 976/530, loss: 0.0021408952306956053 2023-01-22 19:20:17.836287: step: 980/530, loss: 0.0042573981918394566 2023-01-22 19:20:18.938022: step: 984/530, loss: 0.001045731594786048 2023-01-22 19:20:20.057368: step: 988/530, loss: 0.018463417887687683 2023-01-22 19:20:21.140934: step: 992/530, loss: 0.004368930123746395 2023-01-22 19:20:22.247170: step: 996/530, loss: 0.009772378951311111 2023-01-22 19:20:23.316600: step: 1000/530, loss: 1.3300714272190817e-06 2023-01-22 19:20:24.406002: step: 1004/530, loss: 0.007684438023716211 2023-01-22 19:20:25.504202: step: 1008/530, loss: 0.005854856222867966 2023-01-22 19:20:26.596938: step: 1012/530, loss: 0.0027198675088584423 2023-01-22 19:20:27.685779: step: 1016/530, loss: 0.0006460316362790763 2023-01-22 19:20:28.783141: step: 1020/530, loss: 0.010666060261428356 2023-01-22 19:20:29.895381: step: 1024/530, loss: 0.0020747161470353603 2023-01-22 19:20:31.002763: step: 1028/530, loss: 0.0006734076887369156 2023-01-22 19:20:32.094155: step: 1032/530, loss: 0.0025935957673937082 2023-01-22 19:20:33.181714: step: 1036/530, loss: 0.00029823408112861216 2023-01-22 19:20:34.273146: step: 1040/530, loss: 0.00022185847046785057 2023-01-22 19:20:35.360446: step: 1044/530, loss: 0.004975500516593456 2023-01-22 19:20:36.462274: step: 1048/530, loss: 0.0009544325876049697 2023-01-22 19:20:37.557829: step: 1052/530, loss: 0.0026594416704028845 2023-01-22 19:20:38.651273: step: 1056/530, loss: 0.0046880594454705715 2023-01-22 19:20:39.728113: step: 1060/530, loss: 0.0034318624529987574 2023-01-22 19:20:40.825022: step: 1064/530, loss: 0.004394009709358215 2023-01-22 19:20:41.934258: step: 1068/530, loss: 0.0017150972271338105 2023-01-22 19:20:43.018166: step: 1072/530, loss: 0.003705520648509264 2023-01-22 19:20:44.115085: step: 1076/530, loss: 0.00025791017105802894 2023-01-22 19:20:45.185268: step: 1080/530, loss: 0.008437520824372768 2023-01-22 19:20:46.267543: step: 1084/530, loss: 0.0018043089658021927 2023-01-22 19:20:47.374937: step: 1088/530, loss: 0.0013199786189943552 2023-01-22 19:20:48.477516: step: 1092/530, loss: 0.00043355507659725845 2023-01-22 19:20:49.565331: step: 1096/530, loss: 0.000349196809111163 2023-01-22 19:20:50.664517: step: 1100/530, loss: 0.009282906539738178 2023-01-22 19:20:51.749242: step: 1104/530, loss: 0.004893858451396227 2023-01-22 19:20:52.849061: step: 1108/530, loss: 0.0033122492022812366 2023-01-22 19:20:53.940767: step: 1112/530, loss: 0.002883948851376772 2023-01-22 19:20:55.018595: step: 1116/530, loss: 0.0036363275721669197 2023-01-22 19:20:56.133790: step: 1120/530, loss: 0.008871153928339481 2023-01-22 19:20:57.228930: step: 1124/530, loss: 7.155339699238539e-05 2023-01-22 19:20:58.299129: step: 1128/530, loss: 0.005794833414256573 2023-01-22 19:20:59.385684: step: 1132/530, loss: 0.005077144131064415 2023-01-22 19:21:00.479182: step: 1136/530, loss: 0.010705525986850262 2023-01-22 19:21:01.572159: step: 1140/530, loss: 0.009555460885167122 2023-01-22 19:21:02.661282: step: 1144/530, loss: 0.005552574992179871 2023-01-22 19:21:03.771020: step: 1148/530, loss: 0.0025734449736773968 2023-01-22 19:21:04.862155: step: 1152/530, loss: 0.0015987020451575518 2023-01-22 19:21:05.977530: step: 1156/530, loss: 0.00010630020551616326 2023-01-22 19:21:07.090464: step: 1160/530, loss: 0.0025307191535830498 2023-01-22 19:21:08.178751: step: 1164/530, loss: 0.0008618913707323372 2023-01-22 19:21:09.285066: step: 1168/530, loss: 0.006099597085267305 2023-01-22 19:21:10.368058: step: 1172/530, loss: 0.007948421873152256 2023-01-22 19:21:11.425306: step: 1176/530, loss: 0.0004808121011592448 2023-01-22 19:21:12.561567: step: 1180/530, loss: 0.0010332210222259164 2023-01-22 19:21:13.651995: step: 1184/530, loss: 0.0008535869419574738 2023-01-22 19:21:14.748000: step: 1188/530, loss: 0.006233790423721075 2023-01-22 19:21:15.854523: step: 1192/530, loss: 0.02192133106291294 2023-01-22 19:21:16.966881: step: 1196/530, loss: 0.011391752399504185 2023-01-22 19:21:18.057153: step: 1200/530, loss: 0.003326660254970193 2023-01-22 19:21:19.167237: step: 1204/530, loss: 0.000734316126909107 2023-01-22 19:21:20.274033: step: 1208/530, loss: 0.02097994275391102 2023-01-22 19:21:21.396373: step: 1212/530, loss: 0.00789344310760498 2023-01-22 19:21:22.485113: step: 1216/530, loss: 0.0050422088243067265 2023-01-22 19:21:23.614075: step: 1220/530, loss: 0.004294767510145903 2023-01-22 19:21:24.725549: step: 1224/530, loss: 0.006191391032189131 2023-01-22 19:21:25.810719: step: 1228/530, loss: 0.005577748641371727 2023-01-22 19:21:26.948853: step: 1232/530, loss: 0.004371450282633305 2023-01-22 19:21:28.057230: step: 1236/530, loss: 0.011765412986278534 2023-01-22 19:21:29.173899: step: 1240/530, loss: 0.000831493700388819 2023-01-22 19:21:30.276368: step: 1244/530, loss: 0.01249920204281807 2023-01-22 19:21:31.362865: step: 1248/530, loss: 0.019663171842694283 2023-01-22 19:21:32.442284: step: 1252/530, loss: 0.0018935668049380183 2023-01-22 19:21:33.518663: step: 1256/530, loss: 0.006387850269675255 2023-01-22 19:21:34.615381: step: 1260/530, loss: 0.0015770683530718088 2023-01-22 19:21:35.701120: step: 1264/530, loss: 0.005411600228399038 2023-01-22 19:21:36.787434: step: 1268/530, loss: 4.197704765829258e-05 2023-01-22 19:21:37.894603: step: 1272/530, loss: 0.01857392117381096 2023-01-22 19:21:38.965246: step: 1276/530, loss: 0.0004069058923050761 2023-01-22 19:21:40.048107: step: 1280/530, loss: 0.0006431051297113299 2023-01-22 19:21:41.148082: step: 1284/530, loss: 0.0032634944655001163 2023-01-22 19:21:42.242507: step: 1288/530, loss: 0.0011680993484333158 2023-01-22 19:21:43.314540: step: 1292/530, loss: 0.005447241012006998 2023-01-22 19:21:44.414375: step: 1296/530, loss: 0.005970741622149944 2023-01-22 19:21:45.511850: step: 1300/530, loss: 0.00038607389433309436 2023-01-22 19:21:46.635199: step: 1304/530, loss: 0.00487444456666708 2023-01-22 19:21:47.730485: step: 1308/530, loss: 0.005848734173923731 2023-01-22 19:21:48.819196: step: 1312/530, loss: 5.818076169816777e-05 2023-01-22 19:21:49.931579: step: 1316/530, loss: 0.0035178440157324076 2023-01-22 19:21:51.031163: step: 1320/530, loss: 0.0018739523366093636 2023-01-22 19:21:52.111711: step: 1324/530, loss: 0.0007567688589915633 2023-01-22 19:21:53.191094: step: 1328/530, loss: 0.006811899598687887 2023-01-22 19:21:54.259074: step: 1332/530, loss: 0.004004851449280977 2023-01-22 19:21:55.359188: step: 1336/530, loss: 0.004442003555595875 2023-01-22 19:21:56.476053: step: 1340/530, loss: 0.015975134447216988 2023-01-22 19:21:57.567544: step: 1344/530, loss: 0.0005995518295094371 2023-01-22 19:21:58.669700: step: 1348/530, loss: 0.0031597898341715336 2023-01-22 19:21:59.765704: step: 1352/530, loss: 0.004254691768437624 2023-01-22 19:22:00.880656: step: 1356/530, loss: 0.00034919148311018944 2023-01-22 19:22:01.979666: step: 1360/530, loss: 0.011843032203614712 2023-01-22 19:22:03.058910: step: 1364/530, loss: 0.0016121385851874948 2023-01-22 19:22:04.150723: step: 1368/530, loss: 0.0023107873275876045 2023-01-22 19:22:05.242815: step: 1372/530, loss: 0.0034817068371921778 2023-01-22 19:22:06.347569: step: 1376/530, loss: 0.002137373900040984 2023-01-22 19:22:07.435741: step: 1380/530, loss: 7.509499846491963e-05 2023-01-22 19:22:08.533673: step: 1384/530, loss: 0.004698347765952349 2023-01-22 19:22:09.627264: step: 1388/530, loss: 0.00018029357306659222 2023-01-22 19:22:10.719563: step: 1392/530, loss: 1.0746311090770178e-05 2023-01-22 19:22:11.820496: step: 1396/530, loss: 0.0019366234773769975 2023-01-22 19:22:12.908026: step: 1400/530, loss: 0.0004704426391981542 2023-01-22 19:22:13.993376: step: 1404/530, loss: 0.00199788436293602 2023-01-22 19:22:15.095648: step: 1408/530, loss: 0.0003137617895845324 2023-01-22 19:22:16.163499: step: 1412/530, loss: 0.0022457896266132593 2023-01-22 19:22:17.271911: step: 1416/530, loss: 0.00045267504174262285 2023-01-22 19:22:18.365036: step: 1420/530, loss: 0.0009092573309317231 2023-01-22 19:22:19.457895: step: 1424/530, loss: 0.0020866524428129196 2023-01-22 19:22:20.551401: step: 1428/530, loss: 0.0017698314040899277 2023-01-22 19:22:21.629464: step: 1432/530, loss: 0.013435174711048603 2023-01-22 19:22:22.733315: step: 1436/530, loss: 0.001993982819840312 2023-01-22 19:22:23.833520: step: 1440/530, loss: 0.011218621395528316 2023-01-22 19:22:24.933514: step: 1444/530, loss: 0.0002953499788418412 2023-01-22 19:22:26.045529: step: 1448/530, loss: 0.011713948100805283 2023-01-22 19:22:27.119818: step: 1452/530, loss: 0.0015478963032364845 2023-01-22 19:22:28.222086: step: 1456/530, loss: 0.0025427218060940504 2023-01-22 19:22:29.317087: step: 1460/530, loss: 0.0034042673651129007 2023-01-22 19:22:30.428146: step: 1464/530, loss: 0.0023622673470526934 2023-01-22 19:22:31.510870: step: 1468/530, loss: 0.0025987448170781136 2023-01-22 19:22:32.642445: step: 1472/530, loss: 0.0009625330567359924 2023-01-22 19:22:33.730848: step: 1476/530, loss: 0.002376854419708252 2023-01-22 19:22:34.818306: step: 1480/530, loss: 0.012599444016814232 2023-01-22 19:22:35.910468: step: 1484/530, loss: 0.00047750273370184004 2023-01-22 19:22:37.015425: step: 1488/530, loss: 0.001846915460191667 2023-01-22 19:22:38.099666: step: 1492/530, loss: 0.006273969076573849 2023-01-22 19:22:39.206309: step: 1496/530, loss: 0.001010268577374518 2023-01-22 19:22:40.315087: step: 1500/530, loss: 0.006716223433613777 2023-01-22 19:22:41.391006: step: 1504/530, loss: 0.008409428410232067 2023-01-22 19:22:42.487933: step: 1508/530, loss: 0.004951608367264271 2023-01-22 19:22:43.590879: step: 1512/530, loss: 0.000355736498022452 2023-01-22 19:22:44.679973: step: 1516/530, loss: 0.0029275112319737673 2023-01-22 19:22:45.772971: step: 1520/530, loss: 0.005963629111647606 2023-01-22 19:22:46.880153: step: 1524/530, loss: 0.0038211403880268335 2023-01-22 19:22:47.965719: step: 1528/530, loss: 0.001565816579386592 2023-01-22 19:22:49.062062: step: 1532/530, loss: 0.012257400900125504 2023-01-22 19:22:50.159035: step: 1536/530, loss: 0.01185611356049776 2023-01-22 19:22:51.232779: step: 1540/530, loss: 0.0008904370479285717 2023-01-22 19:22:52.307023: step: 1544/530, loss: 0.00985379982739687 2023-01-22 19:22:53.365219: step: 1548/530, loss: 0.0004087619890924543 2023-01-22 19:22:54.467213: step: 1552/530, loss: 0.005597870796918869 2023-01-22 19:22:55.545878: step: 1556/530, loss: 0.015355966053903103 2023-01-22 19:22:56.670352: step: 1560/530, loss: 0.0043082330375909805 2023-01-22 19:22:57.762608: step: 1564/530, loss: 0.004766838625073433 2023-01-22 19:22:58.840783: step: 1568/530, loss: 0.00024223816581070423 2023-01-22 19:22:59.939340: step: 1572/530, loss: 0.006220538634806871 2023-01-22 19:23:01.035877: step: 1576/530, loss: 0.00019033053831662983 2023-01-22 19:23:02.123179: step: 1580/530, loss: 0.0019313825760036707 2023-01-22 19:23:03.200734: step: 1584/530, loss: 0.01158900000154972 2023-01-22 19:23:04.298081: step: 1588/530, loss: 0.009623370133340359 2023-01-22 19:23:05.385586: step: 1592/530, loss: 0.006437897682189941 2023-01-22 19:23:06.469900: step: 1596/530, loss: 0.0010151652386412024 2023-01-22 19:23:07.561257: step: 1600/530, loss: 0.004753860179334879 2023-01-22 19:23:08.648729: step: 1604/530, loss: 0.01348473783582449 2023-01-22 19:23:09.766580: step: 1608/530, loss: 0.002250124467536807 2023-01-22 19:23:10.854746: step: 1612/530, loss: 0.007330153603106737 2023-01-22 19:23:11.965242: step: 1616/530, loss: 0.007058130577206612 2023-01-22 19:23:13.065167: step: 1620/530, loss: 0.0014252610271796584 2023-01-22 19:23:14.144323: step: 1624/530, loss: 0.007356412708759308 2023-01-22 19:23:15.229768: step: 1628/530, loss: 0.00017888860020320863 2023-01-22 19:23:16.315652: step: 1632/530, loss: 0.0006667135166935623 2023-01-22 19:23:17.395435: step: 1636/530, loss: 0.011095312424004078 2023-01-22 19:23:18.488903: step: 1640/530, loss: 0.002226361073553562 2023-01-22 19:23:19.594083: step: 1644/530, loss: 0.01689758151769638 2023-01-22 19:23:20.689382: step: 1648/530, loss: 0.0012102712644264102 2023-01-22 19:23:21.790229: step: 1652/530, loss: 8.18850749055855e-05 2023-01-22 19:23:22.884383: step: 1656/530, loss: 1.2423811313055921e-05 2023-01-22 19:23:23.976890: step: 1660/530, loss: 0.003003004938364029 2023-01-22 19:23:25.088966: step: 1664/530, loss: 0.005219044629484415 2023-01-22 19:23:26.186223: step: 1668/530, loss: 0.020767422392964363 2023-01-22 19:23:27.281880: step: 1672/530, loss: 0.003036527195945382 2023-01-22 19:23:28.359704: step: 1676/530, loss: 1.7686797946225852e-06 2023-01-22 19:23:29.448925: step: 1680/530, loss: 0.007433051709085703 2023-01-22 19:23:30.533186: step: 1684/530, loss: 0.029139313846826553 2023-01-22 19:23:31.686604: step: 1688/530, loss: 0.0010811605025082827 2023-01-22 19:23:32.818874: step: 1692/530, loss: 0.011061285622417927 2023-01-22 19:23:33.914042: step: 1696/530, loss: 0.02029518224298954 2023-01-22 19:23:35.032822: step: 1700/530, loss: 0.00505274161696434 2023-01-22 19:23:36.149071: step: 1704/530, loss: 0.00032734230626374483 2023-01-22 19:23:37.246956: step: 1708/530, loss: 0.009157164953649044 2023-01-22 19:23:38.367664: step: 1712/530, loss: 0.0028398402500897646 2023-01-22 19:23:39.462367: step: 1716/530, loss: 0.017813021317124367 2023-01-22 19:23:40.561002: step: 1720/530, loss: 0.002479216083884239 2023-01-22 19:23:41.673415: step: 1724/530, loss: 0.01330887246876955 2023-01-22 19:23:42.785912: step: 1728/530, loss: 0.019950294867157936 2023-01-22 19:23:43.907506: step: 1732/530, loss: 0.006393796298652887 2023-01-22 19:23:44.995837: step: 1736/530, loss: 0.0022322724107652903 2023-01-22 19:23:46.103914: step: 1740/530, loss: 0.008349602110683918 2023-01-22 19:23:47.198478: step: 1744/530, loss: 0.006456011440604925 2023-01-22 19:23:48.308227: step: 1748/530, loss: 0.005218730308115482 2023-01-22 19:23:49.419577: step: 1752/530, loss: 0.0004118007782381028 2023-01-22 19:23:50.517338: step: 1756/530, loss: 7.621573604410514e-05 2023-01-22 19:23:51.630634: step: 1760/530, loss: 4.565552080748603e-05 2023-01-22 19:23:52.728238: step: 1764/530, loss: 0.002926686080172658 2023-01-22 19:23:53.836960: step: 1768/530, loss: 0.015068943612277508 2023-01-22 19:23:54.932176: step: 1772/530, loss: 0.0015271228039637208 2023-01-22 19:23:56.015832: step: 1776/530, loss: 0.0038208412006497383 2023-01-22 19:23:57.106578: step: 1780/530, loss: 0.004268140997737646 2023-01-22 19:23:58.196564: step: 1784/530, loss: 0.0007785434718243778 2023-01-22 19:23:59.283487: step: 1788/530, loss: 0.0037303471472114325 2023-01-22 19:24:00.386545: step: 1792/530, loss: 0.005979621782898903 2023-01-22 19:24:01.502071: step: 1796/530, loss: 0.002793046645820141 2023-01-22 19:24:02.608560: step: 1800/530, loss: 0.012062052264809608 2023-01-22 19:24:03.699896: step: 1804/530, loss: 0.0011541249696165323 2023-01-22 19:24:04.819368: step: 1808/530, loss: 0.007963895797729492 2023-01-22 19:24:05.915597: step: 1812/530, loss: 0.0011873121839016676 2023-01-22 19:24:07.012496: step: 1816/530, loss: 0.007192743010818958 2023-01-22 19:24:08.108561: step: 1820/530, loss: 0.0008395753684453666 2023-01-22 19:24:09.185618: step: 1824/530, loss: 0.00234224577434361 2023-01-22 19:24:10.280432: step: 1828/530, loss: 0.0017208369681611657 2023-01-22 19:24:11.385084: step: 1832/530, loss: 0.002837186912074685 2023-01-22 19:24:12.497853: step: 1836/530, loss: 0.0008313122089020908 2023-01-22 19:24:13.585107: step: 1840/530, loss: 0.00895564816892147 2023-01-22 19:24:14.711135: step: 1844/530, loss: 0.0036113779060542583 2023-01-22 19:24:15.804264: step: 1848/530, loss: 0.007410169579088688 2023-01-22 19:24:16.893550: step: 1852/530, loss: 0.007057948503643274 2023-01-22 19:24:17.988512: step: 1856/530, loss: 0.007463072892278433 2023-01-22 19:24:19.078208: step: 1860/530, loss: 0.00016262877034023404 2023-01-22 19:24:20.176909: step: 1864/530, loss: 0.0015687368577346206 2023-01-22 19:24:21.261432: step: 1868/530, loss: 0.0016334542306140065 2023-01-22 19:24:22.337812: step: 1872/530, loss: 0.016074128448963165 2023-01-22 19:24:23.456971: step: 1876/530, loss: 0.00044986631837673485 2023-01-22 19:24:24.542323: step: 1880/530, loss: 0.019057132303714752 2023-01-22 19:24:25.641464: step: 1884/530, loss: 0.012813219800591469 2023-01-22 19:24:26.706637: step: 1888/530, loss: 0.0030455824453383684 2023-01-22 19:24:27.809680: step: 1892/530, loss: 0.003639615373685956 2023-01-22 19:24:28.897824: step: 1896/530, loss: 0.010136867873370647 2023-01-22 19:24:29.989485: step: 1900/530, loss: 0.0009270050213672221 2023-01-22 19:24:31.108400: step: 1904/530, loss: 0.0039407857693731785 2023-01-22 19:24:32.201848: step: 1908/530, loss: 0.007624221034348011 2023-01-22 19:24:33.283369: step: 1912/530, loss: 0.00032158478279598057 2023-01-22 19:24:34.380955: step: 1916/530, loss: 0.001729368232190609 2023-01-22 19:24:35.472641: step: 1920/530, loss: 0.0038076473865658045 2023-01-22 19:24:36.554689: step: 1924/530, loss: 0.014754346571862698 2023-01-22 19:24:37.632423: step: 1928/530, loss: 0.001312493928708136 2023-01-22 19:24:38.716781: step: 1932/530, loss: 0.0017326330998912454 2023-01-22 19:24:39.815770: step: 1936/530, loss: 0.0005827595014125109 2023-01-22 19:24:40.899648: step: 1940/530, loss: 0.023289987817406654 2023-01-22 19:24:42.036929: step: 1944/530, loss: 0.005664709024131298 2023-01-22 19:24:43.137901: step: 1948/530, loss: 0.003145907074213028 2023-01-22 19:24:44.226925: step: 1952/530, loss: 0.002479083836078644 2023-01-22 19:24:45.323108: step: 1956/530, loss: 0.0008014517952688038 2023-01-22 19:24:46.422224: step: 1960/530, loss: 0.004337603226304054 2023-01-22 19:24:47.524454: step: 1964/530, loss: 0.00604652613401413 2023-01-22 19:24:48.619779: step: 1968/530, loss: 0.003832897637039423 2023-01-22 19:24:49.724919: step: 1972/530, loss: 0.0075946287252008915 2023-01-22 19:24:50.790789: step: 1976/530, loss: 0.009812133386731148 2023-01-22 19:24:51.916528: step: 1980/530, loss: 0.007179032079875469 2023-01-22 19:24:53.007931: step: 1984/530, loss: 0.0017271579708904028 2023-01-22 19:24:54.139288: step: 1988/530, loss: 0.0038227015174925327 2023-01-22 19:24:55.243427: step: 1992/530, loss: 7.549358997493982e-05 2023-01-22 19:24:56.360256: step: 1996/530, loss: 6.163866714814503e-07 2023-01-22 19:24:57.465867: step: 2000/530, loss: 0.010236179456114769 2023-01-22 19:24:58.574117: step: 2004/530, loss: 0.005936293862760067 2023-01-22 19:24:59.671617: step: 2008/530, loss: 0.0025672833435237408 2023-01-22 19:25:00.780328: step: 2012/530, loss: 0.0037847773637622595 2023-01-22 19:25:01.879067: step: 2016/530, loss: 0.00466605881229043 2023-01-22 19:25:02.992447: step: 2020/530, loss: 0.0016953644808381796 2023-01-22 19:25:04.099379: step: 2024/530, loss: 0.014948712661862373 2023-01-22 19:25:05.189171: step: 2028/530, loss: 0.0059296446852386 2023-01-22 19:25:06.276363: step: 2032/530, loss: 0.001659872941672802 2023-01-22 19:25:07.396278: step: 2036/530, loss: 0.0009222202352248132 2023-01-22 19:25:08.492821: step: 2040/530, loss: 0.006768266204744577 2023-01-22 19:25:09.595148: step: 2044/530, loss: 0.003870441345497966 2023-01-22 19:25:10.726846: step: 2048/530, loss: 0.0004518051282502711 2023-01-22 19:25:11.874526: step: 2052/530, loss: 0.0002215412532677874 2023-01-22 19:25:12.967589: step: 2056/530, loss: 0.004906861577183008 2023-01-22 19:25:14.062433: step: 2060/530, loss: 0.0025891445111483335 2023-01-22 19:25:15.144058: step: 2064/530, loss: 0.012634353712201118 2023-01-22 19:25:16.244828: step: 2068/530, loss: 0.009332558140158653 2023-01-22 19:25:17.333604: step: 2072/530, loss: 0.004877055063843727 2023-01-22 19:25:18.436531: step: 2076/530, loss: 0.002650513779371977 2023-01-22 19:25:19.540310: step: 2080/530, loss: 0.0016186363063752651 2023-01-22 19:25:20.646521: step: 2084/530, loss: 0.07312414795160294 2023-01-22 19:25:21.767478: step: 2088/530, loss: 0.003823396749794483 2023-01-22 19:25:22.865602: step: 2092/530, loss: 0.00966161023825407 2023-01-22 19:25:23.975155: step: 2096/530, loss: 0.002313487231731415 2023-01-22 19:25:25.065456: step: 2100/530, loss: 0.0001693515368970111 2023-01-22 19:25:26.169570: step: 2104/530, loss: 0.010704522021114826 2023-01-22 19:25:27.264373: step: 2108/530, loss: 0.00025611446471884847 2023-01-22 19:25:28.381742: step: 2112/530, loss: 0.004219945054501295 2023-01-22 19:25:29.494881: step: 2116/530, loss: 0.0009405352175235748 2023-01-22 19:25:30.580467: step: 2120/530, loss: 0.004256460350006819 ================================================== Loss: 0.006 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3395630289817902, 'r': 0.3588929926809433, 'f1': 0.3489605297838692}, 'combined': 0.25712881141969307, 'stategy': 1, 'epoch': 11} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3375376289678138, 'r': 0.2877917271713704, 'f1': 0.3106859969783828}, 'combined': 0.19295235601815353, 'stategy': 1, 'epoch': 11} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34763654625437984, 'r': 0.3436786349118252, 'f1': 0.34564626068422116}, 'combined': 0.2546867183988998, 'stategy': 1, 'epoch': 11} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.32501668097194036, 'r': 0.2893323569483149, 'f1': 0.30613816104107416}, 'combined': 0.1901279105412987, 'stategy': 1, 'epoch': 11} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33980827437688704, 'r': 0.3275571221697507, 'f1': 0.333570248083978}, 'combined': 0.2457886038513522, 'stategy': 1, 'epoch': 11} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3480855563857105, 'r': 0.2958555420020698, 'f1': 0.3198523629115227}, 'combined': 0.1986451517029457, 'stategy': 1, 'epoch': 11} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3138888888888889, 'r': 0.4035714285714286, 'f1': 0.35312499999999997}, 'combined': 0.23541666666666664, 'stategy': 1, 'epoch': 11} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3870967741935484, 'r': 0.5217391304347826, 'f1': 0.4444444444444444}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 11} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 11} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 12 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 19:28:05.081538: step: 4/530, loss: 0.0013282769359648228 2023-01-22 19:28:06.195232: step: 8/530, loss: 0.0007166077848523855 2023-01-22 19:28:07.293938: step: 12/530, loss: 0.0026112738996744156 2023-01-22 19:28:08.369796: step: 16/530, loss: 0.002682651858776808 2023-01-22 19:28:09.454423: step: 20/530, loss: 0.011102957651019096 2023-01-22 19:28:10.562404: step: 24/530, loss: 0.006892113015055656 2023-01-22 19:28:11.679198: step: 28/530, loss: 0.012931205332279205 2023-01-22 19:28:12.789488: step: 32/530, loss: 0.0017117051174864173 2023-01-22 19:28:13.860191: step: 36/530, loss: 0.004092513117939234 2023-01-22 19:28:14.937717: step: 40/530, loss: 0.009882969781756401 2023-01-22 19:28:16.046865: step: 44/530, loss: 0.0014846251579001546 2023-01-22 19:28:17.126480: step: 48/530, loss: 0.00927084218710661 2023-01-22 19:28:18.219675: step: 52/530, loss: 0.004552260506898165 2023-01-22 19:28:19.306984: step: 56/530, loss: 0.0007692054496146739 2023-01-22 19:28:20.400312: step: 60/530, loss: 0.00425350246950984 2023-01-22 19:28:21.499198: step: 64/530, loss: 0.0004158757801633328 2023-01-22 19:28:22.589199: step: 68/530, loss: 0.022751739248633385 2023-01-22 19:28:23.698259: step: 72/530, loss: 0.008947727270424366 2023-01-22 19:28:24.787482: step: 76/530, loss: 0.0019416005816310644 2023-01-22 19:28:25.877065: step: 80/530, loss: 0.004187324084341526 2023-01-22 19:28:26.968117: step: 84/530, loss: 0.004844694398343563 2023-01-22 19:28:28.061441: step: 88/530, loss: 0.0013403381453827024 2023-01-22 19:28:29.169776: step: 92/530, loss: 0.003545124549418688 2023-01-22 19:28:30.248286: step: 96/530, loss: 0.003108375705778599 2023-01-22 19:28:31.350380: step: 100/530, loss: 0.0016596417408436537 2023-01-22 19:28:32.454713: step: 104/530, loss: 0.007822801358997822 2023-01-22 19:28:33.595145: step: 108/530, loss: 0.00777782266959548 2023-01-22 19:28:34.680648: step: 112/530, loss: 0.0015431058127433062 2023-01-22 19:28:35.772290: step: 116/530, loss: 0.0021872520446777344 2023-01-22 19:28:36.845780: step: 120/530, loss: 0.0036428936291486025 2023-01-22 19:28:37.950110: step: 124/530, loss: 0.005377375520765781 2023-01-22 19:28:39.037309: step: 128/530, loss: 0.0025357420090585947 2023-01-22 19:28:40.137587: step: 132/530, loss: 0.02607816830277443 2023-01-22 19:28:41.226984: step: 136/530, loss: 0.013520168140530586 2023-01-22 19:28:42.324671: step: 140/530, loss: 0.004857353866100311 2023-01-22 19:28:43.402243: step: 144/530, loss: 0.008640473708510399 2023-01-22 19:28:44.490056: step: 148/530, loss: 0.00011588572670007125 2023-01-22 19:28:45.561870: step: 152/530, loss: 0.02487765997648239 2023-01-22 19:28:46.661780: step: 156/530, loss: 0.0005496989469975233 2023-01-22 19:28:47.775361: step: 160/530, loss: 0.1543724536895752 2023-01-22 19:28:48.859206: step: 164/530, loss: 0.03956758230924606 2023-01-22 19:28:49.938995: step: 168/530, loss: 0.0032563696149736643 2023-01-22 19:28:51.014601: step: 172/530, loss: 0.0015266978880390525 2023-01-22 19:28:52.116273: step: 176/530, loss: 0.0021048292983323336 2023-01-22 19:28:53.202884: step: 180/530, loss: 0.004921151790767908 2023-01-22 19:28:54.319287: step: 184/530, loss: 0.005682270508259535 2023-01-22 19:28:55.410687: step: 188/530, loss: 0.0022502427455037832 2023-01-22 19:28:56.501327: step: 192/530, loss: 1.6228532331297174e-05 2023-01-22 19:28:57.613784: step: 196/530, loss: 0.0027154642157256603 2023-01-22 19:28:58.718302: step: 200/530, loss: 0.002484674099832773 2023-01-22 19:28:59.807682: step: 204/530, loss: 0.0002948844921775162 2023-01-22 19:29:00.928811: step: 208/530, loss: 0.0031943190842866898 2023-01-22 19:29:02.009244: step: 212/530, loss: 8.710770634934306e-05 2023-01-22 19:29:03.112151: step: 216/530, loss: 0.0020512444898486137 2023-01-22 19:29:04.198007: step: 220/530, loss: 0.017200758680701256 2023-01-22 19:29:05.280392: step: 224/530, loss: 0.01049842406064272 2023-01-22 19:29:06.387802: step: 228/530, loss: 0.0007387291407212615 2023-01-22 19:29:07.491692: step: 232/530, loss: 0.000985565478913486 2023-01-22 19:29:08.580377: step: 236/530, loss: 0.0007848618552088737 2023-01-22 19:29:09.686836: step: 240/530, loss: 0.001021631876938045 2023-01-22 19:29:10.766633: step: 244/530, loss: 0.000648330373223871 2023-01-22 19:29:11.862303: step: 248/530, loss: 0.004050981253385544 2023-01-22 19:29:12.924927: step: 252/530, loss: 0.0004885526141151786 2023-01-22 19:29:14.012885: step: 256/530, loss: 0.0004767110222019255 2023-01-22 19:29:15.095702: step: 260/530, loss: 0.0030144068878144026 2023-01-22 19:29:16.186413: step: 264/530, loss: 0.004344135522842407 2023-01-22 19:29:17.297805: step: 268/530, loss: 0.008200027979910374 2023-01-22 19:29:18.362456: step: 272/530, loss: 0.001755343982949853 2023-01-22 19:29:19.468698: step: 276/530, loss: 0.010060666128993034 2023-01-22 19:29:20.588613: step: 280/530, loss: 0.003028949024155736 2023-01-22 19:29:21.668390: step: 284/530, loss: 0.0060416641645133495 2023-01-22 19:29:22.758568: step: 288/530, loss: 0.000583796645514667 2023-01-22 19:29:23.851695: step: 292/530, loss: 0.005627032835036516 2023-01-22 19:29:24.934496: step: 296/530, loss: 0.0018009231425821781 2023-01-22 19:29:26.028208: step: 300/530, loss: 0.0006026829360052943 2023-01-22 19:29:27.118957: step: 304/530, loss: 0.001971691381186247 2023-01-22 19:29:28.238247: step: 308/530, loss: 0.0015901505248621106 2023-01-22 19:29:29.328433: step: 312/530, loss: 0.005434457678347826 2023-01-22 19:29:30.419417: step: 316/530, loss: 0.003684228053316474 2023-01-22 19:29:31.529218: step: 320/530, loss: 0.0007053037988953292 2023-01-22 19:29:32.617696: step: 324/530, loss: 0.004026405513286591 2023-01-22 19:29:33.718806: step: 328/530, loss: 0.008272100239992142 2023-01-22 19:29:34.811586: step: 332/530, loss: 0.0007523755193687975 2023-01-22 19:29:35.915310: step: 336/530, loss: 0.0008887725416570902 2023-01-22 19:29:37.005639: step: 340/530, loss: 0.0002869265154004097 2023-01-22 19:29:38.079261: step: 344/530, loss: 0.001409532269462943 2023-01-22 19:29:39.167750: step: 348/530, loss: 0.0014691234100610018 2023-01-22 19:29:40.252731: step: 352/530, loss: 0.003308819606900215 2023-01-22 19:29:41.337751: step: 356/530, loss: 0.0070055099204182625 2023-01-22 19:29:42.426828: step: 360/530, loss: 0.003059013281017542 2023-01-22 19:29:43.536758: step: 364/530, loss: 0.007416489068418741 2023-01-22 19:29:44.612489: step: 368/530, loss: 0.0035310243256390095 2023-01-22 19:29:45.709104: step: 372/530, loss: 0.0044801486656069756 2023-01-22 19:29:46.800262: step: 376/530, loss: 0.005069028586149216 2023-01-22 19:29:47.898636: step: 380/530, loss: 0.002067211549729109 2023-01-22 19:29:48.985402: step: 384/530, loss: 0.003478986443951726 2023-01-22 19:29:50.067223: step: 388/530, loss: 0.01598384976387024 2023-01-22 19:29:51.161203: step: 392/530, loss: 0.00575635302811861 2023-01-22 19:29:52.257970: step: 396/530, loss: 0.002196107292547822 2023-01-22 19:29:53.377417: step: 400/530, loss: 0.0021438344847410917 2023-01-22 19:29:54.490627: step: 404/530, loss: 0.006238223053514957 2023-01-22 19:29:55.608643: step: 408/530, loss: 0.007764538284391165 2023-01-22 19:29:56.714413: step: 412/530, loss: 0.0026912125758826733 2023-01-22 19:29:57.819726: step: 416/530, loss: 0.010484520345926285 2023-01-22 19:29:58.920760: step: 420/530, loss: 5.424030314316042e-05 2023-01-22 19:30:00.012871: step: 424/530, loss: 0.0010154732735827565 2023-01-22 19:30:01.096701: step: 428/530, loss: 0.002305225934833288 2023-01-22 19:30:02.209370: step: 432/530, loss: 0.0016883363714441657 2023-01-22 19:30:03.294175: step: 436/530, loss: 0.0029265927150845528 2023-01-22 19:30:04.377898: step: 440/530, loss: 0.0022073877044022083 2023-01-22 19:30:05.465088: step: 444/530, loss: 0.0016494240844622254 2023-01-22 19:30:06.541249: step: 448/530, loss: 0.0059205531142652035 2023-01-22 19:30:07.662548: step: 452/530, loss: 0.00023701814643573016 2023-01-22 19:30:08.739218: step: 456/530, loss: 0.0005892252665944397 2023-01-22 19:30:09.825742: step: 460/530, loss: 0.006177544128149748 2023-01-22 19:30:10.933227: step: 464/530, loss: 0.0038924363907426596 2023-01-22 19:30:12.039680: step: 468/530, loss: 0.005065560340881348 2023-01-22 19:30:13.155871: step: 472/530, loss: 0.007990981452167034 2023-01-22 19:30:14.236988: step: 476/530, loss: 0.0005420101806521416 2023-01-22 19:30:15.315965: step: 480/530, loss: 0.0004488943668548018 2023-01-22 19:30:16.376413: step: 484/530, loss: 0.003811345435678959 2023-01-22 19:30:17.479145: step: 488/530, loss: 0.00531365629285574 2023-01-22 19:30:18.586590: step: 492/530, loss: 0.004253334831446409 2023-01-22 19:30:19.717591: step: 496/530, loss: 0.0015755154890939593 2023-01-22 19:30:20.811191: step: 500/530, loss: 0.003367781639099121 2023-01-22 19:30:21.904430: step: 504/530, loss: 0.006671552546322346 2023-01-22 19:30:23.001032: step: 508/530, loss: 0.005226884502917528 2023-01-22 19:30:24.113622: step: 512/530, loss: 0.024795377627015114 2023-01-22 19:30:25.209417: step: 516/530, loss: 2.29196803047671e-06 2023-01-22 19:30:26.312743: step: 520/530, loss: 0.011250624433159828 2023-01-22 19:30:27.413384: step: 524/530, loss: 0.003432190278545022 2023-01-22 19:30:28.518074: step: 528/530, loss: 0.009041900746524334 2023-01-22 19:30:29.612983: step: 532/530, loss: 3.596556416596286e-05 2023-01-22 19:30:30.692619: step: 536/530, loss: 0.011411798186600208 2023-01-22 19:30:31.809332: step: 540/530, loss: 0.004180583171546459 2023-01-22 19:30:32.871320: step: 544/530, loss: 5.783369124401361e-05 2023-01-22 19:30:33.960919: step: 548/530, loss: 0.011810092255473137 2023-01-22 19:30:35.074230: step: 552/530, loss: 0.0012022400042042136 2023-01-22 19:30:36.174893: step: 556/530, loss: 0.0031371568329632282 2023-01-22 19:30:37.294956: step: 560/530, loss: 0.0029107872396707535 2023-01-22 19:30:38.400777: step: 564/530, loss: 0.00022597539646085352 2023-01-22 19:30:39.502644: step: 568/530, loss: 0.0030135330744087696 2023-01-22 19:30:40.588683: step: 572/530, loss: 0.00741279823705554 2023-01-22 19:30:41.698087: step: 576/530, loss: 0.007068963255733252 2023-01-22 19:30:42.816209: step: 580/530, loss: 0.00439951429143548 2023-01-22 19:30:43.912359: step: 584/530, loss: 0.0007739784196019173 2023-01-22 19:30:45.016125: step: 588/530, loss: 0.009545059874653816 2023-01-22 19:30:46.099361: step: 592/530, loss: 0.02392938733100891 2023-01-22 19:30:47.180937: step: 596/530, loss: 0.0012618659529834986 2023-01-22 19:30:48.281212: step: 600/530, loss: 0.002825401956215501 2023-01-22 19:30:49.380753: step: 604/530, loss: 0.003480615559965372 2023-01-22 19:30:50.479337: step: 608/530, loss: 0.011056671850383282 2023-01-22 19:30:51.568374: step: 612/530, loss: 5.0333917897660285e-05 2023-01-22 19:30:52.665765: step: 616/530, loss: 0.012612312100827694 2023-01-22 19:30:53.756139: step: 620/530, loss: 0.0015372501220554113 2023-01-22 19:30:54.858299: step: 624/530, loss: 0.0004818023007828742 2023-01-22 19:30:55.932236: step: 628/530, loss: 0.012534980662167072 2023-01-22 19:30:57.061336: step: 632/530, loss: 0.0032857495825737715 2023-01-22 19:30:58.151398: step: 636/530, loss: 0.0020048515871167183 2023-01-22 19:30:59.228563: step: 640/530, loss: 0.0015880591236054897 2023-01-22 19:31:00.321239: step: 644/530, loss: 0.001628233352676034 2023-01-22 19:31:01.417238: step: 648/530, loss: 0.008483968675136566 2023-01-22 19:31:02.506008: step: 652/530, loss: 0.0010150448651984334 2023-01-22 19:31:03.589198: step: 656/530, loss: 0.0006647915579378605 2023-01-22 19:31:04.676920: step: 660/530, loss: 0.004456573165953159 2023-01-22 19:31:05.755673: step: 664/530, loss: 0.0014632751699537039 2023-01-22 19:31:06.837585: step: 668/530, loss: 0.00010278318222844973 2023-01-22 19:31:07.921817: step: 672/530, loss: 0.0002867642615456134 2023-01-22 19:31:09.001039: step: 676/530, loss: 0.0008807194535620511 2023-01-22 19:31:10.093216: step: 680/530, loss: 0.006089372094720602 2023-01-22 19:31:11.175679: step: 684/530, loss: 0.012407553382217884 2023-01-22 19:31:12.280463: step: 688/530, loss: 0.0006447809282690287 2023-01-22 19:31:13.355553: step: 692/530, loss: 0.0009658485651016235 2023-01-22 19:31:14.413836: step: 696/530, loss: 0.00035205602762289345 2023-01-22 19:31:15.512919: step: 700/530, loss: 0.001657846150919795 2023-01-22 19:31:16.621535: step: 704/530, loss: 3.839066994260065e-05 2023-01-22 19:31:17.722151: step: 708/530, loss: 0.002620797138661146 2023-01-22 19:31:18.803133: step: 712/530, loss: 0.01476196013391018 2023-01-22 19:31:19.886651: step: 716/530, loss: 0.014402851462364197 2023-01-22 19:31:20.985324: step: 720/530, loss: 0.00914725847542286 2023-01-22 19:31:22.114671: step: 724/530, loss: 0.0015775400679558516 2023-01-22 19:31:23.194659: step: 728/530, loss: 0.011741344816982746 2023-01-22 19:31:24.293605: step: 732/530, loss: 0.008535072207450867 2023-01-22 19:31:25.362241: step: 736/530, loss: 0.00040210349834524095 2023-01-22 19:31:26.478192: step: 740/530, loss: 0.01881117932498455 2023-01-22 19:31:27.567343: step: 744/530, loss: 0.0036962665617465973 2023-01-22 19:31:28.673250: step: 748/530, loss: 0.0022431055549532175 2023-01-22 19:31:29.782841: step: 752/530, loss: 0.002346399240195751 2023-01-22 19:31:30.884006: step: 756/530, loss: 3.1254390364665596e-07 2023-01-22 19:31:31.972200: step: 760/530, loss: 0.000602013140451163 2023-01-22 19:31:33.049205: step: 764/530, loss: 0.008635367266833782 2023-01-22 19:31:34.137448: step: 768/530, loss: 0.0007458119071088731 2023-01-22 19:31:35.228943: step: 772/530, loss: 0.019908368587493896 2023-01-22 19:31:36.335077: step: 776/530, loss: 0.005076912697404623 2023-01-22 19:31:37.412079: step: 780/530, loss: 0.005201888270676136 2023-01-22 19:31:38.516693: step: 784/530, loss: 0.023236414417624474 2023-01-22 19:31:39.616320: step: 788/530, loss: 0.005887606181204319 2023-01-22 19:31:40.726714: step: 792/530, loss: 0.00021235259191598743 2023-01-22 19:31:41.843504: step: 796/530, loss: 0.00024718864005990326 2023-01-22 19:31:42.957672: step: 800/530, loss: 0.0196321252733469 2023-01-22 19:31:44.042107: step: 804/530, loss: 0.0012177644530311227 2023-01-22 19:31:45.133765: step: 808/530, loss: 0.0032924406696110964 2023-01-22 19:31:46.203922: step: 812/530, loss: 0.00010472331632627174 2023-01-22 19:31:47.313478: step: 816/530, loss: 0.003384908428415656 2023-01-22 19:31:48.398901: step: 820/530, loss: 0.006923796609044075 2023-01-22 19:31:49.504216: step: 824/530, loss: 0.0029404230881482363 2023-01-22 19:31:50.595404: step: 828/530, loss: 0.003901845309883356 2023-01-22 19:31:51.695514: step: 832/530, loss: 0.0022908365353941917 2023-01-22 19:31:52.789474: step: 836/530, loss: 0.004797129426151514 2023-01-22 19:31:53.878007: step: 840/530, loss: 0.004384325817227364 2023-01-22 19:31:54.964584: step: 844/530, loss: 0.00028739136178046465 2023-01-22 19:31:56.067542: step: 848/530, loss: 0.00015839732077438384 2023-01-22 19:31:57.164427: step: 852/530, loss: 0.003454955294728279 2023-01-22 19:31:58.278502: step: 856/530, loss: 0.01841742917895317 2023-01-22 19:31:59.365868: step: 860/530, loss: 0.0020822861697524786 2023-01-22 19:32:00.465234: step: 864/530, loss: 0.007027497049421072 2023-01-22 19:32:01.569439: step: 868/530, loss: 0.0006082684849388897 2023-01-22 19:32:02.654618: step: 872/530, loss: 0.0018352603074163198 2023-01-22 19:32:03.759343: step: 876/530, loss: 0.004127270542085171 2023-01-22 19:32:04.853905: step: 880/530, loss: 0.001196317607536912 2023-01-22 19:32:05.945231: step: 884/530, loss: 0.005441926419734955 2023-01-22 19:32:07.019842: step: 888/530, loss: 0.005609191954135895 2023-01-22 19:32:08.102694: step: 892/530, loss: 0.0005249209934845567 2023-01-22 19:32:09.199311: step: 896/530, loss: 0.0036400395911186934 2023-01-22 19:32:10.313099: step: 900/530, loss: 0.008705930784344673 2023-01-22 19:32:11.404823: step: 904/530, loss: 9.220934771292377e-06 2023-01-22 19:32:12.525168: step: 908/530, loss: 9.59230019361712e-05 2023-01-22 19:32:13.620607: step: 912/530, loss: 0.000316394871333614 2023-01-22 19:32:14.715204: step: 916/530, loss: 0.007739558815956116 2023-01-22 19:32:15.812639: step: 920/530, loss: 0.0030269413255155087 2023-01-22 19:32:16.901679: step: 924/530, loss: 0.0014082634588703513 2023-01-22 19:32:18.003594: step: 928/530, loss: 0.0033085395116358995 2023-01-22 19:32:19.069164: step: 932/530, loss: 4.4718261051457375e-05 2023-01-22 19:32:20.155054: step: 936/530, loss: 0.0029728920198976994 2023-01-22 19:32:21.248054: step: 940/530, loss: 0.00013389321975409985 2023-01-22 19:32:22.347216: step: 944/530, loss: 0.0038787336088716984 2023-01-22 19:32:23.448931: step: 948/530, loss: 0.024764133617281914 2023-01-22 19:32:24.555327: step: 952/530, loss: 0.002442519413307309 2023-01-22 19:32:25.627398: step: 956/530, loss: 0.00785348005592823 2023-01-22 19:32:26.726461: step: 960/530, loss: 0.00306137977167964 2023-01-22 19:32:27.818456: step: 964/530, loss: 0.0036833484191447496 2023-01-22 19:32:28.913504: step: 968/530, loss: 0.0027110674418509007 2023-01-22 19:32:30.007774: step: 972/530, loss: 0.0007943974924273789 2023-01-22 19:32:31.097405: step: 976/530, loss: 0.00847509317100048 2023-01-22 19:32:32.188057: step: 980/530, loss: 0.000861790613271296 2023-01-22 19:32:33.282381: step: 984/530, loss: 0.008168418891727924 2023-01-22 19:32:34.356840: step: 988/530, loss: 0.0033762722741812468 2023-01-22 19:32:35.429526: step: 992/530, loss: 0.0015345296123996377 2023-01-22 19:32:36.510579: step: 996/530, loss: 0.0008810081635601819 2023-01-22 19:32:37.590207: step: 1000/530, loss: 0.0014387140981853008 2023-01-22 19:32:38.668426: step: 1004/530, loss: 0.003929978236556053 2023-01-22 19:32:39.747053: step: 1008/530, loss: 0.0015910568181425333 2023-01-22 19:32:40.829675: step: 1012/530, loss: 5.263879575068131e-05 2023-01-22 19:32:41.923958: step: 1016/530, loss: 0.0036562897730618715 2023-01-22 19:32:43.019584: step: 1020/530, loss: 0.004044460132718086 2023-01-22 19:32:44.116520: step: 1024/530, loss: 0.0004481390060391277 2023-01-22 19:32:45.245857: step: 1028/530, loss: 0.005939308553934097 2023-01-22 19:32:46.332253: step: 1032/530, loss: 0.0025205567944794893 2023-01-22 19:32:47.457687: step: 1036/530, loss: 0.0003851708024740219 2023-01-22 19:32:48.558157: step: 1040/530, loss: 0.00394230242818594 2023-01-22 19:32:49.628749: step: 1044/530, loss: 0.000790725345723331 2023-01-22 19:32:50.715317: step: 1048/530, loss: 0.0006547352531924844 2023-01-22 19:32:51.809404: step: 1052/530, loss: 0.0002145062608178705 2023-01-22 19:32:52.901803: step: 1056/530, loss: 0.0035680169239640236 2023-01-22 19:32:53.982554: step: 1060/530, loss: 0.005521649960428476 2023-01-22 19:32:55.059810: step: 1064/530, loss: 0.006090599112212658 2023-01-22 19:32:56.148656: step: 1068/530, loss: 0.003495714860036969 2023-01-22 19:32:57.258479: step: 1072/530, loss: 0.0023991423659026623 2023-01-22 19:32:58.359459: step: 1076/530, loss: 0.011029968038201332 2023-01-22 19:32:59.447462: step: 1080/530, loss: 0.01628875732421875 2023-01-22 19:33:00.524605: step: 1084/530, loss: 0.0026841729413717985 2023-01-22 19:33:01.601941: step: 1088/530, loss: 0.004322941415011883 2023-01-22 19:33:02.692430: step: 1092/530, loss: 0.0005825699190609157 2023-01-22 19:33:03.780211: step: 1096/530, loss: 0.004924403969198465 2023-01-22 19:33:04.855992: step: 1100/530, loss: 0.0009734384948387742 2023-01-22 19:33:05.934536: step: 1104/530, loss: 0.003486888948827982 2023-01-22 19:33:07.000202: step: 1108/530, loss: 0.0007589052547700703 2023-01-22 19:33:08.083829: step: 1112/530, loss: 0.0017122741555795074 2023-01-22 19:33:09.153607: step: 1116/530, loss: 0.005499228835105896 2023-01-22 19:33:10.234329: step: 1120/530, loss: 0.0005945372977294028 2023-01-22 19:33:11.330646: step: 1124/530, loss: 0.01989840343594551 2023-01-22 19:33:12.419088: step: 1128/530, loss: 0.0009664539247751236 2023-01-22 19:33:13.489374: step: 1132/530, loss: 3.013615810232295e-07 2023-01-22 19:33:14.576960: step: 1136/530, loss: 0.025590527802705765 2023-01-22 19:33:15.678505: step: 1140/530, loss: 0.01024713832885027 2023-01-22 19:33:16.765655: step: 1144/530, loss: 0.004431177396327257 2023-01-22 19:33:17.852915: step: 1148/530, loss: 0.006881935056298971 2023-01-22 19:33:18.901494: step: 1152/530, loss: 0.0009120499598793685 2023-01-22 19:33:20.014692: step: 1156/530, loss: 0.007891872897744179 2023-01-22 19:33:21.106597: step: 1160/530, loss: 0.006422643084079027 2023-01-22 19:33:22.183753: step: 1164/530, loss: 0.0015579741448163986 2023-01-22 19:33:23.267946: step: 1168/530, loss: 0.0005016556242480874 2023-01-22 19:33:24.336630: step: 1172/530, loss: 0.002956017618998885 2023-01-22 19:33:25.434636: step: 1176/530, loss: 0.0021321908570826054 2023-01-22 19:33:26.519492: step: 1180/530, loss: 0.000456401874544099 2023-01-22 19:33:27.607853: step: 1184/530, loss: 0.0027978145517408848 2023-01-22 19:33:28.727003: step: 1188/530, loss: 0.006141733843833208 2023-01-22 19:33:29.802298: step: 1192/530, loss: 0.00030454795341938734 2023-01-22 19:33:30.876077: step: 1196/530, loss: 0.0036493183579295874 2023-01-22 19:33:31.959072: step: 1200/530, loss: 0.005128855351358652 2023-01-22 19:33:33.040621: step: 1204/530, loss: 5.0108679715776816e-05 2023-01-22 19:33:34.188412: step: 1208/530, loss: 0.007080928888171911 2023-01-22 19:33:35.269305: step: 1212/530, loss: 0.0006423405138775706 2023-01-22 19:33:36.357228: step: 1216/530, loss: 0.006253702566027641 2023-01-22 19:33:37.452466: step: 1220/530, loss: 0.0038436076138168573 2023-01-22 19:33:38.550716: step: 1224/530, loss: 0.0012389343464747071 2023-01-22 19:33:39.653320: step: 1228/530, loss: 0.0011327725369483232 2023-01-22 19:33:40.740331: step: 1232/530, loss: 0.005476536229252815 2023-01-22 19:33:41.832443: step: 1236/530, loss: 0.0015993707347661257 2023-01-22 19:33:42.925490: step: 1240/530, loss: 0.0023863338865339756 2023-01-22 19:33:44.003336: step: 1244/530, loss: 0.00957927294075489 2023-01-22 19:33:45.089485: step: 1248/530, loss: 0.022871652618050575 2023-01-22 19:33:46.202079: step: 1252/530, loss: 0.0021960516460239887 2023-01-22 19:33:47.281223: step: 1256/530, loss: 0.00020496989600360394 2023-01-22 19:33:48.372589: step: 1260/530, loss: 0.000734953791834414 2023-01-22 19:33:49.508535: step: 1264/530, loss: 0.003913666121661663 2023-01-22 19:33:50.639294: step: 1268/530, loss: 0.017393719404935837 2023-01-22 19:33:51.765803: step: 1272/530, loss: 0.0032708507496863604 2023-01-22 19:33:52.862267: step: 1276/530, loss: 0.01114897895604372 2023-01-22 19:33:53.988768: step: 1280/530, loss: 0.002834647661074996 2023-01-22 19:33:55.105387: step: 1284/530, loss: 0.00044656184036284685 2023-01-22 19:33:56.173932: step: 1288/530, loss: 0.011877741664648056 2023-01-22 19:33:57.259976: step: 1292/530, loss: 0.0023644077591598034 2023-01-22 19:33:58.346307: step: 1296/530, loss: 0.015803668648004532 2023-01-22 19:33:59.437086: step: 1300/530, loss: 0.0004333755059633404 2023-01-22 19:34:00.545991: step: 1304/530, loss: 0.008682974614202976 2023-01-22 19:34:01.664528: step: 1308/530, loss: 0.0015222133370116353 2023-01-22 19:34:02.758513: step: 1312/530, loss: 0.0018281691009178758 2023-01-22 19:34:03.864722: step: 1316/530, loss: 0.0005714896251447499 2023-01-22 19:34:04.952693: step: 1320/530, loss: 0.05201597511768341 2023-01-22 19:34:06.065806: step: 1324/530, loss: 8.254409476649016e-05 2023-01-22 19:34:07.152417: step: 1328/530, loss: 0.003138340078294277 2023-01-22 19:34:08.235039: step: 1332/530, loss: 0.0019122665980830789 2023-01-22 19:34:09.309673: step: 1336/530, loss: 0.00042591485544107854 2023-01-22 19:34:10.405149: step: 1340/530, loss: 0.00829241331666708 2023-01-22 19:34:11.507428: step: 1344/530, loss: 0.003200522856786847 2023-01-22 19:34:12.626358: step: 1348/530, loss: 0.0108566889539361 2023-01-22 19:34:13.736391: step: 1352/530, loss: 0.007357567548751831 2023-01-22 19:34:14.809351: step: 1356/530, loss: 0.005130159668624401 2023-01-22 19:34:15.909577: step: 1360/530, loss: 0.002784601878374815 2023-01-22 19:34:17.023598: step: 1364/530, loss: 0.0018567726947367191 2023-01-22 19:34:18.134507: step: 1368/530, loss: 0.001946165575645864 2023-01-22 19:34:19.221360: step: 1372/530, loss: 0.0021874376107007265 2023-01-22 19:34:20.311113: step: 1376/530, loss: 0.007368598598986864 2023-01-22 19:34:21.387306: step: 1380/530, loss: 0.007469009142369032 2023-01-22 19:34:22.487353: step: 1384/530, loss: 0.003102353308349848 2023-01-22 19:34:23.580665: step: 1388/530, loss: 0.0004759367147926241 2023-01-22 19:34:24.675228: step: 1392/530, loss: 0.0029485838022083044 2023-01-22 19:34:25.766632: step: 1396/530, loss: 0.003538076998665929 2023-01-22 19:34:26.874556: step: 1400/530, loss: 0.00025586719857528806 2023-01-22 19:34:27.969575: step: 1404/530, loss: 0.005292871966958046 2023-01-22 19:34:29.050557: step: 1408/530, loss: 0.0009659806964918971 2023-01-22 19:34:30.140550: step: 1412/530, loss: 0.007447524461895227 2023-01-22 19:34:31.245331: step: 1416/530, loss: 0.001783325569704175 2023-01-22 19:34:32.328628: step: 1420/530, loss: 0.00785510428249836 2023-01-22 19:34:33.430951: step: 1424/530, loss: 0.003746903734281659 2023-01-22 19:34:34.524481: step: 1428/530, loss: 0.0013054126175120473 2023-01-22 19:34:35.618013: step: 1432/530, loss: 0.008335101418197155 2023-01-22 19:34:36.713285: step: 1436/530, loss: 0.03604024276137352 2023-01-22 19:34:37.809224: step: 1440/530, loss: 0.003660415532067418 2023-01-22 19:34:38.912192: step: 1444/530, loss: 0.0074257622472941875 2023-01-22 19:34:39.985991: step: 1448/530, loss: 0.007867055013775826 2023-01-22 19:34:41.070619: step: 1452/530, loss: 0.015310634858906269 2023-01-22 19:34:42.151250: step: 1456/530, loss: 0.013803989626467228 2023-01-22 19:34:43.241588: step: 1460/530, loss: 0.006369090173393488 2023-01-22 19:34:44.338698: step: 1464/530, loss: 0.0008969185873866081 2023-01-22 19:34:45.433142: step: 1468/530, loss: 0.004128504544496536 2023-01-22 19:34:46.513278: step: 1472/530, loss: 0.008057482540607452 2023-01-22 19:34:47.596658: step: 1476/530, loss: 0.0013072536094114184 2023-01-22 19:34:48.663018: step: 1480/530, loss: 0.014017199166119099 2023-01-22 19:34:49.765339: step: 1484/530, loss: 0.05971527844667435 2023-01-22 19:34:50.857292: step: 1488/530, loss: 0.005062997341156006 2023-01-22 19:34:51.956367: step: 1492/530, loss: 0.0024659796617925167 2023-01-22 19:34:53.026789: step: 1496/530, loss: 9.569990879754187e-07 2023-01-22 19:34:54.115288: step: 1500/530, loss: 0.006207902915775776 2023-01-22 19:34:55.233337: step: 1504/530, loss: 0.002065556589514017 2023-01-22 19:34:56.340640: step: 1508/530, loss: 0.001768824178725481 2023-01-22 19:34:57.442095: step: 1512/530, loss: 0.002064608968794346 2023-01-22 19:34:58.536293: step: 1516/530, loss: 0.0009590198751538992 2023-01-22 19:34:59.609661: step: 1520/530, loss: 0.0027619139291346073 2023-01-22 19:35:00.714110: step: 1524/530, loss: 0.005965469870716333 2023-01-22 19:35:01.798253: step: 1528/530, loss: 0.0005408466677181423 2023-01-22 19:35:02.907241: step: 1532/530, loss: 0.004232795909047127 2023-01-22 19:35:04.007467: step: 1536/530, loss: 0.029255446046590805 2023-01-22 19:35:05.092015: step: 1540/530, loss: 0.001512959599494934 2023-01-22 19:35:06.184898: step: 1544/530, loss: 0.004193993750959635 2023-01-22 19:35:07.276926: step: 1548/530, loss: 0.01655593328177929 2023-01-22 19:35:08.357634: step: 1552/530, loss: 0.004010556731373072 2023-01-22 19:35:09.457646: step: 1556/530, loss: 0.00477555999532342 2023-01-22 19:35:10.553992: step: 1560/530, loss: 0.0030332282185554504 2023-01-22 19:35:11.632880: step: 1564/530, loss: 0.004279244691133499 2023-01-22 19:35:12.698468: step: 1568/530, loss: 0.002007303759455681 2023-01-22 19:35:13.790116: step: 1572/530, loss: 0.0029593987856060266 2023-01-22 19:35:14.895899: step: 1576/530, loss: 0.0020100378897041082 2023-01-22 19:35:15.988442: step: 1580/530, loss: 0.009585062973201275 2023-01-22 19:35:17.112272: step: 1584/530, loss: 0.010612668469548225 2023-01-22 19:35:18.191746: step: 1588/530, loss: 0.003532403614372015 2023-01-22 19:35:19.314372: step: 1592/530, loss: 0.004616458900272846 2023-01-22 19:35:20.399722: step: 1596/530, loss: 0.00012834652443416417 2023-01-22 19:35:21.469268: step: 1600/530, loss: 0.008451024070382118 2023-01-22 19:35:22.561644: step: 1604/530, loss: 0.003901928663253784 2023-01-22 19:35:23.667467: step: 1608/530, loss: 0.0076681217178702354 2023-01-22 19:35:24.737803: step: 1612/530, loss: 0.0027105221524834633 2023-01-22 19:35:25.833894: step: 1616/530, loss: 0.0029793232679367065 2023-01-22 19:35:26.902677: step: 1620/530, loss: 0.002083100378513336 2023-01-22 19:35:28.003684: step: 1624/530, loss: 0.0014758487232029438 2023-01-22 19:35:29.089354: step: 1628/530, loss: 0.018433067947626114 2023-01-22 19:35:30.202879: step: 1632/530, loss: 0.0008275517611764371 2023-01-22 19:35:31.290568: step: 1636/530, loss: 0.004098664037883282 2023-01-22 19:35:32.380292: step: 1640/530, loss: 4.538245775620453e-06 2023-01-22 19:35:33.506487: step: 1644/530, loss: 0.004451615270227194 2023-01-22 19:35:34.591445: step: 1648/530, loss: 0.009558179415762424 2023-01-22 19:35:35.651066: step: 1652/530, loss: 0.0010312829399481416 2023-01-22 19:35:36.728542: step: 1656/530, loss: 0.00029791021370328963 2023-01-22 19:35:37.795615: step: 1660/530, loss: 0.0012415312230587006 2023-01-22 19:35:38.868119: step: 1664/530, loss: 0.00031093659345060587 2023-01-22 19:35:39.975191: step: 1668/530, loss: 0.006347445771098137 2023-01-22 19:35:41.061447: step: 1672/530, loss: 0.010725405067205429 2023-01-22 19:35:42.144195: step: 1676/530, loss: 0.0025757949333637953 2023-01-22 19:35:43.236533: step: 1680/530, loss: 1.4211590496415738e-05 2023-01-22 19:35:44.331613: step: 1684/530, loss: 0.004520696122199297 2023-01-22 19:35:45.437876: step: 1688/530, loss: 0.008326796814799309 2023-01-22 19:35:46.534873: step: 1692/530, loss: 9.182773646898568e-05 2023-01-22 19:35:47.611850: step: 1696/530, loss: 0.002773266052827239 2023-01-22 19:35:48.683701: step: 1700/530, loss: 0.001968016382306814 2023-01-22 19:35:49.799209: step: 1704/530, loss: 0.004385901615023613 2023-01-22 19:35:50.889142: step: 1708/530, loss: 0.011045076884329319 2023-01-22 19:35:51.980343: step: 1712/530, loss: 0.0030012561473995447 2023-01-22 19:35:53.072810: step: 1716/530, loss: 0.002662105718627572 2023-01-22 19:35:54.150366: step: 1720/530, loss: 0.004749532323330641 2023-01-22 19:35:55.247639: step: 1724/530, loss: 0.0022050482220947742 2023-01-22 19:35:56.343749: step: 1728/530, loss: 0.007212100084871054 2023-01-22 19:35:57.426342: step: 1732/530, loss: 0.013577912002801895 2023-01-22 19:35:58.527577: step: 1736/530, loss: 0.008280695416033268 2023-01-22 19:35:59.614899: step: 1740/530, loss: 0.002290676813572645 2023-01-22 19:36:00.707194: step: 1744/530, loss: 0.001719155116006732 2023-01-22 19:36:01.796731: step: 1748/530, loss: 0.006506065838038921 2023-01-22 19:36:02.928015: step: 1752/530, loss: 0.0069944956339895725 2023-01-22 19:36:04.018948: step: 1756/530, loss: 0.0027302296366542578 2023-01-22 19:36:05.111085: step: 1760/530, loss: 0.004053385928273201 2023-01-22 19:36:06.213203: step: 1764/530, loss: 0.0018323834519833326 2023-01-22 19:36:07.316413: step: 1768/530, loss: 0.00046504868078045547 2023-01-22 19:36:08.404430: step: 1772/530, loss: 0.0003045002813450992 2023-01-22 19:36:09.502913: step: 1776/530, loss: 0.0041580963879823685 2023-01-22 19:36:10.622124: step: 1780/530, loss: 0.0015695146284997463 2023-01-22 19:36:11.713037: step: 1784/530, loss: 0.0016330681974068284 2023-01-22 19:36:12.825547: step: 1788/530, loss: 0.0005462969420477748 2023-01-22 19:36:13.918306: step: 1792/530, loss: 0.0029472154565155506 2023-01-22 19:36:14.988318: step: 1796/530, loss: 0.005171945318579674 2023-01-22 19:36:16.098210: step: 1800/530, loss: 0.008737027645111084 2023-01-22 19:36:17.196463: step: 1804/530, loss: 0.004143659025430679 2023-01-22 19:36:18.295540: step: 1808/530, loss: 0.004884339869022369 2023-01-22 19:36:19.391309: step: 1812/530, loss: 0.007590312045067549 2023-01-22 19:36:20.503195: step: 1816/530, loss: 0.0003040601732209325 2023-01-22 19:36:21.610835: step: 1820/530, loss: 0.0021880995482206345 2023-01-22 19:36:22.706121: step: 1824/530, loss: 0.05034518241882324 2023-01-22 19:36:23.784836: step: 1828/530, loss: 0.0027692888397723436 2023-01-22 19:36:24.882901: step: 1832/530, loss: 0.007986345328390598 2023-01-22 19:36:25.970641: step: 1836/530, loss: 0.005478563718497753 2023-01-22 19:36:27.071982: step: 1840/530, loss: 0.008761007338762283 2023-01-22 19:36:28.151650: step: 1844/530, loss: 0.0007668921607546508 2023-01-22 19:36:29.261159: step: 1848/530, loss: 1.3191502148401923e-05 2023-01-22 19:36:30.343236: step: 1852/530, loss: 0.0008549068588763475 2023-01-22 19:36:31.442229: step: 1856/530, loss: 0.00013868896348867565 2023-01-22 19:36:32.533690: step: 1860/530, loss: 0.012111968360841274 2023-01-22 19:36:33.626460: step: 1864/530, loss: 0.002229460049420595 2023-01-22 19:36:34.738437: step: 1868/530, loss: 0.005779405124485493 2023-01-22 19:36:35.807216: step: 1872/530, loss: 0.0007654499495401978 2023-01-22 19:36:36.880835: step: 1876/530, loss: 0.0004401237238198519 2023-01-22 19:36:37.977480: step: 1880/530, loss: 0.01065981574356556 2023-01-22 19:36:39.058216: step: 1884/530, loss: 0.012769266963005066 2023-01-22 19:36:40.154792: step: 1888/530, loss: 0.001921915914863348 2023-01-22 19:36:41.248290: step: 1892/530, loss: 0.01803373172879219 2023-01-22 19:36:42.375581: step: 1896/530, loss: 0.011836661025881767 2023-01-22 19:36:43.473359: step: 1900/530, loss: 0.013509376905858517 2023-01-22 19:36:44.538214: step: 1904/530, loss: 0.013414420187473297 2023-01-22 19:36:45.660822: step: 1908/530, loss: 0.00331012811511755 2023-01-22 19:36:46.731435: step: 1912/530, loss: 0.0012118967715650797 2023-01-22 19:36:47.820062: step: 1916/530, loss: 0.0028175697661936283 2023-01-22 19:36:48.901808: step: 1920/530, loss: 0.0021286497358232737 2023-01-22 19:36:50.005713: step: 1924/530, loss: 0.00033343781251460314 2023-01-22 19:36:51.109440: step: 1928/530, loss: 0.006572900805622339 2023-01-22 19:36:52.201915: step: 1932/530, loss: 0.003769731381908059 2023-01-22 19:36:53.299247: step: 1936/530, loss: 0.010479830205440521 2023-01-22 19:36:54.409497: step: 1940/530, loss: 0.004546172916889191 2023-01-22 19:36:55.484967: step: 1944/530, loss: 0.0014573668595403433 2023-01-22 19:36:56.559426: step: 1948/530, loss: 0.001883357996121049 2023-01-22 19:36:57.639851: step: 1952/530, loss: 0.023197341710329056 2023-01-22 19:36:58.735374: step: 1956/530, loss: 0.0 2023-01-22 19:36:59.826409: step: 1960/530, loss: 0.004750645253807306 2023-01-22 19:37:00.916526: step: 1964/530, loss: 0.0015845161397010088 2023-01-22 19:37:01.991519: step: 1968/530, loss: 0.014294756576418877 2023-01-22 19:37:03.113784: step: 1972/530, loss: 0.0022179039660841227 2023-01-22 19:37:04.213981: step: 1976/530, loss: 0.0037082417402416468 2023-01-22 19:37:05.287403: step: 1980/530, loss: 0.005503215827047825 2023-01-22 19:37:06.402175: step: 1984/530, loss: 0.0035996742080897093 2023-01-22 19:37:07.501726: step: 1988/530, loss: 0.009086393751204014 2023-01-22 19:37:08.608982: step: 1992/530, loss: 0.0027807424776256084 2023-01-22 19:37:09.691469: step: 1996/530, loss: 0.0007474375306628644 2023-01-22 19:37:10.805894: step: 2000/530, loss: 0.00048265905934385955 2023-01-22 19:37:11.902720: step: 2004/530, loss: 0.0018520974554121494 2023-01-22 19:37:12.992509: step: 2008/530, loss: 0.0010032663121819496 2023-01-22 19:37:14.099874: step: 2012/530, loss: 0.005230959039181471 2023-01-22 19:37:15.183995: step: 2016/530, loss: 0.003999687731266022 2023-01-22 19:37:16.279380: step: 2020/530, loss: 0.00028858802397735417 2023-01-22 19:37:17.381410: step: 2024/530, loss: 0.003560730954632163 2023-01-22 19:37:18.466136: step: 2028/530, loss: 0.010231171734631062 2023-01-22 19:37:19.548281: step: 2032/530, loss: 0.0019173513865098357 2023-01-22 19:37:20.628814: step: 2036/530, loss: 0.007335932459682226 2023-01-22 19:37:21.716780: step: 2040/530, loss: 0.010403071530163288 2023-01-22 19:37:22.821203: step: 2044/530, loss: 0.00016546566621400416 2023-01-22 19:37:23.891595: step: 2048/530, loss: 0.003771527437493205 2023-01-22 19:37:24.999970: step: 2052/530, loss: 0.006769419647753239 2023-01-22 19:37:26.107003: step: 2056/530, loss: 0.04177527502179146 2023-01-22 19:37:27.198389: step: 2060/530, loss: 0.002998405834659934 2023-01-22 19:37:28.302691: step: 2064/530, loss: 0.0029434487223625183 2023-01-22 19:37:29.382790: step: 2068/530, loss: 0.0033542837481945753 2023-01-22 19:37:30.481176: step: 2072/530, loss: 0.010070827789604664 2023-01-22 19:37:31.583351: step: 2076/530, loss: 0.004673119634389877 2023-01-22 19:37:32.678257: step: 2080/530, loss: 0.009197418577969074 2023-01-22 19:37:33.768280: step: 2084/530, loss: 0.0038647225592285395 2023-01-22 19:37:34.848196: step: 2088/530, loss: 0.003918979782611132 2023-01-22 19:37:35.922088: step: 2092/530, loss: 0.004716282710433006 2023-01-22 19:37:37.021985: step: 2096/530, loss: 0.003306119702756405 2023-01-22 19:37:38.113914: step: 2100/530, loss: 0.003941201604902744 2023-01-22 19:37:39.215889: step: 2104/530, loss: 0.0023030757438391447 2023-01-22 19:37:40.298784: step: 2108/530, loss: 0.01321802195161581 2023-01-22 19:37:41.378758: step: 2112/530, loss: 0.006373906508088112 2023-01-22 19:37:42.487740: step: 2116/530, loss: 0.007655682973563671 2023-01-22 19:37:43.572339: step: 2120/530, loss: 0.005693155340850353 ================================================== Loss: 0.005 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33431780630401625, 'r': 0.35652107617240447, 'f1': 0.3450626393808212}, 'combined': 0.25425668164902615, 'stategy': 1, 'epoch': 12} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3320406844664242, 'r': 0.28606076772527744, 'f1': 0.3073405272797614}, 'combined': 0.1908746432579571, 'stategy': 1, 'epoch': 12} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34638200115102286, 'r': 0.3417811017049941, 'f1': 0.3440661711528785}, 'combined': 0.253522441902121, 'stategy': 1, 'epoch': 12} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.321830882164218, 'r': 0.28808798057232177, 'f1': 0.304026042127993}, 'combined': 0.188816173532122, 'stategy': 1, 'epoch': 12} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33636339248712327, 'r': 0.32423643905779626, 'f1': 0.3301886055719007}, 'combined': 0.24329686726350577, 'stategy': 1, 'epoch': 12} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3465216520279545, 'r': 0.2948683751708754, 'f1': 0.3186151083179699}, 'combined': 0.1978767514816866, 'stategy': 1, 'epoch': 12} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3138888888888889, 'r': 0.4035714285714286, 'f1': 0.35312499999999997}, 'combined': 0.23541666666666664, 'stategy': 1, 'epoch': 12} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.35294117647058826, 'r': 0.5217391304347826, 'f1': 0.4210526315789474}, 'combined': 0.2105263157894737, 'stategy': 1, 'epoch': 12} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 12} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 13 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 19:40:16.922995: step: 4/530, loss: 0.0009382517891936004 2023-01-22 19:40:18.005681: step: 8/530, loss: 0.0007458329200744629 2023-01-22 19:40:19.086513: step: 12/530, loss: 0.020100224763154984 2023-01-22 19:40:20.174062: step: 16/530, loss: 0.00603818753734231 2023-01-22 19:40:21.241994: step: 20/530, loss: 0.0023992632050067186 2023-01-22 19:40:22.335542: step: 24/530, loss: 8.95670018508099e-05 2023-01-22 19:40:23.405950: step: 28/530, loss: 0.00046150924754329026 2023-01-22 19:40:24.482291: step: 32/530, loss: 0.0008870534948073328 2023-01-22 19:40:25.558631: step: 36/530, loss: 0.005683777388185263 2023-01-22 19:40:26.664251: step: 40/530, loss: 0.0015970487147569656 2023-01-22 19:40:27.752228: step: 44/530, loss: 0.001628810539841652 2023-01-22 19:40:28.851048: step: 48/530, loss: 0.004171023610979319 2023-01-22 19:40:29.948085: step: 52/530, loss: 5.571292422246188e-05 2023-01-22 19:40:31.045367: step: 56/530, loss: 5.181822780286893e-05 2023-01-22 19:40:32.147374: step: 60/530, loss: 2.9268907383084297e-05 2023-01-22 19:40:33.224341: step: 64/530, loss: 0.0008482362609356642 2023-01-22 19:40:34.307233: step: 68/530, loss: 0.00347668188624084 2023-01-22 19:40:35.387927: step: 72/530, loss: 7.646776793990284e-05 2023-01-22 19:40:36.459418: step: 76/530, loss: 0.000637854915112257 2023-01-22 19:40:37.543437: step: 80/530, loss: 0.0012868506601080298 2023-01-22 19:40:38.650547: step: 84/530, loss: 0.0014965353766456246 2023-01-22 19:40:39.718933: step: 88/530, loss: 0.00263797864317894 2023-01-22 19:40:40.808295: step: 92/530, loss: 0.0011093398788943887 2023-01-22 19:40:41.943973: step: 96/530, loss: 0.005608233157545328 2023-01-22 19:40:43.030093: step: 100/530, loss: 0.00014191395894158632 2023-01-22 19:40:44.122196: step: 104/530, loss: 0.0009764271671883762 2023-01-22 19:40:45.211409: step: 108/530, loss: 0.004163474775850773 2023-01-22 19:40:46.275592: step: 112/530, loss: 0.00037535608862526715 2023-01-22 19:40:47.399418: step: 116/530, loss: 0.0032862084917724133 2023-01-22 19:40:48.498667: step: 120/530, loss: 0.009096729569137096 2023-01-22 19:40:49.617638: step: 124/530, loss: 0.0022512138821184635 2023-01-22 19:40:50.702134: step: 128/530, loss: 0.002169341314584017 2023-01-22 19:40:51.842126: step: 132/530, loss: 0.005965308286249638 2023-01-22 19:40:52.933759: step: 136/530, loss: 0.011858509853482246 2023-01-22 19:40:54.014162: step: 140/530, loss: 0.0008963411673903465 2023-01-22 19:40:55.102444: step: 144/530, loss: 0.02409239299595356 2023-01-22 19:40:56.202522: step: 148/530, loss: 0.0042005423456430435 2023-01-22 19:40:57.294359: step: 152/530, loss: 0.020239807665348053 2023-01-22 19:40:58.377833: step: 156/530, loss: 0.003998726140707731 2023-01-22 19:40:59.485024: step: 160/530, loss: 0.005496561992913485 2023-01-22 19:41:00.561466: step: 164/530, loss: 0.005694527644664049 2023-01-22 19:41:01.653863: step: 168/530, loss: 0.001840868266299367 2023-01-22 19:41:02.729321: step: 172/530, loss: 0.002671318594366312 2023-01-22 19:41:03.817489: step: 176/530, loss: 0.0020116078667342663 2023-01-22 19:41:04.887082: step: 180/530, loss: 0.0010723109589889646 2023-01-22 19:41:05.974542: step: 184/530, loss: 0.008998713456094265 2023-01-22 19:41:07.065405: step: 188/530, loss: 0.002764201257377863 2023-01-22 19:41:08.159903: step: 192/530, loss: 0.00342775066383183 2023-01-22 19:41:09.235981: step: 196/530, loss: 0.006084446795284748 2023-01-22 19:41:10.319857: step: 200/530, loss: 0.0020574626978486776 2023-01-22 19:41:11.408976: step: 204/530, loss: 0.0004493702726904303 2023-01-22 19:41:12.513846: step: 208/530, loss: 0.009899861179292202 2023-01-22 19:41:13.604238: step: 212/530, loss: 0.0011038478696718812 2023-01-22 19:41:14.694862: step: 216/530, loss: 0.00041425848030485213 2023-01-22 19:41:15.771400: step: 220/530, loss: 0.007660370785742998 2023-01-22 19:41:16.864460: step: 224/530, loss: 0.008085745386779308 2023-01-22 19:41:17.970384: step: 228/530, loss: 0.005541825667023659 2023-01-22 19:41:19.064751: step: 232/530, loss: 0.0016924977535381913 2023-01-22 19:41:20.151201: step: 236/530, loss: 0.008505958132445812 2023-01-22 19:41:21.243587: step: 240/530, loss: 0.006898310501128435 2023-01-22 19:41:22.321705: step: 244/530, loss: 0.004474983084946871 2023-01-22 19:41:23.418475: step: 248/530, loss: 0.0010577687062323093 2023-01-22 19:41:24.514602: step: 252/530, loss: 0.0039393361657857895 2023-01-22 19:41:25.617672: step: 256/530, loss: 0.007406703196465969 2023-01-22 19:41:26.688487: step: 260/530, loss: 3.003341362273204e-07 2023-01-22 19:41:27.780230: step: 264/530, loss: 0.012480025179684162 2023-01-22 19:41:28.857815: step: 268/530, loss: 4.777618869411526e-06 2023-01-22 19:41:29.968288: step: 272/530, loss: 0.006687567103654146 2023-01-22 19:41:31.075253: step: 276/530, loss: 0.00017694816051516682 2023-01-22 19:41:32.162944: step: 280/530, loss: 0.0003960226022172719 2023-01-22 19:41:33.271177: step: 284/530, loss: 0.0006106164655648172 2023-01-22 19:41:34.358118: step: 288/530, loss: 0.0008020658860914409 2023-01-22 19:41:35.455721: step: 292/530, loss: 0.004469539970159531 2023-01-22 19:41:36.552858: step: 296/530, loss: 0.005460104439407587 2023-01-22 19:41:37.674756: step: 300/530, loss: 0.001034132787026465 2023-01-22 19:41:38.780718: step: 304/530, loss: 0.0002937859098892659 2023-01-22 19:41:39.881767: step: 308/530, loss: 0.007251308765262365 2023-01-22 19:41:40.961192: step: 312/530, loss: 0.00323469121940434 2023-01-22 19:41:42.065520: step: 316/530, loss: 0.011491605080664158 2023-01-22 19:41:43.148019: step: 320/530, loss: 0.0007970802835188806 2023-01-22 19:41:44.249473: step: 324/530, loss: 0.003871447406709194 2023-01-22 19:41:45.383350: step: 328/530, loss: 0.03132467716932297 2023-01-22 19:41:46.468625: step: 332/530, loss: 0.00546283321455121 2023-01-22 19:41:47.560237: step: 336/530, loss: 0.0006811360362917185 2023-01-22 19:41:48.646630: step: 340/530, loss: 0.009633843787014484 2023-01-22 19:41:49.735399: step: 344/530, loss: 0.0019323276355862617 2023-01-22 19:41:50.824401: step: 348/530, loss: 0.0005890722968615592 2023-01-22 19:41:51.906408: step: 352/530, loss: 0.011600606143474579 2023-01-22 19:41:53.013458: step: 356/530, loss: 0.0029137167148292065 2023-01-22 19:41:54.080295: step: 360/530, loss: 0.002526012249290943 2023-01-22 19:41:55.187220: step: 364/530, loss: 0.0022561270743608475 2023-01-22 19:41:56.286272: step: 368/530, loss: 0.0003573104622773826 2023-01-22 19:41:57.376003: step: 372/530, loss: 0.0012719127116724849 2023-01-22 19:41:58.500515: step: 376/530, loss: 0.0047092377208173275 2023-01-22 19:41:59.604475: step: 380/530, loss: 0.0037850087974220514 2023-01-22 19:42:00.712352: step: 384/530, loss: 0.0009696660563349724 2023-01-22 19:42:01.831662: step: 388/530, loss: 0.00386227760463953 2023-01-22 19:42:02.924611: step: 392/530, loss: 0.004639643710106611 2023-01-22 19:42:04.029773: step: 396/530, loss: 0.002485678531229496 2023-01-22 19:42:05.104471: step: 400/530, loss: 0.00032548923627473414 2023-01-22 19:42:06.206064: step: 404/530, loss: 0.002456765156239271 2023-01-22 19:42:07.274668: step: 408/530, loss: 9.76178671407979e-06 2023-01-22 19:42:08.374544: step: 412/530, loss: 0.006419209763407707 2023-01-22 19:42:09.449538: step: 416/530, loss: 0.009708626195788383 2023-01-22 19:42:10.548554: step: 420/530, loss: 0.00022630620514973998 2023-01-22 19:42:11.648153: step: 424/530, loss: 0.0035180081613361835 2023-01-22 19:42:12.755580: step: 428/530, loss: 0.0023558405227959156 2023-01-22 19:42:13.840832: step: 432/530, loss: 0.0030372757464647293 2023-01-22 19:42:14.931421: step: 436/530, loss: 0.002196301007643342 2023-01-22 19:42:16.034455: step: 440/530, loss: 0.004221763927489519 2023-01-22 19:42:17.120890: step: 444/530, loss: 0.001984473317861557 2023-01-22 19:42:18.217948: step: 448/530, loss: 0.00038633798249065876 2023-01-22 19:42:19.316905: step: 452/530, loss: 0.003452147589996457 2023-01-22 19:42:20.415467: step: 456/530, loss: 0.007510800380259752 2023-01-22 19:42:21.517786: step: 460/530, loss: 0.0007514133467338979 2023-01-22 19:42:22.611944: step: 464/530, loss: 0.000614840944763273 2023-01-22 19:42:23.707408: step: 468/530, loss: 0.009482195600867271 2023-01-22 19:42:24.798810: step: 472/530, loss: 0.0007676169043406844 2023-01-22 19:42:25.879659: step: 476/530, loss: 0.0026391278952360153 2023-01-22 19:42:26.970406: step: 480/530, loss: 0.006811762228608131 2023-01-22 19:42:28.057957: step: 484/530, loss: 0.006468001753091812 2023-01-22 19:42:29.151489: step: 488/530, loss: 0.00397089496254921 2023-01-22 19:42:30.241103: step: 492/530, loss: 0.002719681477174163 2023-01-22 19:42:31.338339: step: 496/530, loss: 0.0020633763633668423 2023-01-22 19:42:32.453492: step: 500/530, loss: 9.77211311692372e-05 2023-01-22 19:42:33.528989: step: 504/530, loss: 0.0008222581236623228 2023-01-22 19:42:34.607483: step: 508/530, loss: 0.0006518136360682547 2023-01-22 19:42:35.693907: step: 512/530, loss: 0.014863686636090279 2023-01-22 19:42:36.781835: step: 516/530, loss: 0.0010331552475690842 2023-01-22 19:42:37.873728: step: 520/530, loss: 0.00015811574121471494 2023-01-22 19:42:38.969285: step: 524/530, loss: 0.0014177013654261827 2023-01-22 19:42:40.066490: step: 528/530, loss: 0.0011622320162132382 2023-01-22 19:42:41.163500: step: 532/530, loss: 0.0053962827660143375 2023-01-22 19:42:42.283071: step: 536/530, loss: 0.0025527379475533962 2023-01-22 19:42:43.362669: step: 540/530, loss: 7.70887709222734e-05 2023-01-22 19:42:44.470633: step: 544/530, loss: 0.0022577052004635334 2023-01-22 19:42:45.562656: step: 548/530, loss: 8.863598850439303e-06 2023-01-22 19:42:46.668615: step: 552/530, loss: 0.004121160134673119 2023-01-22 19:42:47.757995: step: 556/530, loss: 0.005839852150529623 2023-01-22 19:42:48.853132: step: 560/530, loss: 4.106546384718968e-06 2023-01-22 19:42:49.922279: step: 564/530, loss: 6.0821498664154205e-06 2023-01-22 19:42:51.019818: step: 568/530, loss: 0.013007650151848793 2023-01-22 19:42:52.125161: step: 572/530, loss: 0.002608954207971692 2023-01-22 19:42:53.222789: step: 576/530, loss: 0.0001987192954402417 2023-01-22 19:42:54.326616: step: 580/530, loss: 0.0020917458459734917 2023-01-22 19:42:55.429118: step: 584/530, loss: 0.0034687542356550694 2023-01-22 19:42:56.536286: step: 588/530, loss: 0.0047590541653335094 2023-01-22 19:42:57.644541: step: 592/530, loss: 0.0007282274309545755 2023-01-22 19:42:58.715719: step: 596/530, loss: 1.887783764686901e-05 2023-01-22 19:42:59.840915: step: 600/530, loss: 0.006157950032502413 2023-01-22 19:43:00.933293: step: 604/530, loss: 0.0009968391386792064 2023-01-22 19:43:02.028603: step: 608/530, loss: 0.0010159407975152135 2023-01-22 19:43:03.095399: step: 612/530, loss: 0.00309828226454556 2023-01-22 19:43:04.184919: step: 616/530, loss: 0.003981821238994598 2023-01-22 19:43:05.286195: step: 620/530, loss: 0.0018538751173764467 2023-01-22 19:43:06.374851: step: 624/530, loss: 0.005044296383857727 2023-01-22 19:43:07.474896: step: 628/530, loss: 0.004188151098787785 2023-01-22 19:43:08.545635: step: 632/530, loss: 0.0024080753792077303 2023-01-22 19:43:09.650130: step: 636/530, loss: 0.00557094719260931 2023-01-22 19:43:10.756171: step: 640/530, loss: 0.004846950527280569 2023-01-22 19:43:11.873645: step: 644/530, loss: 0.002767184516415 2023-01-22 19:43:12.942530: step: 648/530, loss: 0.0003927384677808732 2023-01-22 19:43:14.027911: step: 652/530, loss: 0.004269721452146769 2023-01-22 19:43:15.143446: step: 656/530, loss: 0.008520129136741161 2023-01-22 19:43:16.221586: step: 660/530, loss: 0.005950061604380608 2023-01-22 19:43:17.307653: step: 664/530, loss: 7.245476444950327e-05 2023-01-22 19:43:18.393877: step: 668/530, loss: 0.0027762348763644695 2023-01-22 19:43:19.489953: step: 672/530, loss: 9.943183977156878e-05 2023-01-22 19:43:20.574909: step: 676/530, loss: 0.004367906600236893 2023-01-22 19:43:21.692335: step: 680/530, loss: 0.00047338640433736145 2023-01-22 19:43:22.790007: step: 684/530, loss: 0.0011735564330592752 2023-01-22 19:43:23.887220: step: 688/530, loss: 2.893675809900742e-05 2023-01-22 19:43:24.974382: step: 692/530, loss: 0.0009245704859495163 2023-01-22 19:43:26.073153: step: 696/530, loss: 0.0037451686803251505 2023-01-22 19:43:27.164115: step: 700/530, loss: 0.021765418350696564 2023-01-22 19:43:28.261975: step: 704/530, loss: 0.002269482472911477 2023-01-22 19:43:29.346221: step: 708/530, loss: 0.0 2023-01-22 19:43:30.428794: step: 712/530, loss: 0.0010808603838086128 2023-01-22 19:43:31.529781: step: 716/530, loss: 0.005610091611742973 2023-01-22 19:43:32.645025: step: 720/530, loss: 0.001090293750166893 2023-01-22 19:43:33.741343: step: 724/530, loss: 0.0022586656268686056 2023-01-22 19:43:34.846986: step: 728/530, loss: 0.030740924179553986 2023-01-22 19:43:35.950412: step: 732/530, loss: 0.001200369093567133 2023-01-22 19:43:37.043726: step: 736/530, loss: 0.004841573536396027 2023-01-22 19:43:38.130018: step: 740/530, loss: 0.0008445832063443959 2023-01-22 19:43:39.236180: step: 744/530, loss: 0.004193236585706472 2023-01-22 19:43:40.326482: step: 748/530, loss: 0.0038601115811616182 2023-01-22 19:43:41.413231: step: 752/530, loss: 0.0032526650466024876 2023-01-22 19:43:42.520985: step: 756/530, loss: 0.0018296608468517661 2023-01-22 19:43:43.606034: step: 760/530, loss: 3.840676072286442e-05 2023-01-22 19:43:44.706144: step: 764/530, loss: 0.0003374102816451341 2023-01-22 19:43:45.810177: step: 768/530, loss: 0.00048198073636740446 2023-01-22 19:43:46.899824: step: 772/530, loss: 0.007557819131761789 2023-01-22 19:43:48.009307: step: 776/530, loss: 0.0006743691628798842 2023-01-22 19:43:49.099405: step: 780/530, loss: 0.0028557456098496914 2023-01-22 19:43:50.198765: step: 784/530, loss: 0.0003291918837931007 2023-01-22 19:43:51.280859: step: 788/530, loss: 0.010044308379292488 2023-01-22 19:43:52.372318: step: 792/530, loss: 0.0012281634844839573 2023-01-22 19:43:53.478336: step: 796/530, loss: 0.007754568476229906 2023-01-22 19:43:54.559678: step: 800/530, loss: 0.004021527711302042 2023-01-22 19:43:55.639918: step: 804/530, loss: 0.0003520576865412295 2023-01-22 19:43:56.747106: step: 808/530, loss: 0.0032094307243824005 2023-01-22 19:43:57.861566: step: 812/530, loss: 0.0008712415001355112 2023-01-22 19:43:58.948376: step: 816/530, loss: 0.007400264963507652 2023-01-22 19:44:00.036440: step: 820/530, loss: 0.005930343642830849 2023-01-22 19:44:01.127808: step: 824/530, loss: 0.006092222407460213 2023-01-22 19:44:02.223092: step: 828/530, loss: 0.007556985132396221 2023-01-22 19:44:03.310240: step: 832/530, loss: 0.0025327824987471104 2023-01-22 19:44:04.406401: step: 836/530, loss: 0.011381884105503559 2023-01-22 19:44:05.515780: step: 840/530, loss: 0.0039446656592190266 2023-01-22 19:44:06.629186: step: 844/530, loss: 0.008466324768960476 2023-01-22 19:44:07.715532: step: 848/530, loss: 6.4050109358504415e-06 2023-01-22 19:44:08.805313: step: 852/530, loss: 0.007452858611941338 2023-01-22 19:44:09.907115: step: 856/530, loss: 0.01534226629883051 2023-01-22 19:44:10.989662: step: 860/530, loss: 6.664237844233867e-06 2023-01-22 19:44:12.094892: step: 864/530, loss: 5.0291376396671694e-08 2023-01-22 19:44:13.191407: step: 868/530, loss: 0.019897237420082092 2023-01-22 19:44:14.266116: step: 872/530, loss: 0.0039535523392260075 2023-01-22 19:44:15.342464: step: 876/530, loss: 0.012000597082078457 2023-01-22 19:44:16.451183: step: 880/530, loss: 0.039778389036655426 2023-01-22 19:44:17.530788: step: 884/530, loss: 0.002352713607251644 2023-01-22 19:44:18.618286: step: 888/530, loss: 0.0013583969557657838 2023-01-22 19:44:19.710030: step: 892/530, loss: 0.0005925582372583449 2023-01-22 19:44:20.806852: step: 896/530, loss: 0.0014661260647699237 2023-01-22 19:44:21.879188: step: 900/530, loss: 0.0003891157975886017 2023-01-22 19:44:22.972284: step: 904/530, loss: 0.001099692191928625 2023-01-22 19:44:24.072820: step: 908/530, loss: 0.0011839447543025017 2023-01-22 19:44:25.169842: step: 912/530, loss: 0.0001947626005858183 2023-01-22 19:44:26.277364: step: 916/530, loss: 0.017845891416072845 2023-01-22 19:44:27.393833: step: 920/530, loss: 0.0017318632453680038 2023-01-22 19:44:28.475048: step: 924/530, loss: 0.0030967986676841974 2023-01-22 19:44:29.546740: step: 928/530, loss: 0.006518544163554907 2023-01-22 19:44:30.639314: step: 932/530, loss: 0.004933425225317478 2023-01-22 19:44:31.731949: step: 936/530, loss: 0.021260403096675873 2023-01-22 19:44:32.822948: step: 940/530, loss: 0.006665264256298542 2023-01-22 19:44:33.934759: step: 944/530, loss: 0.0007224353612400591 2023-01-22 19:44:35.024197: step: 948/530, loss: 0.004189273342490196 2023-01-22 19:44:36.137434: step: 952/530, loss: 0.0008263826020993292 2023-01-22 19:44:37.246728: step: 956/530, loss: 0.00208522891625762 2023-01-22 19:44:38.341322: step: 960/530, loss: 0.0052817403338849545 2023-01-22 19:44:39.424613: step: 964/530, loss: 0.0019786537159234285 2023-01-22 19:44:40.527338: step: 968/530, loss: 0.0011980137787759304 2023-01-22 19:44:41.613385: step: 972/530, loss: 0.003914820495992899 2023-01-22 19:44:42.712255: step: 976/530, loss: 0.0023069828748703003 2023-01-22 19:44:43.802168: step: 980/530, loss: 0.004015594255179167 2023-01-22 19:44:44.897328: step: 984/530, loss: 0.004730938468128443 2023-01-22 19:44:45.983633: step: 988/530, loss: 0.004416345153003931 2023-01-22 19:44:47.072595: step: 992/530, loss: 0.00339575856924057 2023-01-22 19:44:48.192503: step: 996/530, loss: 0.0026151412166655064 2023-01-22 19:44:49.271853: step: 1000/530, loss: 0.0025615852791815996 2023-01-22 19:44:50.384168: step: 1004/530, loss: 0.002780602080747485 2023-01-22 19:44:51.467707: step: 1008/530, loss: 0.0024323835968971252 2023-01-22 19:44:52.559213: step: 1012/530, loss: 0.0017398330383002758 2023-01-22 19:44:53.652760: step: 1016/530, loss: 0.0017514735227450728 2023-01-22 19:44:54.722170: step: 1020/530, loss: 0.0011801804648712277 2023-01-22 19:44:55.820246: step: 1024/530, loss: 0.010364910587668419 2023-01-22 19:44:56.923441: step: 1028/530, loss: 0.0030158699955791235 2023-01-22 19:44:58.007581: step: 1032/530, loss: 0.000503338931594044 2023-01-22 19:44:59.112976: step: 1036/530, loss: 0.003913387656211853 2023-01-22 19:45:00.219518: step: 1040/530, loss: 0.0008146704640239477 2023-01-22 19:45:01.305954: step: 1044/530, loss: 0.002618949394673109 2023-01-22 19:45:02.413308: step: 1048/530, loss: 5.17438274982851e-05 2023-01-22 19:45:03.513076: step: 1052/530, loss: 0.00746112409979105 2023-01-22 19:45:04.615888: step: 1056/530, loss: 0.05978460982441902 2023-01-22 19:45:05.717670: step: 1060/530, loss: 0.01746443286538124 2023-01-22 19:45:06.843124: step: 1064/530, loss: 0.0065761590376496315 2023-01-22 19:45:07.959425: step: 1068/530, loss: 0.00971446093171835 2023-01-22 19:45:09.027804: step: 1072/530, loss: 0.004888199269771576 2023-01-22 19:45:10.135587: step: 1076/530, loss: 0.0019925145898014307 2023-01-22 19:45:11.198131: step: 1080/530, loss: 0.0013363719917833805 2023-01-22 19:45:12.304372: step: 1084/530, loss: 0.009254733100533485 2023-01-22 19:45:13.379854: step: 1088/530, loss: 0.0003369998885318637 2023-01-22 19:45:14.494044: step: 1092/530, loss: 0.006268787197768688 2023-01-22 19:45:15.581441: step: 1096/530, loss: 0.008753328584134579 2023-01-22 19:45:16.683641: step: 1100/530, loss: 0.0003484312037471682 2023-01-22 19:45:17.771050: step: 1104/530, loss: 0.006100955884903669 2023-01-22 19:45:18.849858: step: 1108/530, loss: 0.00019000712200067937 2023-01-22 19:45:19.940153: step: 1112/530, loss: 0.011058731004595757 2023-01-22 19:45:21.019904: step: 1116/530, loss: 0.0030486814212054014 2023-01-22 19:45:22.090232: step: 1120/530, loss: 0.005386482924222946 2023-01-22 19:45:23.164336: step: 1124/530, loss: 0.00038144763675518334 2023-01-22 19:45:24.254530: step: 1128/530, loss: 0.003398491069674492 2023-01-22 19:45:25.332703: step: 1132/530, loss: 0.0002537529217079282 2023-01-22 19:45:26.425852: step: 1136/530, loss: 0.002493631560355425 2023-01-22 19:45:27.518889: step: 1140/530, loss: 0.002667548367753625 2023-01-22 19:45:28.591278: step: 1144/530, loss: 0.019800031557679176 2023-01-22 19:45:29.665693: step: 1148/530, loss: 0.009160289540886879 2023-01-22 19:45:30.762115: step: 1152/530, loss: 0.0018552790861576796 2023-01-22 19:45:31.869661: step: 1156/530, loss: 0.0043502552434802055 2023-01-22 19:45:32.973223: step: 1160/530, loss: 0.0003805956512223929 2023-01-22 19:45:34.049086: step: 1164/530, loss: 0.000876463542226702 2023-01-22 19:45:35.122214: step: 1168/530, loss: 2.4589211534475908e-05 2023-01-22 19:45:36.245426: step: 1172/530, loss: 0.0008695876458659768 2023-01-22 19:45:37.324869: step: 1176/530, loss: 0.0009143345523625612 2023-01-22 19:45:38.429136: step: 1180/530, loss: 0.0020415079779922962 2023-01-22 19:45:39.521503: step: 1184/530, loss: 0.002801405033096671 2023-01-22 19:45:40.599363: step: 1188/530, loss: 0.0018937858985736966 2023-01-22 19:45:41.691616: step: 1192/530, loss: 0.00959955994039774 2023-01-22 19:45:42.795887: step: 1196/530, loss: 0.004226675722748041 2023-01-22 19:45:43.874022: step: 1200/530, loss: 2.4448534531984478e-05 2023-01-22 19:45:44.958130: step: 1204/530, loss: 0.011197513900697231 2023-01-22 19:45:46.045555: step: 1208/530, loss: 0.013362959958612919 2023-01-22 19:45:47.118771: step: 1212/530, loss: 0.0010965893743559718 2023-01-22 19:45:48.213168: step: 1216/530, loss: 0.0026229280047118664 2023-01-22 19:45:49.312145: step: 1220/530, loss: 0.005070118233561516 2023-01-22 19:45:50.409268: step: 1224/530, loss: 0.0026583687867969275 2023-01-22 19:45:51.494975: step: 1228/530, loss: 0.003312967484816909 2023-01-22 19:45:52.590234: step: 1232/530, loss: 0.0008142516599036753 2023-01-22 19:45:53.707033: step: 1236/530, loss: 0.0021133790723979473 2023-01-22 19:45:54.787998: step: 1240/530, loss: 0.0034803026355803013 2023-01-22 19:45:55.880611: step: 1244/530, loss: 0.0067142341285943985 2023-01-22 19:45:56.949747: step: 1248/530, loss: 0.008614704012870789 2023-01-22 19:45:58.032493: step: 1252/530, loss: 0.0012909629149362445 2023-01-22 19:45:59.099423: step: 1256/530, loss: 0.0015210537239909172 2023-01-22 19:46:00.193745: step: 1260/530, loss: 0.00339047540910542 2023-01-22 19:46:01.281407: step: 1264/530, loss: 0.0027066462207585573 2023-01-22 19:46:02.357976: step: 1268/530, loss: 0.000420679192757234 2023-01-22 19:46:03.445146: step: 1272/530, loss: 0.02238692343235016 2023-01-22 19:46:04.550242: step: 1276/530, loss: 0.0003682363894768059 2023-01-22 19:46:05.664991: step: 1280/530, loss: 0.007898399606347084 2023-01-22 19:46:06.753631: step: 1284/530, loss: 4.020193046017084e-06 2023-01-22 19:46:07.855626: step: 1288/530, loss: 0.0008638929575681686 2023-01-22 19:46:08.976611: step: 1292/530, loss: 0.008006955496966839 2023-01-22 19:46:10.092657: step: 1296/530, loss: 0.00043161181383766234 2023-01-22 19:46:11.174131: step: 1300/530, loss: 0.0001510414876975119 2023-01-22 19:46:12.308559: step: 1304/530, loss: 0.0007518358179368079 2023-01-22 19:46:13.403908: step: 1308/530, loss: 0.0006505374331027269 2023-01-22 19:46:14.486691: step: 1312/530, loss: 0.004661477170884609 2023-01-22 19:46:15.572691: step: 1316/530, loss: 0.0009284016559831798 2023-01-22 19:46:16.668487: step: 1320/530, loss: 0.012900302186608315 2023-01-22 19:46:17.729675: step: 1324/530, loss: 0.005833383649587631 2023-01-22 19:46:18.814963: step: 1328/530, loss: 1.515905387350358e-05 2023-01-22 19:46:19.889320: step: 1332/530, loss: 0.0018105567432940006 2023-01-22 19:46:20.989690: step: 1336/530, loss: 0.002501973882317543 2023-01-22 19:46:22.072244: step: 1340/530, loss: 0.003806342603638768 2023-01-22 19:46:23.164820: step: 1344/530, loss: 0.011848351918160915 2023-01-22 19:46:24.260100: step: 1348/530, loss: 0.0026647765189409256 2023-01-22 19:46:25.383770: step: 1352/530, loss: 0.010918958112597466 2023-01-22 19:46:26.471085: step: 1356/530, loss: 0.0034258549567312002 2023-01-22 19:46:27.563747: step: 1360/530, loss: 0.02496151439845562 2023-01-22 19:46:28.642193: step: 1364/530, loss: 0.0033963769674301147 2023-01-22 19:46:29.720994: step: 1368/530, loss: 0.0012569841928780079 2023-01-22 19:46:30.812075: step: 1372/530, loss: 0.014646589756011963 2023-01-22 19:46:31.945506: step: 1376/530, loss: 0.00520023750141263 2023-01-22 19:46:33.026099: step: 1380/530, loss: 0.008949876762926579 2023-01-22 19:46:34.102098: step: 1384/530, loss: 0.014099440537393093 2023-01-22 19:46:35.182076: step: 1388/530, loss: 0.0017189332284033298 2023-01-22 19:46:36.281635: step: 1392/530, loss: 0.009262565523386002 2023-01-22 19:46:37.367770: step: 1396/530, loss: 0.0012344110291451216 2023-01-22 19:46:38.455734: step: 1400/530, loss: 0.0008225159836001694 2023-01-22 19:46:39.576345: step: 1404/530, loss: 0.0014936174266040325 2023-01-22 19:46:40.688671: step: 1408/530, loss: 0.003664296120405197 2023-01-22 19:46:41.825577: step: 1412/530, loss: 0.00030481244903057814 2023-01-22 19:46:42.926540: step: 1416/530, loss: 0.002614325378090143 2023-01-22 19:46:44.021332: step: 1420/530, loss: 0.007549910340458155 2023-01-22 19:46:45.125822: step: 1424/530, loss: 0.038141150027513504 2023-01-22 19:46:46.211644: step: 1428/530, loss: 0.004947444889694452 2023-01-22 19:46:47.339941: step: 1432/530, loss: 0.00578342517837882 2023-01-22 19:46:48.422092: step: 1436/530, loss: 0.005597495473921299 2023-01-22 19:46:49.505236: step: 1440/530, loss: 0.0017578318947926164 2023-01-22 19:46:50.589417: step: 1444/530, loss: 0.003772624535486102 2023-01-22 19:46:51.687144: step: 1448/530, loss: 0.008857645094394684 2023-01-22 19:46:52.768970: step: 1452/530, loss: 0.00011549842020031065 2023-01-22 19:46:53.884854: step: 1456/530, loss: 0.004917779937386513 2023-01-22 19:46:54.979686: step: 1460/530, loss: 0.0004713029193226248 2023-01-22 19:46:56.066320: step: 1464/530, loss: 3.580367410904728e-05 2023-01-22 19:46:57.155413: step: 1468/530, loss: 0.024880684912204742 2023-01-22 19:46:58.269785: step: 1472/530, loss: 0.015539719723165035 2023-01-22 19:46:59.360301: step: 1476/530, loss: 0.0030423651915043592 2023-01-22 19:47:00.444465: step: 1480/530, loss: 0.0005326632526703179 2023-01-22 19:47:01.583752: step: 1484/530, loss: 0.00669434666633606 2023-01-22 19:47:02.664465: step: 1488/530, loss: 0.006360972300171852 2023-01-22 19:47:03.770108: step: 1492/530, loss: 0.004966961685568094 2023-01-22 19:47:04.881216: step: 1496/530, loss: 7.674341031815857e-05 2023-01-22 19:47:05.984761: step: 1500/530, loss: 0.000766607525292784 2023-01-22 19:47:07.057644: step: 1504/530, loss: 0.002515893429517746 2023-01-22 19:47:08.159291: step: 1508/530, loss: 0.007046996150165796 2023-01-22 19:47:09.266163: step: 1512/530, loss: 0.0013534441823139787 2023-01-22 19:47:10.336864: step: 1516/530, loss: 0.002146252663806081 2023-01-22 19:47:11.409429: step: 1520/530, loss: 0.0004873658763244748 2023-01-22 19:47:12.525140: step: 1524/530, loss: 0.004555124323815107 2023-01-22 19:47:13.618187: step: 1528/530, loss: 0.0035639917477965355 2023-01-22 19:47:14.689071: step: 1532/530, loss: 0.007021291647106409 2023-01-22 19:47:15.767495: step: 1536/530, loss: 0.007638323120772839 2023-01-22 19:47:16.857019: step: 1540/530, loss: 0.00022224440181162208 2023-01-22 19:47:17.956160: step: 1544/530, loss: 0.001797450939193368 2023-01-22 19:47:19.053675: step: 1548/530, loss: 0.004820940550416708 2023-01-22 19:47:20.157399: step: 1552/530, loss: 0.00698222778737545 2023-01-22 19:47:21.264482: step: 1556/530, loss: 0.0018218755722045898 2023-01-22 19:47:22.356813: step: 1560/530, loss: 0.0015776666114106774 2023-01-22 19:47:23.449757: step: 1564/530, loss: 0.0002898024977184832 2023-01-22 19:47:24.541585: step: 1568/530, loss: 0.0038671568036079407 2023-01-22 19:47:25.633169: step: 1572/530, loss: 0.018185589462518692 2023-01-22 19:47:26.746696: step: 1576/530, loss: 0.005456727463752031 2023-01-22 19:47:27.838058: step: 1580/530, loss: 0.009965651668608189 2023-01-22 19:47:28.941305: step: 1584/530, loss: 0.0066036018542945385 2023-01-22 19:47:30.039960: step: 1588/530, loss: 0.00564106460660696 2023-01-22 19:47:31.114948: step: 1592/530, loss: 0.002011688658967614 2023-01-22 19:47:32.198799: step: 1596/530, loss: 0.0003201515937689692 2023-01-22 19:47:33.311245: step: 1600/530, loss: 0.002538562985137105 2023-01-22 19:47:34.406287: step: 1604/530, loss: 0.017771240323781967 2023-01-22 19:47:35.489449: step: 1608/530, loss: 0.00866878405213356 2023-01-22 19:47:36.589044: step: 1612/530, loss: 0.003042306285351515 2023-01-22 19:47:37.686192: step: 1616/530, loss: 0.005300478078424931 2023-01-22 19:47:38.761377: step: 1620/530, loss: 0.005812700837850571 2023-01-22 19:47:39.880522: step: 1624/530, loss: 0.002968069165945053 2023-01-22 19:47:40.964210: step: 1628/530, loss: 0.004015675280243158 2023-01-22 19:47:42.058856: step: 1632/530, loss: 0.007417803164571524 2023-01-22 19:47:43.168582: step: 1636/530, loss: 0.00010906918032560498 2023-01-22 19:47:44.285438: step: 1640/530, loss: 0.0008300939225591719 2023-01-22 19:47:45.392617: step: 1644/530, loss: 0.03929116204380989 2023-01-22 19:47:46.484489: step: 1648/530, loss: 0.003633128711953759 2023-01-22 19:47:47.586862: step: 1652/530, loss: 0.0004056805628351867 2023-01-22 19:47:48.691171: step: 1656/530, loss: 0.00047271084622479975 2023-01-22 19:47:49.784580: step: 1660/530, loss: 0.00017324018699582666 2023-01-22 19:47:50.880419: step: 1664/530, loss: 0.0009093162370845675 2023-01-22 19:47:51.984290: step: 1668/530, loss: 0.0016274412628263235 2023-01-22 19:47:53.063703: step: 1672/530, loss: 2.1692556401831098e-05 2023-01-22 19:47:54.155696: step: 1676/530, loss: 0.002160932868719101 2023-01-22 19:47:55.243618: step: 1680/530, loss: 0.002776879584416747 2023-01-22 19:47:56.317594: step: 1684/530, loss: 0.0 2023-01-22 19:47:57.417008: step: 1688/530, loss: 0.001768921036273241 2023-01-22 19:47:58.508447: step: 1692/530, loss: 8.10049386927858e-05 2023-01-22 19:47:59.589253: step: 1696/530, loss: 0.0010290194768458605 2023-01-22 19:48:00.700673: step: 1700/530, loss: 0.004831664729863405 2023-01-22 19:48:01.785231: step: 1704/530, loss: 0.004273466765880585 2023-01-22 19:48:02.889142: step: 1708/530, loss: 0.003378627821803093 2023-01-22 19:48:03.962057: step: 1712/530, loss: 0.004147721920162439 2023-01-22 19:48:05.062080: step: 1716/530, loss: 0.004268621560186148 2023-01-22 19:48:06.162530: step: 1720/530, loss: 0.004693754017353058 2023-01-22 19:48:07.272596: step: 1724/530, loss: 0.004603015258908272 2023-01-22 19:48:08.374229: step: 1728/530, loss: 0.08938749134540558 2023-01-22 19:48:09.461426: step: 1732/530, loss: 0.005390554666519165 2023-01-22 19:48:10.560963: step: 1736/530, loss: 0.0003526887157931924 2023-01-22 19:48:11.667460: step: 1740/530, loss: 0.010446108877658844 2023-01-22 19:48:12.785005: step: 1744/530, loss: 0.00035366369411349297 2023-01-22 19:48:13.885223: step: 1748/530, loss: 0.002506296383216977 2023-01-22 19:48:14.957936: step: 1752/530, loss: 0.0028603640384972095 2023-01-22 19:48:16.052361: step: 1756/530, loss: 0.0045945653691887856 2023-01-22 19:48:17.166988: step: 1760/530, loss: 0.004601327236741781 2023-01-22 19:48:18.271526: step: 1764/530, loss: 0.013493113219738007 2023-01-22 19:48:19.348444: step: 1768/530, loss: 0.0003100834437645972 2023-01-22 19:48:20.446454: step: 1772/530, loss: 0.013857807964086533 2023-01-22 19:48:21.549348: step: 1776/530, loss: 0.003310558618977666 2023-01-22 19:48:22.620550: step: 1780/530, loss: 0.002016305923461914 2023-01-22 19:48:23.748486: step: 1784/530, loss: 0.004242977127432823 2023-01-22 19:48:24.861171: step: 1788/530, loss: 0.004578152671456337 2023-01-22 19:48:25.963284: step: 1792/530, loss: 0.0019369639921933413 2023-01-22 19:48:27.067756: step: 1796/530, loss: 7.450491921190405e-07 2023-01-22 19:48:28.168456: step: 1800/530, loss: 0.0041890013962984085 2023-01-22 19:48:29.260651: step: 1804/530, loss: 0.0003966613730881363 2023-01-22 19:48:30.349197: step: 1808/530, loss: 0.0009504702175036073 2023-01-22 19:48:31.436088: step: 1812/530, loss: 0.0070826588198542595 2023-01-22 19:48:32.550467: step: 1816/530, loss: 0.00793431419879198 2023-01-22 19:48:33.624534: step: 1820/530, loss: 0.0007111338200047612 2023-01-22 19:48:34.744499: step: 1824/530, loss: 0.02384822629392147 2023-01-22 19:48:35.858083: step: 1828/530, loss: 0.011601111851632595 2023-01-22 19:48:36.947120: step: 1832/530, loss: 0.000378284981707111 2023-01-22 19:48:38.030853: step: 1836/530, loss: 0.004807294346392155 2023-01-22 19:48:39.115636: step: 1840/530, loss: 0.0010158069198951125 2023-01-22 19:48:40.195998: step: 1844/530, loss: 0.004164641257375479 2023-01-22 19:48:41.269215: step: 1848/530, loss: 0.0009046039776876569 2023-01-22 19:48:42.365563: step: 1852/530, loss: 6.486716756626265e-06 2023-01-22 19:48:43.457582: step: 1856/530, loss: 0.003988295793533325 2023-01-22 19:48:44.557917: step: 1860/530, loss: 0.002295270562171936 2023-01-22 19:48:45.643188: step: 1864/530, loss: 0.0038218514528125525 2023-01-22 19:48:46.719121: step: 1868/530, loss: 0.0015781333204358816 2023-01-22 19:48:47.796461: step: 1872/530, loss: 0.008558275178074837 2023-01-22 19:48:48.920211: step: 1876/530, loss: 0.005718821659684181 2023-01-22 19:48:50.032585: step: 1880/530, loss: 0.0019060020567849278 2023-01-22 19:48:51.128976: step: 1884/530, loss: 0.011836216785013676 2023-01-22 19:48:52.214673: step: 1888/530, loss: 0.0028520463965833187 2023-01-22 19:48:53.324980: step: 1892/530, loss: 0.011126195080578327 2023-01-22 19:48:54.438904: step: 1896/530, loss: 0.005881585646420717 2023-01-22 19:48:55.530961: step: 1900/530, loss: 0.0021082295570522547 2023-01-22 19:48:56.632874: step: 1904/530, loss: 0.0027009572368115187 2023-01-22 19:48:57.734521: step: 1908/530, loss: 0.006047988776117563 2023-01-22 19:48:58.840126: step: 1912/530, loss: 0.0039531332440674305 2023-01-22 19:48:59.933346: step: 1916/530, loss: 0.005742067936807871 2023-01-22 19:49:01.006107: step: 1920/530, loss: 0.0011928094318136573 2023-01-22 19:49:02.093173: step: 1924/530, loss: 0.0011774139711633325 2023-01-22 19:49:03.188321: step: 1928/530, loss: 0.0015301486710086465 2023-01-22 19:49:04.274702: step: 1932/530, loss: 0.003928130026906729 2023-01-22 19:49:05.370697: step: 1936/530, loss: 0.0003547614032868296 2023-01-22 19:49:06.462022: step: 1940/530, loss: 0.0043481444008648396 2023-01-22 19:49:07.542726: step: 1944/530, loss: 0.003280860371887684 2023-01-22 19:49:08.652292: step: 1948/530, loss: 0.0063994633965194225 2023-01-22 19:49:09.761520: step: 1952/530, loss: 0.0040566879324615 2023-01-22 19:49:10.847242: step: 1956/530, loss: 1.2758776392729487e-05 2023-01-22 19:49:11.961250: step: 1960/530, loss: 0.002702544443309307 2023-01-22 19:49:13.052447: step: 1964/530, loss: 0.004193741362541914 2023-01-22 19:49:14.117489: step: 1968/530, loss: 0.003984420094639063 2023-01-22 19:49:15.215593: step: 1972/530, loss: 0.003577832132577896 2023-01-22 19:49:16.304003: step: 1976/530, loss: 0.004695831798017025 2023-01-22 19:49:17.389364: step: 1980/530, loss: 0.00024278204364236444 2023-01-22 19:49:18.486816: step: 1984/530, loss: 0.00016520480858162045 2023-01-22 19:49:19.580262: step: 1988/530, loss: 0.0004756670678034425 2023-01-22 19:49:20.694829: step: 1992/530, loss: 0.005009965039789677 2023-01-22 19:49:21.766891: step: 1996/530, loss: 0.00016160421364475042 2023-01-22 19:49:22.864728: step: 2000/530, loss: 0.002480706898495555 2023-01-22 19:49:23.979495: step: 2004/530, loss: 0.00024894674425013363 2023-01-22 19:49:25.087956: step: 2008/530, loss: 0.006939046084880829 2023-01-22 19:49:26.176355: step: 2012/530, loss: 0.02630123309791088 2023-01-22 19:49:27.273273: step: 2016/530, loss: 0.001474782358855009 2023-01-22 19:49:28.356471: step: 2020/530, loss: 0.004352755844593048 2023-01-22 19:49:29.452543: step: 2024/530, loss: 0.013139724731445312 2023-01-22 19:49:30.535514: step: 2028/530, loss: 4.3009305954910815e-05 2023-01-22 19:49:31.636126: step: 2032/530, loss: 0.0018679157365113497 2023-01-22 19:49:32.738686: step: 2036/530, loss: 0.0032187236938625574 2023-01-22 19:49:33.843821: step: 2040/530, loss: 0.0013946050312370062 2023-01-22 19:49:34.918932: step: 2044/530, loss: 0.004480474628508091 2023-01-22 19:49:36.012031: step: 2048/530, loss: 0.00010630625183694065 2023-01-22 19:49:37.140229: step: 2052/530, loss: 0.02964196354150772 2023-01-22 19:49:38.225344: step: 2056/530, loss: 0.006195282097905874 2023-01-22 19:49:39.310616: step: 2060/530, loss: 0.005950705148279667 2023-01-22 19:49:40.412669: step: 2064/530, loss: 0.006208291742950678 2023-01-22 19:49:41.493326: step: 2068/530, loss: 0.0176533255726099 2023-01-22 19:49:42.587083: step: 2072/530, loss: 0.0007111184531822801 2023-01-22 19:49:43.664373: step: 2076/530, loss: 0.0028486649971455336 2023-01-22 19:49:44.754399: step: 2080/530, loss: 0.0017024489352479577 2023-01-22 19:49:45.826580: step: 2084/530, loss: 0.00044607679592445493 2023-01-22 19:49:46.898399: step: 2088/530, loss: 0.005664762109518051 2023-01-22 19:49:47.994515: step: 2092/530, loss: 0.011150743812322617 2023-01-22 19:49:49.081484: step: 2096/530, loss: 0.0023099160753190517 2023-01-22 19:49:50.169541: step: 2100/530, loss: 0.007214162033051252 2023-01-22 19:49:51.264920: step: 2104/530, loss: 0.001990193733945489 2023-01-22 19:49:52.356445: step: 2108/530, loss: 0.003204174805432558 2023-01-22 19:49:53.443533: step: 2112/530, loss: 0.002190495142713189 2023-01-22 19:49:54.531476: step: 2116/530, loss: 0.0008908937452360988 2023-01-22 19:49:55.635685: step: 2120/530, loss: 0.004174768924713135 ================================================== Loss: 0.005 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3353593710211357, 'r': 0.3569954594741122, 'f1': 0.3458393513655462}, 'combined': 0.254828995743034, 'stategy': 1, 'epoch': 13} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3353026945447007, 'r': 0.2875444472505, 'f1': 0.30959258378088983}, 'combined': 0.1922732888744474, 'stategy': 1, 'epoch': 13} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3463071521960457, 'r': 0.3436786349118252, 'f1': 0.3449878868543464}, 'combined': 0.2542016008400447, 'stategy': 1, 'epoch': 13} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3215244045174571, 'r': 0.28685955773961064, 'f1': 0.3032044044691546}, 'combined': 0.188305893301896, 'stategy': 1, 'epoch': 13} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3404785076596817, 'r': 0.3275571221697507, 'f1': 0.3338928498712933}, 'combined': 0.24602631043147927, 'stategy': 1, 'epoch': 13} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3465677113481918, 'r': 0.2938812083396809, 'f1': 0.31805733338471875}, 'combined': 0.19753034389156218, 'stategy': 1, 'epoch': 13} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3138888888888889, 'r': 0.4035714285714286, 'f1': 0.35312499999999997}, 'combined': 0.23541666666666664, 'stategy': 1, 'epoch': 13} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.38636363636363635, 'r': 0.5543478260869565, 'f1': 0.4553571428571429}, 'combined': 0.22767857142857145, 'stategy': 1, 'epoch': 13} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 13} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 14 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 19:52:28.290484: step: 4/530, loss: 0.00041957953362725675 2023-01-22 19:52:29.369196: step: 8/530, loss: 0.0012305567506700754 2023-01-22 19:52:30.434215: step: 12/530, loss: 0.0003846187610179186 2023-01-22 19:52:31.544467: step: 16/530, loss: 0.0017954891081899405 2023-01-22 19:52:32.618048: step: 20/530, loss: 0.005422938149422407 2023-01-22 19:52:33.698648: step: 24/530, loss: 0.002643261570483446 2023-01-22 19:52:34.783881: step: 28/530, loss: 0.0018135977443307638 2023-01-22 19:52:35.860591: step: 32/530, loss: 0.00037464252091012895 2023-01-22 19:52:36.935899: step: 36/530, loss: 0.0020497890654951334 2023-01-22 19:52:38.014359: step: 40/530, loss: 0.006587619427591562 2023-01-22 19:52:39.094842: step: 44/530, loss: 0.0009700774680823088 2023-01-22 19:52:40.203384: step: 48/530, loss: 0.0007794132689014077 2023-01-22 19:52:41.286463: step: 52/530, loss: 0.009133766405284405 2023-01-22 19:52:42.357780: step: 56/530, loss: 0.0033496320247650146 2023-01-22 19:52:43.455765: step: 60/530, loss: 0.011073989793658257 2023-01-22 19:52:44.530000: step: 64/530, loss: 0.004006025847047567 2023-01-22 19:52:45.616707: step: 68/530, loss: 0.0008794956956990063 2023-01-22 19:52:46.725161: step: 72/530, loss: 0.005165646784007549 2023-01-22 19:52:47.807353: step: 76/530, loss: 0.011668819934129715 2023-01-22 19:52:48.875135: step: 80/530, loss: 0.0006029019132256508 2023-01-22 19:52:49.953666: step: 84/530, loss: 0.0005558215198107064 2023-01-22 19:52:51.060412: step: 88/530, loss: 0.0032922138925641775 2023-01-22 19:52:52.156841: step: 92/530, loss: 0.0003902245662175119 2023-01-22 19:52:53.252300: step: 96/530, loss: 0.005438562016934156 2023-01-22 19:52:54.343758: step: 100/530, loss: 0.0003223950625397265 2023-01-22 19:52:55.429986: step: 104/530, loss: 0.0024952334351837635 2023-01-22 19:52:56.532461: step: 108/530, loss: 0.0030183882918208838 2023-01-22 19:52:57.622507: step: 112/530, loss: 0.0002886571455746889 2023-01-22 19:52:58.698982: step: 116/530, loss: 0.007234872318804264 2023-01-22 19:52:59.796329: step: 120/530, loss: 0.0008107398170977831 2023-01-22 19:53:00.886348: step: 124/530, loss: 0.0011682487092912197 2023-01-22 19:53:01.962587: step: 128/530, loss: 0.00020595089881680906 2023-01-22 19:53:03.045977: step: 132/530, loss: 0.00039724650559946895 2023-01-22 19:53:04.118094: step: 136/530, loss: 0.007038023788481951 2023-01-22 19:53:05.206066: step: 140/530, loss: 0.0032320325262844563 2023-01-22 19:53:06.313508: step: 144/530, loss: 0.009678706526756287 2023-01-22 19:53:07.390300: step: 148/530, loss: 0.003409762866795063 2023-01-22 19:53:08.487267: step: 152/530, loss: 0.0020736628212034702 2023-01-22 19:53:09.559130: step: 156/530, loss: 0.001371394144371152 2023-01-22 19:53:10.633193: step: 160/530, loss: 0.0038567499723285437 2023-01-22 19:53:11.714487: step: 164/530, loss: 0.003594342153519392 2023-01-22 19:53:12.807442: step: 168/530, loss: 0.002544281305745244 2023-01-22 19:53:13.888084: step: 172/530, loss: 0.0010763269383460283 2023-01-22 19:53:14.960482: step: 176/530, loss: 0.00584668293595314 2023-01-22 19:53:16.035700: step: 180/530, loss: 0.005828606430441141 2023-01-22 19:53:17.115412: step: 184/530, loss: 6.124362698756158e-06 2023-01-22 19:53:18.196214: step: 188/530, loss: 0.0013317487901076674 2023-01-22 19:53:19.274759: step: 192/530, loss: 0.0005292042624205351 2023-01-22 19:53:20.375044: step: 196/530, loss: 0.0014115390367805958 2023-01-22 19:53:21.459161: step: 200/530, loss: 0.0025520212948322296 2023-01-22 19:53:22.559721: step: 204/530, loss: 0.005806716158986092 2023-01-22 19:53:23.662141: step: 208/530, loss: 0.0013863842468708754 2023-01-22 19:53:24.749414: step: 212/530, loss: 2.3006439732853323e-05 2023-01-22 19:53:25.837171: step: 216/530, loss: 0.0016012545675039291 2023-01-22 19:53:26.918195: step: 220/530, loss: 0.0009532867697998881 2023-01-22 19:53:28.033197: step: 224/530, loss: 0.0001585626305313781 2023-01-22 19:53:29.148811: step: 228/530, loss: 0.0008216666174121201 2023-01-22 19:53:30.221006: step: 232/530, loss: 0.0181658286601305 2023-01-22 19:53:31.308992: step: 236/530, loss: 0.0004386380023788661 2023-01-22 19:53:32.392845: step: 240/530, loss: 0.0039194850251078606 2023-01-22 19:53:33.477156: step: 244/530, loss: 0.0023481573443859816 2023-01-22 19:53:34.545555: step: 248/530, loss: 0.00583037082105875 2023-01-22 19:53:35.658897: step: 252/530, loss: 0.00710871908813715 2023-01-22 19:53:36.747125: step: 256/530, loss: 0.012729004956781864 2023-01-22 19:53:37.836711: step: 260/530, loss: 0.026176651939749718 2023-01-22 19:53:38.921815: step: 264/530, loss: 4.958019781042822e-05 2023-01-22 19:53:40.008487: step: 268/530, loss: 0.027267776429653168 2023-01-22 19:53:41.137585: step: 272/530, loss: 0.0014167454792186618 2023-01-22 19:53:42.274711: step: 276/530, loss: 0.006288043223321438 2023-01-22 19:53:43.366187: step: 280/530, loss: 0.0007312045199796557 2023-01-22 19:53:44.474652: step: 284/530, loss: 0.00029566502780653536 2023-01-22 19:53:45.573316: step: 288/530, loss: 0.0020559243857860565 2023-01-22 19:53:46.660966: step: 292/530, loss: 0.00029819586779922247 2023-01-22 19:53:47.748995: step: 296/530, loss: 0.0036456305533647537 2023-01-22 19:53:48.806403: step: 300/530, loss: 8.203275683626998e-06 2023-01-22 19:53:49.886304: step: 304/530, loss: 0.0025169288273900747 2023-01-22 19:53:50.993318: step: 308/530, loss: 0.005093428771942854 2023-01-22 19:53:52.081308: step: 312/530, loss: 0.0043222238309681416 2023-01-22 19:53:53.200663: step: 316/530, loss: 0.007977612316608429 2023-01-22 19:53:54.280645: step: 320/530, loss: 0.0004820974136237055 2023-01-22 19:53:55.354229: step: 324/530, loss: 0.002975445007905364 2023-01-22 19:53:56.424965: step: 328/530, loss: 0.002435133093968034 2023-01-22 19:53:57.548021: step: 332/530, loss: 0.0035984329879283905 2023-01-22 19:53:58.650287: step: 336/530, loss: 0.0008130475180223584 2023-01-22 19:53:59.740299: step: 340/530, loss: 0.0005286601954139769 2023-01-22 19:54:00.844255: step: 344/530, loss: 0.03124627098441124 2023-01-22 19:54:01.940582: step: 348/530, loss: 0.004316762555390596 2023-01-22 19:54:03.070206: step: 352/530, loss: 0.002753043081611395 2023-01-22 19:54:04.163332: step: 356/530, loss: 0.004522338975220919 2023-01-22 19:54:05.233708: step: 360/530, loss: 4.239913323544897e-06 2023-01-22 19:54:06.358351: step: 364/530, loss: 0.002400033175945282 2023-01-22 19:54:07.434283: step: 368/530, loss: 0.0008092439966276288 2023-01-22 19:54:08.527729: step: 372/530, loss: 0.006402950268238783 2023-01-22 19:54:09.606242: step: 376/530, loss: 0.0034164160024374723 2023-01-22 19:54:10.709205: step: 380/530, loss: 0.00027832461637444794 2023-01-22 19:54:11.801903: step: 384/530, loss: 0.0016440374311059713 2023-01-22 19:54:12.888039: step: 388/530, loss: 0.0007841635379008949 2023-01-22 19:54:13.975376: step: 392/530, loss: 0.0018719471991062164 2023-01-22 19:54:15.054388: step: 396/530, loss: 0.0010516648180782795 2023-01-22 19:54:16.136548: step: 400/530, loss: 0.00862325169146061 2023-01-22 19:54:17.232581: step: 404/530, loss: 0.006379847414791584 2023-01-22 19:54:18.321699: step: 408/530, loss: 0.0010357204591855407 2023-01-22 19:54:19.418144: step: 412/530, loss: 0.008124977350234985 2023-01-22 19:54:20.537693: step: 416/530, loss: 0.0010897415922954679 2023-01-22 19:54:21.627179: step: 420/530, loss: 0.007163804490119219 2023-01-22 19:54:22.728371: step: 424/530, loss: 0.0009442644077353179 2023-01-22 19:54:23.828625: step: 428/530, loss: 0.0017286279471591115 2023-01-22 19:54:24.900679: step: 432/530, loss: 0.007969128899276257 2023-01-22 19:54:25.975857: step: 436/530, loss: 0.0007324569160118699 2023-01-22 19:54:27.051220: step: 440/530, loss: 0.00875879917293787 2023-01-22 19:54:28.135862: step: 444/530, loss: 0.007760476320981979 2023-01-22 19:54:29.229222: step: 448/530, loss: 0.0014678913867101073 2023-01-22 19:54:30.324068: step: 452/530, loss: 1.8849799744202755e-05 2023-01-22 19:54:31.389921: step: 456/530, loss: 0.01136686559766531 2023-01-22 19:54:32.482849: step: 460/530, loss: 0.0040018693543970585 2023-01-22 19:54:33.587258: step: 464/530, loss: 0.003364595817402005 2023-01-22 19:54:34.661102: step: 468/530, loss: 0.001970995217561722 2023-01-22 19:54:35.733043: step: 472/530, loss: 0.0007398941088467836 2023-01-22 19:54:36.828978: step: 476/530, loss: 0.004584888927638531 2023-01-22 19:54:37.899947: step: 480/530, loss: 0.0002695714065339416 2023-01-22 19:54:38.990298: step: 484/530, loss: 0.0005539420526474714 2023-01-22 19:54:40.073915: step: 488/530, loss: 0.025037281215190887 2023-01-22 19:54:41.156317: step: 492/530, loss: 0.0032129879109561443 2023-01-22 19:54:42.265566: step: 496/530, loss: 0.00039441286935471 2023-01-22 19:54:43.367450: step: 500/530, loss: 0.004720891825854778 2023-01-22 19:54:44.457933: step: 504/530, loss: 0.0011298924218863249 2023-01-22 19:54:45.543444: step: 508/530, loss: 0.00041900365613400936 2023-01-22 19:54:46.645102: step: 512/530, loss: 4.196471854811534e-05 2023-01-22 19:54:47.775108: step: 516/530, loss: 0.013871035538613796 2023-01-22 19:54:48.853310: step: 520/530, loss: 0.00013691623462364078 2023-01-22 19:54:49.954602: step: 524/530, loss: 0.008406477980315685 2023-01-22 19:54:51.040928: step: 528/530, loss: 0.003086388809606433 2023-01-22 19:54:52.121046: step: 532/530, loss: 0.006190589163452387 2023-01-22 19:54:53.197432: step: 536/530, loss: 0.007421389222145081 2023-01-22 19:54:54.292959: step: 540/530, loss: 0.002495412714779377 2023-01-22 19:54:55.390136: step: 544/530, loss: 0.007445516996085644 2023-01-22 19:54:56.489954: step: 548/530, loss: 0.0011785250389948487 2023-01-22 19:54:57.571951: step: 552/530, loss: 0.0008654675912111998 2023-01-22 19:54:58.673391: step: 556/530, loss: 0.00025137377087958157 2023-01-22 19:54:59.744891: step: 560/530, loss: 0.00017511122860014439 2023-01-22 19:55:00.837951: step: 564/530, loss: 5.7159009884344414e-05 2023-01-22 19:55:01.927727: step: 568/530, loss: 0.016914788633584976 2023-01-22 19:55:03.002903: step: 572/530, loss: 0.0009976305300369859 2023-01-22 19:55:04.099262: step: 576/530, loss: 0.0006685921689495444 2023-01-22 19:55:05.198143: step: 580/530, loss: 0.0037347576580941677 2023-01-22 19:55:06.277220: step: 584/530, loss: 0.0013946848921477795 2023-01-22 19:55:07.371983: step: 588/530, loss: 0.003970451653003693 2023-01-22 19:55:08.449697: step: 592/530, loss: 0.0001628063910175115 2023-01-22 19:55:09.538846: step: 596/530, loss: 0.0008422298706136644 2023-01-22 19:55:10.612098: step: 600/530, loss: 0.00029587431345134974 2023-01-22 19:55:11.698802: step: 604/530, loss: 0.0006361801060847938 2023-01-22 19:55:12.800895: step: 608/530, loss: 0.0034885662607848644 2023-01-22 19:55:13.875998: step: 612/530, loss: 0.0003585990925785154 2023-01-22 19:55:14.937152: step: 616/530, loss: 2.5604125767131336e-05 2023-01-22 19:55:16.036875: step: 620/530, loss: 0.0016611746978014708 2023-01-22 19:55:17.117379: step: 624/530, loss: 0.002439285861328244 2023-01-22 19:55:18.201491: step: 628/530, loss: 3.925748387700878e-05 2023-01-22 19:55:19.287573: step: 632/530, loss: 0.0038144635036587715 2023-01-22 19:55:20.388615: step: 636/530, loss: 0.01120692491531372 2023-01-22 19:55:21.452521: step: 640/530, loss: 2.340239916520659e-05 2023-01-22 19:55:22.542004: step: 644/530, loss: 0.0017313751159235835 2023-01-22 19:55:23.635824: step: 648/530, loss: 0.0017275534337386489 2023-01-22 19:55:24.724851: step: 652/530, loss: 2.3065988443704555e-06 2023-01-22 19:55:25.819182: step: 656/530, loss: 0.0029233889654278755 2023-01-22 19:55:26.909229: step: 660/530, loss: 0.0032414367888122797 2023-01-22 19:55:27.994354: step: 664/530, loss: 0.006235004402697086 2023-01-22 19:55:29.085526: step: 668/530, loss: 0.0024263113737106323 2023-01-22 19:55:30.175412: step: 672/530, loss: 0.0033212851267307997 2023-01-22 19:55:31.271390: step: 676/530, loss: 7.125129195628688e-05 2023-01-22 19:55:32.355384: step: 680/530, loss: 0.0008174025570042431 2023-01-22 19:55:33.454776: step: 684/530, loss: 0.006060808897018433 2023-01-22 19:55:34.512854: step: 688/530, loss: 0.0027228742837905884 2023-01-22 19:55:35.600107: step: 692/530, loss: 0.002320940140634775 2023-01-22 19:55:36.681791: step: 696/530, loss: 0.0010438866447657347 2023-01-22 19:55:37.744901: step: 700/530, loss: 0.004476509522646666 2023-01-22 19:55:38.853453: step: 704/530, loss: 0.0029681925661861897 2023-01-22 19:55:39.939711: step: 708/530, loss: 0.00013709232734981924 2023-01-22 19:55:41.020649: step: 712/530, loss: 0.006894290912896395 2023-01-22 19:55:42.117052: step: 716/530, loss: 0.0019235251238569617 2023-01-22 19:55:43.203565: step: 720/530, loss: 0.0003483947948552668 2023-01-22 19:55:44.271524: step: 724/530, loss: 0.0012323943665251136 2023-01-22 19:55:45.371537: step: 728/530, loss: 0.0049696979112923145 2023-01-22 19:55:46.438084: step: 732/530, loss: 0.00313419452868402 2023-01-22 19:55:47.522835: step: 736/530, loss: 0.0002585958573035896 2023-01-22 19:55:48.593803: step: 740/530, loss: 0.002907141810283065 2023-01-22 19:55:49.669519: step: 744/530, loss: 0.0005720037734135985 2023-01-22 19:55:50.768734: step: 748/530, loss: 0.09205687046051025 2023-01-22 19:55:51.871863: step: 752/530, loss: 0.0011814923491328955 2023-01-22 19:55:52.947525: step: 756/530, loss: 0.0026381819043308496 2023-01-22 19:55:54.037336: step: 760/530, loss: 4.626006193575449e-05 2023-01-22 19:55:55.107870: step: 764/530, loss: 0.015169908292591572 2023-01-22 19:55:56.192802: step: 768/530, loss: 0.005272774491459131 2023-01-22 19:55:57.276222: step: 772/530, loss: 0.003081422531977296 2023-01-22 19:55:58.381272: step: 776/530, loss: 0.0010419772006571293 2023-01-22 19:55:59.495807: step: 780/530, loss: 0.0028410006780177355 2023-01-22 19:56:00.606633: step: 784/530, loss: 0.010967368260025978 2023-01-22 19:56:01.670256: step: 788/530, loss: 0.008490442298352718 2023-01-22 19:56:02.749347: step: 792/530, loss: 0.004188038408756256 2023-01-22 19:56:03.851745: step: 796/530, loss: 0.00353723275475204 2023-01-22 19:56:04.960442: step: 800/530, loss: 0.008835950866341591 2023-01-22 19:56:06.058780: step: 804/530, loss: 0.014122353866696358 2023-01-22 19:56:07.131330: step: 808/530, loss: 0.0019575064070522785 2023-01-22 19:56:08.225754: step: 812/530, loss: 0.0001283080637222156 2023-01-22 19:56:09.320416: step: 816/530, loss: 0.006627049762755632 2023-01-22 19:56:10.383832: step: 820/530, loss: 0.0010814443230628967 2023-01-22 19:56:11.451299: step: 824/530, loss: 0.0007403788040392101 2023-01-22 19:56:12.551838: step: 828/530, loss: 0.002512782346457243 2023-01-22 19:56:13.682562: step: 832/530, loss: 0.00648350128903985 2023-01-22 19:56:14.798561: step: 836/530, loss: 0.006590052507817745 2023-01-22 19:56:15.888223: step: 840/530, loss: 0.00013365535414777696 2023-01-22 19:56:16.985197: step: 844/530, loss: 0.005512470379471779 2023-01-22 19:56:18.070522: step: 848/530, loss: 0.0005471798358485103 2023-01-22 19:56:19.184940: step: 852/530, loss: 0.006437006406486034 2023-01-22 19:56:20.262029: step: 856/530, loss: 0.0017111505148932338 2023-01-22 19:56:21.334131: step: 860/530, loss: 0.0020091054029762745 2023-01-22 19:56:22.418677: step: 864/530, loss: 0.0004005547962151468 2023-01-22 19:56:23.501195: step: 868/530, loss: 0.002750362968072295 2023-01-22 19:56:24.585983: step: 872/530, loss: 0.005676696542650461 2023-01-22 19:56:25.685440: step: 876/530, loss: 0.0051183272153139114 2023-01-22 19:56:26.763012: step: 880/530, loss: 0.0007667641621083021 2023-01-22 19:56:27.839075: step: 884/530, loss: 0.0025634237099438906 2023-01-22 19:56:28.902951: step: 888/530, loss: 0.0021997729782015085 2023-01-22 19:56:30.008834: step: 892/530, loss: 0.00013588348519988358 2023-01-22 19:56:31.096503: step: 896/530, loss: 0.01640518195927143 2023-01-22 19:56:32.177822: step: 900/530, loss: 0.0008989162743091583 2023-01-22 19:56:33.275836: step: 904/530, loss: 0.001824555336497724 2023-01-22 19:56:34.358905: step: 908/530, loss: 0.0010768282227218151 2023-01-22 19:56:35.454790: step: 912/530, loss: 0.004957268945872784 2023-01-22 19:56:36.540935: step: 916/530, loss: 0.00736016733571887 2023-01-22 19:56:37.651683: step: 920/530, loss: 0.004380638711154461 2023-01-22 19:56:38.725597: step: 924/530, loss: 0.002497141482308507 2023-01-22 19:56:39.794027: step: 928/530, loss: 0.001268291613087058 2023-01-22 19:56:40.883739: step: 932/530, loss: 0.0005254681454971433 2023-01-22 19:56:42.013637: step: 936/530, loss: 0.002369712106883526 2023-01-22 19:56:43.102609: step: 940/530, loss: 0.0008978047408163548 2023-01-22 19:56:44.193697: step: 944/530, loss: 0.04146760702133179 2023-01-22 19:56:45.259446: step: 948/530, loss: 0.0008567434852011502 2023-01-22 19:56:46.347725: step: 952/530, loss: 0.00290684518404305 2023-01-22 19:56:47.415040: step: 956/530, loss: 0.00016746077744755894 2023-01-22 19:56:48.492787: step: 960/530, loss: 0.0019771752413362265 2023-01-22 19:56:49.586804: step: 964/530, loss: 0.0019547496922314167 2023-01-22 19:56:50.690446: step: 968/530, loss: 0.006751535460352898 2023-01-22 19:56:51.780559: step: 972/530, loss: 2.4312272216775455e-05 2023-01-22 19:56:52.862709: step: 976/530, loss: 0.004235660657286644 2023-01-22 19:56:53.951177: step: 980/530, loss: 0.011990902945399284 2023-01-22 19:56:55.064513: step: 984/530, loss: 0.001053488813340664 2023-01-22 19:56:56.175722: step: 988/530, loss: 0.0004209255857858807 2023-01-22 19:56:57.262050: step: 992/530, loss: 5.6086522818077356e-05 2023-01-22 19:56:58.344845: step: 996/530, loss: 0.0005520488484762609 2023-01-22 19:56:59.425911: step: 1000/530, loss: 0.00023184662859421223 2023-01-22 19:57:00.513381: step: 1004/530, loss: 2.11595477139781e-07 2023-01-22 19:57:01.611812: step: 1008/530, loss: 0.013235863298177719 2023-01-22 19:57:02.700183: step: 1012/530, loss: 0.010187349282205105 2023-01-22 19:57:03.787674: step: 1016/530, loss: 0.005687339697033167 2023-01-22 19:57:04.876633: step: 1020/530, loss: 0.0017560739070177078 2023-01-22 19:57:05.965653: step: 1024/530, loss: 0.0026939495000988245 2023-01-22 19:57:07.084232: step: 1028/530, loss: 0.007238706108182669 2023-01-22 19:57:08.162569: step: 1032/530, loss: 0.00013601387036032975 2023-01-22 19:57:09.244138: step: 1036/530, loss: 0.00045989060890860856 2023-01-22 19:57:10.328542: step: 1040/530, loss: 0.0032810233533382416 2023-01-22 19:57:11.413182: step: 1044/530, loss: 0.0004015865852124989 2023-01-22 19:57:12.551775: step: 1048/530, loss: 0.013448178768157959 2023-01-22 19:57:13.626933: step: 1052/530, loss: 0.003856315743178129 2023-01-22 19:57:14.780382: step: 1056/530, loss: 0.0005450118915177882 2023-01-22 19:57:15.847667: step: 1060/530, loss: 0.0 2023-01-22 19:57:16.934859: step: 1064/530, loss: 0.0008792424923740327 2023-01-22 19:57:18.028637: step: 1068/530, loss: 0.00823802500963211 2023-01-22 19:57:19.113211: step: 1072/530, loss: 2.6319603421143256e-06 2023-01-22 19:57:20.180242: step: 1076/530, loss: 0.0008064648136496544 2023-01-22 19:57:21.287682: step: 1080/530, loss: 0.006718065589666367 2023-01-22 19:57:22.389075: step: 1084/530, loss: 0.00017420953372493386 2023-01-22 19:57:23.500915: step: 1088/530, loss: 0.002185078337788582 2023-01-22 19:57:24.595350: step: 1092/530, loss: 0.00019640305254142731 2023-01-22 19:57:25.679809: step: 1096/530, loss: 0.006831278093159199 2023-01-22 19:57:26.755296: step: 1100/530, loss: 4.614041972672567e-05 2023-01-22 19:57:27.854539: step: 1104/530, loss: 0.0032910217996686697 2023-01-22 19:57:28.933586: step: 1108/530, loss: 0.0009668187703937292 2023-01-22 19:57:30.018700: step: 1112/530, loss: 0.0004408480308484286 2023-01-22 19:57:31.081115: step: 1116/530, loss: 0.0020132348872721195 2023-01-22 19:57:32.151304: step: 1120/530, loss: 0.005592492874711752 2023-01-22 19:57:33.236016: step: 1124/530, loss: 0.0005681593902409077 2023-01-22 19:57:34.313187: step: 1128/530, loss: 0.03897804021835327 2023-01-22 19:57:35.395114: step: 1132/530, loss: 0.014552135951817036 2023-01-22 19:57:36.489579: step: 1136/530, loss: 0.007389168720692396 2023-01-22 19:57:37.597881: step: 1140/530, loss: 0.0010538259521126747 2023-01-22 19:57:38.728784: step: 1144/530, loss: 0.0072760749608278275 2023-01-22 19:57:39.810791: step: 1148/530, loss: 0.001881799311377108 2023-01-22 19:57:40.882891: step: 1152/530, loss: 0.0050290850922465324 2023-01-22 19:57:41.977484: step: 1156/530, loss: 0.009101685136556625 2023-01-22 19:57:43.051954: step: 1160/530, loss: 0.0004510745930019766 2023-01-22 19:57:44.137996: step: 1164/530, loss: 0.0022820280864834785 2023-01-22 19:57:45.229949: step: 1168/530, loss: 0.0004817323060706258 2023-01-22 19:57:46.320522: step: 1172/530, loss: 0.017603395506739616 2023-01-22 19:57:47.391166: step: 1176/530, loss: 0.0006317555671557784 2023-01-22 19:57:48.472219: step: 1180/530, loss: 0.0017889713635668159 2023-01-22 19:57:49.558081: step: 1184/530, loss: 0.010875473730266094 2023-01-22 19:57:50.656502: step: 1188/530, loss: 0.004709660075604916 2023-01-22 19:57:51.733116: step: 1192/530, loss: 0.0010572028113529086 2023-01-22 19:57:52.794539: step: 1196/530, loss: 0.0007839778554625809 2023-01-22 19:57:53.889074: step: 1200/530, loss: 0.004494942259043455 2023-01-22 19:57:54.970724: step: 1204/530, loss: 0.0024047312326729298 2023-01-22 19:57:56.057128: step: 1208/530, loss: 0.0023907735012471676 2023-01-22 19:57:57.142361: step: 1212/530, loss: 5.270205747365253e-06 2023-01-22 19:57:58.264000: step: 1216/530, loss: 0.003890441497787833 2023-01-22 19:57:59.351977: step: 1220/530, loss: 0.001387719064950943 2023-01-22 19:58:00.439634: step: 1224/530, loss: 0.0012261300580576062 2023-01-22 19:58:01.529880: step: 1228/530, loss: 0.009833861142396927 2023-01-22 19:58:02.628565: step: 1232/530, loss: 0.010457347147166729 2023-01-22 19:58:03.726458: step: 1236/530, loss: 0.0009336344082839787 2023-01-22 19:58:04.788397: step: 1240/530, loss: 0.003212392795830965 2023-01-22 19:58:05.884500: step: 1244/530, loss: 0.0008669504313729703 2023-01-22 19:58:06.975416: step: 1248/530, loss: 0.00018693390302360058 2023-01-22 19:58:08.051513: step: 1252/530, loss: 0.0009722743998281658 2023-01-22 19:58:09.170387: step: 1256/530, loss: 0.006682408507913351 2023-01-22 19:58:10.254619: step: 1260/530, loss: 0.004756182432174683 2023-01-22 19:58:11.329454: step: 1264/530, loss: 0.0004418453900143504 2023-01-22 19:58:12.420862: step: 1268/530, loss: 0.012299046851694584 2023-01-22 19:58:13.536293: step: 1272/530, loss: 0.0004543860559351742 2023-01-22 19:58:14.628716: step: 1276/530, loss: 0.004451368935406208 2023-01-22 19:58:15.698817: step: 1280/530, loss: 0.0016371669480577111 2023-01-22 19:58:16.798016: step: 1284/530, loss: 0.001994268735870719 2023-01-22 19:58:17.867027: step: 1288/530, loss: 0.0020643984898924828 2023-01-22 19:58:18.927503: step: 1292/530, loss: 0.0007742835441604257 2023-01-22 19:58:20.000666: step: 1296/530, loss: 0.00020217744167894125 2023-01-22 19:58:21.085832: step: 1300/530, loss: 0.001714938087388873 2023-01-22 19:58:22.156273: step: 1304/530, loss: 0.00015804576105438173 2023-01-22 19:58:23.232600: step: 1308/530, loss: 3.625944009399973e-05 2023-01-22 19:58:24.311377: step: 1312/530, loss: 0.009256994351744652 2023-01-22 19:58:25.377898: step: 1316/530, loss: 6.166958337416872e-05 2023-01-22 19:58:26.450510: step: 1320/530, loss: 0.00343429041095078 2023-01-22 19:58:27.551451: step: 1324/530, loss: 0.00027316107298247516 2023-01-22 19:58:28.653584: step: 1328/530, loss: 0.0020564028527587652 2023-01-22 19:58:29.737992: step: 1332/530, loss: 0.004720047581940889 2023-01-22 19:58:30.818321: step: 1336/530, loss: 8.517401874996722e-05 2023-01-22 19:58:31.902011: step: 1340/530, loss: 0.0013121734373271465 2023-01-22 19:58:33.025865: step: 1344/530, loss: 0.005484965164214373 2023-01-22 19:58:34.102178: step: 1348/530, loss: 0.00012013780360575765 2023-01-22 19:58:35.217570: step: 1352/530, loss: 0.023909686133265495 2023-01-22 19:58:36.280750: step: 1356/530, loss: 0.0004580010718200356 2023-01-22 19:58:37.373491: step: 1360/530, loss: 8.234806045948062e-06 2023-01-22 19:58:38.481435: step: 1364/530, loss: 0.001918577472679317 2023-01-22 19:58:39.574286: step: 1368/530, loss: 0.003393137827515602 2023-01-22 19:58:40.633958: step: 1372/530, loss: 0.00019939703634008765 2023-01-22 19:58:41.743142: step: 1376/530, loss: 0.00010725236643338576 2023-01-22 19:58:42.829467: step: 1380/530, loss: 0.00024035417300183326 2023-01-22 19:58:43.904510: step: 1384/530, loss: 0.028011364862322807 2023-01-22 19:58:45.003975: step: 1388/530, loss: 0.0021849924232810736 2023-01-22 19:58:46.083466: step: 1392/530, loss: 0.0009893151000142097 2023-01-22 19:58:47.164829: step: 1396/530, loss: 0.002132462104782462 2023-01-22 19:58:48.247005: step: 1400/530, loss: 7.176028884714469e-05 2023-01-22 19:58:49.323158: step: 1404/530, loss: 0.022018464282155037 2023-01-22 19:58:50.404317: step: 1408/530, loss: 0.007787796203047037 2023-01-22 19:58:51.492186: step: 1412/530, loss: 0.002511626807972789 2023-01-22 19:58:52.587417: step: 1416/530, loss: 0.009674613364040852 2023-01-22 19:58:53.671485: step: 1420/530, loss: 2.9385002562776208e-05 2023-01-22 19:58:54.769995: step: 1424/530, loss: 0.0014973906800150871 2023-01-22 19:58:55.848128: step: 1428/530, loss: 0.07004883885383606 2023-01-22 19:58:56.941083: step: 1432/530, loss: 1.74994274857454e-05 2023-01-22 19:58:58.024853: step: 1436/530, loss: 0.0010433431016281247 2023-01-22 19:58:59.095030: step: 1440/530, loss: 0.0004845707444474101 2023-01-22 19:59:00.163580: step: 1444/530, loss: 0.0019190305611118674 2023-01-22 19:59:01.270242: step: 1448/530, loss: 0.003605431178584695 2023-01-22 19:59:02.365003: step: 1452/530, loss: 0.0008017189684323967 2023-01-22 19:59:03.454645: step: 1456/530, loss: 0.004502593539655209 2023-01-22 19:59:04.534414: step: 1460/530, loss: 0.00550076412037015 2023-01-22 19:59:05.616010: step: 1464/530, loss: 0.0018752755131572485 2023-01-22 19:59:06.729718: step: 1468/530, loss: 0.005419633816927671 2023-01-22 19:59:07.795158: step: 1472/530, loss: 0.0027900550048798323 2023-01-22 19:59:08.882161: step: 1476/530, loss: 0.005146119277924299 2023-01-22 19:59:09.972143: step: 1480/530, loss: 0.00032300723250955343 2023-01-22 19:59:11.066184: step: 1484/530, loss: 0.0007106717675924301 2023-01-22 19:59:12.133702: step: 1488/530, loss: 5.9772269196400885e-06 2023-01-22 19:59:13.210063: step: 1492/530, loss: 0.005116772372275591 2023-01-22 19:59:14.331945: step: 1496/530, loss: 0.006594047416001558 2023-01-22 19:59:15.408387: step: 1500/530, loss: 0.0037953134160488844 2023-01-22 19:59:16.500944: step: 1504/530, loss: 0.012371010147035122 2023-01-22 19:59:17.605811: step: 1508/530, loss: 0.004237303975969553 2023-01-22 19:59:18.709167: step: 1512/530, loss: 2.643659354362171e-05 2023-01-22 19:59:19.806540: step: 1516/530, loss: 0.015276732854545116 2023-01-22 19:59:20.898617: step: 1520/530, loss: 0.0010161424288526177 2023-01-22 19:59:21.976148: step: 1524/530, loss: 1.3737771041633096e-05 2023-01-22 19:59:23.053740: step: 1528/530, loss: 0.001201915554702282 2023-01-22 19:59:24.140811: step: 1532/530, loss: 0.025990746915340424 2023-01-22 19:59:25.236966: step: 1536/530, loss: 0.001058524358086288 2023-01-22 19:59:26.315003: step: 1540/530, loss: 0.0003789604816120118 2023-01-22 19:59:27.408229: step: 1544/530, loss: 0.0069553544744849205 2023-01-22 19:59:28.485311: step: 1548/530, loss: 0.00045877540833316743 2023-01-22 19:59:29.567624: step: 1552/530, loss: 0.0001989740558201447 2023-01-22 19:59:30.651560: step: 1556/530, loss: 0.0026985194999724627 2023-01-22 19:59:31.739844: step: 1560/530, loss: 0.0009219951462000608 2023-01-22 19:59:32.810497: step: 1564/530, loss: 0.0033113141544163227 2023-01-22 19:59:33.901401: step: 1568/530, loss: 0.0035611242055892944 2023-01-22 19:59:35.030530: step: 1572/530, loss: 0.004538318142294884 2023-01-22 19:59:36.099134: step: 1576/530, loss: 0.004159430041909218 2023-01-22 19:59:37.201598: step: 1580/530, loss: 0.0006233225576579571 2023-01-22 19:59:38.302565: step: 1584/530, loss: 0.0005770657444372773 2023-01-22 19:59:39.386218: step: 1588/530, loss: 0.0011998669942840934 2023-01-22 19:59:40.476254: step: 1592/530, loss: 0.006901716813445091 2023-01-22 19:59:41.570967: step: 1596/530, loss: 0.02905910648405552 2023-01-22 19:59:42.656669: step: 1600/530, loss: 0.0024881402496248484 2023-01-22 19:59:43.754881: step: 1604/530, loss: 0.003927901852875948 2023-01-22 19:59:44.821582: step: 1608/530, loss: 0.0007349054212681949 2023-01-22 19:59:45.914250: step: 1612/530, loss: 0.0011800610227510333 2023-01-22 19:59:47.012389: step: 1616/530, loss: 0.02105814591050148 2023-01-22 19:59:48.075297: step: 1620/530, loss: 0.0015395227819681168 2023-01-22 19:59:49.180101: step: 1624/530, loss: 0.010922984220087528 2023-01-22 19:59:50.258105: step: 1628/530, loss: 0.008248801343142986 2023-01-22 19:59:51.360561: step: 1632/530, loss: 0.01618781127035618 2023-01-22 19:59:52.432539: step: 1636/530, loss: 0.02958204410970211 2023-01-22 19:59:53.528772: step: 1640/530, loss: 4.399966564960778e-05 2023-01-22 19:59:54.598973: step: 1644/530, loss: 0.001968149794265628 2023-01-22 19:59:55.698337: step: 1648/530, loss: 0.0005820642109028995 2023-01-22 19:59:56.756185: step: 1652/530, loss: 0.005752319935709238 2023-01-22 19:59:57.839195: step: 1656/530, loss: 0.0050523472018539906 2023-01-22 19:59:58.938931: step: 1660/530, loss: 0.001452722353860736 2023-01-22 20:00:00.018553: step: 1664/530, loss: 0.005445309914648533 2023-01-22 20:00:01.098419: step: 1668/530, loss: 1.1548379141856913e-08 2023-01-22 20:00:02.184012: step: 1672/530, loss: 0.00011109039769507945 2023-01-22 20:00:03.282694: step: 1676/530, loss: 0.0018030399223789573 2023-01-22 20:00:04.363235: step: 1680/530, loss: 0.005194325931370258 2023-01-22 20:00:05.476987: step: 1684/530, loss: 0.00385474250651896 2023-01-22 20:00:06.567723: step: 1688/530, loss: 0.007741323672235012 2023-01-22 20:00:07.663328: step: 1692/530, loss: 0.01495644822716713 2023-01-22 20:00:08.773890: step: 1696/530, loss: 0.01685008406639099 2023-01-22 20:00:09.862293: step: 1700/530, loss: 0.0055544120259583 2023-01-22 20:00:10.980402: step: 1704/530, loss: 0.010248808190226555 2023-01-22 20:00:12.079575: step: 1708/530, loss: 0.011854437179863453 2023-01-22 20:00:13.166159: step: 1712/530, loss: 0.03471222519874573 2023-01-22 20:00:14.223764: step: 1716/530, loss: 0.0008398064528591931 2023-01-22 20:00:15.297273: step: 1720/530, loss: 0.0001746997149894014 2023-01-22 20:00:16.400573: step: 1724/530, loss: 0.0005755234742537141 2023-01-22 20:00:17.497397: step: 1728/530, loss: 0.0034256817307323217 2023-01-22 20:00:18.586440: step: 1732/530, loss: 0.021520541980862617 2023-01-22 20:00:19.683732: step: 1736/530, loss: 0.007916544564068317 2023-01-22 20:00:20.793539: step: 1740/530, loss: 0.0022996366024017334 2023-01-22 20:00:21.870429: step: 1744/530, loss: 0.0005643433541990817 2023-01-22 20:00:22.953418: step: 1748/530, loss: 0.0034838926512748003 2023-01-22 20:00:24.054696: step: 1752/530, loss: 0.03036956675350666 2023-01-22 20:00:25.132683: step: 1756/530, loss: 0.0007215047953650355 2023-01-22 20:00:26.205544: step: 1760/530, loss: 0.0019453135319054127 2023-01-22 20:00:27.281495: step: 1764/530, loss: 0.001330358674749732 2023-01-22 20:00:28.355654: step: 1768/530, loss: 0.007806940004229546 2023-01-22 20:00:29.447355: step: 1772/530, loss: 0.003456848906353116 2023-01-22 20:00:30.514240: step: 1776/530, loss: 0.005057643633335829 2023-01-22 20:00:31.602669: step: 1780/530, loss: 0.011384502053260803 2023-01-22 20:00:32.697938: step: 1784/530, loss: 0.011234925128519535 2023-01-22 20:00:33.763179: step: 1788/530, loss: 0.0047269645147025585 2023-01-22 20:00:34.863442: step: 1792/530, loss: 0.0001232069917023182 2023-01-22 20:00:35.950874: step: 1796/530, loss: 0.0016339218709617853 2023-01-22 20:00:37.056723: step: 1800/530, loss: 0.0014323396608233452 2023-01-22 20:00:38.149827: step: 1804/530, loss: 0.001967453630641103 2023-01-22 20:00:39.251886: step: 1808/530, loss: 0.009709027595818043 2023-01-22 20:00:40.321250: step: 1812/530, loss: 0.0005732905119657516 2023-01-22 20:00:41.423668: step: 1816/530, loss: 0.004624378867447376 2023-01-22 20:00:42.543288: step: 1820/530, loss: 0.0017234840197488666 2023-01-22 20:00:43.629222: step: 1824/530, loss: 6.280279194470495e-05 2023-01-22 20:00:44.726230: step: 1828/530, loss: 0.00363940536044538 2023-01-22 20:00:45.793014: step: 1832/530, loss: 0.0027547746431082487 2023-01-22 20:00:46.876991: step: 1836/530, loss: 0.006162369158118963 2023-01-22 20:00:47.967818: step: 1840/530, loss: 0.00149850535672158 2023-01-22 20:00:49.073333: step: 1844/530, loss: 0.004718123469501734 2023-01-22 20:00:50.158439: step: 1848/530, loss: 0.003149504540488124 2023-01-22 20:00:51.229046: step: 1852/530, loss: 0.00022196733334567398 2023-01-22 20:00:52.309199: step: 1856/530, loss: 0.006669645197689533 2023-01-22 20:00:53.440576: step: 1860/530, loss: 0.004956276621669531 2023-01-22 20:00:54.519629: step: 1864/530, loss: 0.002093520015478134 2023-01-22 20:00:55.604252: step: 1868/530, loss: 0.0007709778728894889 2023-01-22 20:00:56.696376: step: 1872/530, loss: 0.00627837935462594 2023-01-22 20:00:57.796577: step: 1876/530, loss: 0.005650392267853022 2023-01-22 20:00:58.895139: step: 1880/530, loss: 0.010585335083305836 2023-01-22 20:00:59.952530: step: 1884/530, loss: 6.372926691255998e-06 2023-01-22 20:01:01.047285: step: 1888/530, loss: 4.653074938687496e-05 2023-01-22 20:01:02.127386: step: 1892/530, loss: 0.010358398780226707 2023-01-22 20:01:03.216130: step: 1896/530, loss: 0.0019476724555715919 2023-01-22 20:01:04.307170: step: 1900/530, loss: 0.002111525274813175 2023-01-22 20:01:05.396573: step: 1904/530, loss: 0.001851673237979412 2023-01-22 20:01:06.482296: step: 1908/530, loss: 0.003778306767344475 2023-01-22 20:01:07.546520: step: 1912/530, loss: 0.0008608328062109649 2023-01-22 20:01:08.635387: step: 1916/530, loss: 0.0008358883787877858 2023-01-22 20:01:09.723972: step: 1920/530, loss: 0.002286526607349515 2023-01-22 20:01:10.787851: step: 1924/530, loss: 0.0006502037867903709 2023-01-22 20:01:11.874422: step: 1928/530, loss: 0.0028706425800919533 2023-01-22 20:01:12.951243: step: 1932/530, loss: 0.0030464837327599525 2023-01-22 20:01:14.070845: step: 1936/530, loss: 0.009233983233571053 2023-01-22 20:01:15.166479: step: 1940/530, loss: 0.024344248697161674 2023-01-22 20:01:16.265148: step: 1944/530, loss: 0.00017233123071491718 2023-01-22 20:01:17.314627: step: 1948/530, loss: 8.85099871084094e-05 2023-01-22 20:01:18.409581: step: 1952/530, loss: 0.015052702277898788 2023-01-22 20:01:19.507335: step: 1956/530, loss: 0.002015867503359914 2023-01-22 20:01:20.603134: step: 1960/530, loss: 0.009345891885459423 2023-01-22 20:01:21.689798: step: 1964/530, loss: 1.1462586371635552e-05 2023-01-22 20:01:22.775011: step: 1968/530, loss: 0.0023738304153084755 2023-01-22 20:01:23.849330: step: 1972/530, loss: 0.006011987570673227 2023-01-22 20:01:24.935939: step: 1976/530, loss: 0.0035228943452239037 2023-01-22 20:01:26.044366: step: 1980/530, loss: 0.006211179308593273 2023-01-22 20:01:27.117661: step: 1984/530, loss: 0.0008161471923813224 2023-01-22 20:01:28.182996: step: 1988/530, loss: 0.004560565575957298 2023-01-22 20:01:29.253549: step: 1992/530, loss: 0.000625628512352705 2023-01-22 20:01:30.344493: step: 1996/530, loss: 0.00011095472291344777 2023-01-22 20:01:31.424360: step: 2000/530, loss: 0.001555387512780726 2023-01-22 20:01:32.506425: step: 2004/530, loss: 0.00889945961534977 2023-01-22 20:01:33.584171: step: 2008/530, loss: 0.0014049547025933862 2023-01-22 20:01:34.669616: step: 2012/530, loss: 0.00033359084045514464 2023-01-22 20:01:35.769928: step: 2016/530, loss: 0.002479431452229619 2023-01-22 20:01:36.841278: step: 2020/530, loss: 0.00129645224660635 2023-01-22 20:01:37.934629: step: 2024/530, loss: 0.01016774121671915 2023-01-22 20:01:39.026003: step: 2028/530, loss: 0.004030562937259674 2023-01-22 20:01:40.119174: step: 2032/530, loss: 0.0014632843667641282 2023-01-22 20:01:41.190574: step: 2036/530, loss: 0.00033714438905008137 2023-01-22 20:01:42.298054: step: 2040/530, loss: 0.009767036885023117 2023-01-22 20:01:43.411280: step: 2044/530, loss: 0.012330167926847935 2023-01-22 20:01:44.499774: step: 2048/530, loss: 0.007674699183553457 2023-01-22 20:01:45.575566: step: 2052/530, loss: 0.005123947747051716 2023-01-22 20:01:46.648553: step: 2056/530, loss: 0.0001182538690045476 2023-01-22 20:01:47.721921: step: 2060/530, loss: 0.0014430314768105745 2023-01-22 20:01:48.810096: step: 2064/530, loss: 0.00013447781384456903 2023-01-22 20:01:49.902776: step: 2068/530, loss: 0.0013207438169047236 2023-01-22 20:01:50.991260: step: 2072/530, loss: 0.0016460088081657887 2023-01-22 20:01:52.053865: step: 2076/530, loss: 0.0016261229757219553 2023-01-22 20:01:53.134209: step: 2080/530, loss: 0.0006282105459831655 2023-01-22 20:01:54.240456: step: 2084/530, loss: 0.0004141568497288972 2023-01-22 20:01:55.328078: step: 2088/530, loss: 0.0039739953354001045 2023-01-22 20:01:56.415537: step: 2092/530, loss: 0.002581220120191574 2023-01-22 20:01:57.509688: step: 2096/530, loss: 0.006727252621203661 2023-01-22 20:01:58.604696: step: 2100/530, loss: 0.0035481418017297983 2023-01-22 20:01:59.675619: step: 2104/530, loss: 0.0016609999584034085 2023-01-22 20:02:00.779803: step: 2108/530, loss: 0.006071708630770445 2023-01-22 20:02:01.861555: step: 2112/530, loss: 0.00026346012600697577 2023-01-22 20:02:02.944879: step: 2116/530, loss: 8.357186743523926e-05 2023-01-22 20:02:04.017980: step: 2120/530, loss: 0.002504725707694888 ================================================== Loss: 0.004 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.33669626941685765, 'r': 0.3584186093792356, 'f1': 0.3472180278361345}, 'combined': 0.25584486261609907, 'stategy': 1, 'epoch': 14} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3370200415750063, 'r': 0.29001724645920424, 'f1': 0.3117569762575816}, 'combined': 0.19361749051786648, 'stategy': 1, 'epoch': 14} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3481342977158401, 'r': 0.3474737013254875, 'f1': 0.34780368584716415}, 'combined': 0.2562764000979104, 'stategy': 1, 'epoch': 14} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3188879784397555, 'r': 0.2873461408097105, 'f1': 0.3022965123398723}, 'combined': 0.18774204450581544, 'stategy': 1, 'epoch': 14} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3418569266734086, 'r': 0.3327753384885363, 'f1': 0.3372550065066512}, 'combined': 0.24850368900490086, 'stategy': 1, 'epoch': 14} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.346319521344185, 'r': 0.2970895005410629, 'f1': 0.3198211095091357}, 'combined': 0.19862574169514746, 'stategy': 1, 'epoch': 14} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3138888888888889, 'r': 0.4035714285714286, 'f1': 0.35312499999999997}, 'combined': 0.23541666666666664, 'stategy': 1, 'epoch': 14} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3870967741935484, 'r': 0.5217391304347826, 'f1': 0.4444444444444444}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 14} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 14} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 15 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 20:04:34.956542: step: 4/530, loss: 0.0005603269091807306 2023-01-22 20:04:36.041748: step: 8/530, loss: 0.0033836020156741142 2023-01-22 20:04:37.096667: step: 12/530, loss: 2.748173756117467e-05 2023-01-22 20:04:38.193845: step: 16/530, loss: 0.02031107433140278 2023-01-22 20:04:39.290560: step: 20/530, loss: 0.0024168984964489937 2023-01-22 20:04:40.362768: step: 24/530, loss: 0.0001324393815593794 2023-01-22 20:04:41.460626: step: 28/530, loss: 0.000845213420689106 2023-01-22 20:04:42.555139: step: 32/530, loss: 0.0005316843162290752 2023-01-22 20:04:43.620631: step: 36/530, loss: 1.4628681128669996e-05 2023-01-22 20:04:44.704879: step: 40/530, loss: 0.015268100425601006 2023-01-22 20:04:45.783984: step: 44/530, loss: 0.005782716907560825 2023-01-22 20:04:46.885141: step: 48/530, loss: 0.008466568775475025 2023-01-22 20:04:47.994633: step: 52/530, loss: 0.0008337254985235631 2023-01-22 20:04:49.104257: step: 56/530, loss: 0.010610067285597324 2023-01-22 20:04:50.188516: step: 60/530, loss: 0.002079881029203534 2023-01-22 20:04:51.273114: step: 64/530, loss: 0.0009238152415491641 2023-01-22 20:04:52.370891: step: 68/530, loss: 0.000500765978358686 2023-01-22 20:04:53.468006: step: 72/530, loss: 0.03360120952129364 2023-01-22 20:04:54.572167: step: 76/530, loss: 0.0009136134758591652 2023-01-22 20:04:55.663590: step: 80/530, loss: 0.003076310269534588 2023-01-22 20:04:56.741256: step: 84/530, loss: 0.001181140192784369 2023-01-22 20:04:57.816346: step: 88/530, loss: 0.00034104418591596186 2023-01-22 20:04:58.900081: step: 92/530, loss: 0.0012450501089915633 2023-01-22 20:04:59.983130: step: 96/530, loss: 0.0034340769052505493 2023-01-22 20:05:01.092427: step: 100/530, loss: 0.0008036938961595297 2023-01-22 20:05:02.169488: step: 104/530, loss: 7.929922139737755e-05 2023-01-22 20:05:03.259172: step: 108/530, loss: 0.0035339402966201305 2023-01-22 20:05:04.350640: step: 112/530, loss: 0.00012609059922397137 2023-01-22 20:05:05.435006: step: 116/530, loss: 0.0012745129643008113 2023-01-22 20:05:06.554972: step: 120/530, loss: 0.004408474545925856 2023-01-22 20:05:07.665245: step: 124/530, loss: 0.0007517550839111209 2023-01-22 20:05:08.757304: step: 128/530, loss: 0.00026374630397185683 2023-01-22 20:05:09.841891: step: 132/530, loss: 2.5531522624078207e-05 2023-01-22 20:05:10.937935: step: 136/530, loss: 0.001046914840117097 2023-01-22 20:05:12.040343: step: 140/530, loss: 0.003953760955482721 2023-01-22 20:05:13.123165: step: 144/530, loss: 0.0016117108752951026 2023-01-22 20:05:14.226201: step: 148/530, loss: 0.0038673526141792536 2023-01-22 20:05:15.312735: step: 152/530, loss: 0.0021993231493979692 2023-01-22 20:05:16.386297: step: 156/530, loss: 0.005202023778110743 2023-01-22 20:05:17.464841: step: 160/530, loss: 0.0026546542067080736 2023-01-22 20:05:18.555531: step: 164/530, loss: 0.012892602942883968 2023-01-22 20:05:19.663465: step: 168/530, loss: 0.0010452303104102612 2023-01-22 20:05:20.736888: step: 172/530, loss: 0.0026824157685041428 2023-01-22 20:05:21.832237: step: 176/530, loss: 0.0015785073628649116 2023-01-22 20:05:22.930984: step: 180/530, loss: 0.0007645704899914563 2023-01-22 20:05:24.018931: step: 184/530, loss: 0.002705469261854887 2023-01-22 20:05:25.096952: step: 188/530, loss: 0.005366666242480278 2023-01-22 20:05:26.175932: step: 192/530, loss: 0.0005622747703455389 2023-01-22 20:05:27.251087: step: 196/530, loss: 5.989646524540149e-06 2023-01-22 20:05:28.349306: step: 200/530, loss: 0.007668128702789545 2023-01-22 20:05:29.431897: step: 204/530, loss: 0.007374717853963375 2023-01-22 20:05:30.508242: step: 208/530, loss: 0.008534826338291168 2023-01-22 20:05:31.600713: step: 212/530, loss: 0.003811290254816413 2023-01-22 20:05:32.684705: step: 216/530, loss: 0.0015131818363443017 2023-01-22 20:05:33.790395: step: 220/530, loss: 0.00036347308196127415 2023-01-22 20:05:34.863701: step: 224/530, loss: 0.0031561492942273617 2023-01-22 20:05:35.936362: step: 228/530, loss: 0.0022700896952301264 2023-01-22 20:05:37.024259: step: 232/530, loss: 0.004300015978515148 2023-01-22 20:05:38.104142: step: 236/530, loss: 0.0002827040443662554 2023-01-22 20:05:39.212713: step: 240/530, loss: 0.0012241177028045058 2023-01-22 20:05:40.332837: step: 244/530, loss: 0.004503392614424229 2023-01-22 20:05:41.407713: step: 248/530, loss: 0.00039703870425000787 2023-01-22 20:05:42.538328: step: 252/530, loss: 0.0085066519677639 2023-01-22 20:05:43.636444: step: 256/530, loss: 0.0036142293829470873 2023-01-22 20:05:44.741180: step: 260/530, loss: 0.006109429989010096 2023-01-22 20:05:45.830031: step: 264/530, loss: 0.0015096550341695547 2023-01-22 20:05:46.933159: step: 268/530, loss: 0.0030760865192860365 2023-01-22 20:05:48.029999: step: 272/530, loss: 0.004289589822292328 2023-01-22 20:05:49.125177: step: 276/530, loss: 0.0021411217749118805 2023-01-22 20:05:50.212648: step: 280/530, loss: 4.426351370057091e-05 2023-01-22 20:05:51.284137: step: 284/530, loss: 9.423431038158014e-05 2023-01-22 20:05:52.347423: step: 288/530, loss: 0.004925564397126436 2023-01-22 20:05:53.438984: step: 292/530, loss: 0.0011611017398536205 2023-01-22 20:05:54.556518: step: 296/530, loss: 0.006216420326381922 2023-01-22 20:05:55.626881: step: 300/530, loss: 0.0058028195053339005 2023-01-22 20:05:56.739823: step: 304/530, loss: 0.00038804401992820203 2023-01-22 20:05:57.813305: step: 308/530, loss: 0.009510464034974575 2023-01-22 20:05:58.881942: step: 312/530, loss: 0.001831777160987258 2023-01-22 20:05:59.949807: step: 316/530, loss: 0.010432722046971321 2023-01-22 20:06:01.031623: step: 320/530, loss: 3.167520117131062e-05 2023-01-22 20:06:02.115224: step: 324/530, loss: 0.023967141285538673 2023-01-22 20:06:03.204022: step: 328/530, loss: 0.0031255523208528757 2023-01-22 20:06:04.328459: step: 332/530, loss: 0.0013823750196024776 2023-01-22 20:06:05.445019: step: 336/530, loss: 0.003276097821071744 2023-01-22 20:06:06.518292: step: 340/530, loss: 0.00030117094866000116 2023-01-22 20:06:07.610425: step: 344/530, loss: 0.004074622876942158 2023-01-22 20:06:08.711901: step: 348/530, loss: 0.00046580296475440264 2023-01-22 20:06:09.785274: step: 352/530, loss: 0.002189417602494359 2023-01-22 20:06:10.873583: step: 356/530, loss: 0.0030694399029016495 2023-01-22 20:06:11.997740: step: 360/530, loss: 0.017475778236985207 2023-01-22 20:06:13.085227: step: 364/530, loss: 0.003079014364629984 2023-01-22 20:06:14.187802: step: 368/530, loss: 0.0061907717026770115 2023-01-22 20:06:15.269867: step: 372/530, loss: 0.0037436443381011486 2023-01-22 20:06:16.363898: step: 376/530, loss: 0.0008974772645160556 2023-01-22 20:06:17.477026: step: 380/530, loss: 3.344173819641583e-05 2023-01-22 20:06:18.570732: step: 384/530, loss: 0.004639403894543648 2023-01-22 20:06:19.668065: step: 388/530, loss: 0.0012414584634825587 2023-01-22 20:06:20.761697: step: 392/530, loss: 0.0062952348962426186 2023-01-22 20:06:21.854766: step: 396/530, loss: 0.0005269868415780365 2023-01-22 20:06:22.928195: step: 400/530, loss: 0.0006903203902766109 2023-01-22 20:06:24.009534: step: 404/530, loss: 0.0017095323419198394 2023-01-22 20:06:25.075016: step: 408/530, loss: 0.009268923662602901 2023-01-22 20:06:26.137571: step: 412/530, loss: 1.6288953702314757e-05 2023-01-22 20:06:27.220350: step: 416/530, loss: 0.01433035172522068 2023-01-22 20:06:28.304126: step: 420/530, loss: 0.001576497801579535 2023-01-22 20:06:29.390952: step: 424/530, loss: 0.004388230852782726 2023-01-22 20:06:30.478359: step: 428/530, loss: 0.0004961317754350603 2023-01-22 20:06:31.560827: step: 432/530, loss: 0.003969933837652206 2023-01-22 20:06:32.635805: step: 436/530, loss: 0.0007683968869969249 2023-01-22 20:06:33.705514: step: 440/530, loss: 0.0010073124431073666 2023-01-22 20:06:34.782724: step: 444/530, loss: 0.0023505499120801687 2023-01-22 20:06:35.844997: step: 448/530, loss: 0.00015716916823294014 2023-01-22 20:06:36.931749: step: 452/530, loss: 0.0032290888484567404 2023-01-22 20:06:38.019416: step: 456/530, loss: 0.000613926153164357 2023-01-22 20:06:39.112490: step: 460/530, loss: 0.01097936648875475 2023-01-22 20:06:40.183241: step: 464/530, loss: 7.576760981464759e-05 2023-01-22 20:06:41.256034: step: 468/530, loss: 0.0012992059346288443 2023-01-22 20:06:42.348657: step: 472/530, loss: 0.004572598729282618 2023-01-22 20:06:43.425976: step: 476/530, loss: 0.0032610297203063965 2023-01-22 20:06:44.515773: step: 480/530, loss: 0.0022114189341664314 2023-01-22 20:06:45.605021: step: 484/530, loss: 0.0020829904824495316 2023-01-22 20:06:46.690200: step: 488/530, loss: 4.587047442328185e-05 2023-01-22 20:06:47.769697: step: 492/530, loss: 0.0026753153651952744 2023-01-22 20:06:48.865420: step: 496/530, loss: 0.0009746643481776118 2023-01-22 20:06:49.953963: step: 500/530, loss: 0.0019232332706451416 2023-01-22 20:06:51.024499: step: 504/530, loss: 0.005039873067289591 2023-01-22 20:06:52.113708: step: 508/530, loss: 0.01322495099157095 2023-01-22 20:06:53.200597: step: 512/530, loss: 0.008688376285135746 2023-01-22 20:06:54.286743: step: 516/530, loss: 0.04017927125096321 2023-01-22 20:06:55.385017: step: 520/530, loss: 0.0006335675716400146 2023-01-22 20:06:56.463177: step: 524/530, loss: 0.003151129698380828 2023-01-22 20:06:57.542023: step: 528/530, loss: 0.0003703125403262675 2023-01-22 20:06:58.626356: step: 532/530, loss: 0.013355312868952751 2023-01-22 20:06:59.733663: step: 536/530, loss: 8.864116534823552e-05 2023-01-22 20:07:00.831195: step: 540/530, loss: 0.0012442035367712379 2023-01-22 20:07:01.909647: step: 544/530, loss: 0.006936206016689539 2023-01-22 20:07:03.008054: step: 548/530, loss: 0.00932455062866211 2023-01-22 20:07:04.096666: step: 552/530, loss: 0.01208194438368082 2023-01-22 20:07:05.176311: step: 556/530, loss: 0.0007088372949510813 2023-01-22 20:07:06.283299: step: 560/530, loss: 0.000727538950741291 2023-01-22 20:07:07.379100: step: 564/530, loss: 0.0003795283264480531 2023-01-22 20:07:08.459167: step: 568/530, loss: 0.0003345249278936535 2023-01-22 20:07:09.536825: step: 572/530, loss: 3.2434752938570455e-05 2023-01-22 20:07:10.633397: step: 576/530, loss: 0.003163258545100689 2023-01-22 20:07:11.719051: step: 580/530, loss: 0.0026887848507612944 2023-01-22 20:07:12.830167: step: 584/530, loss: 0.003371400060132146 2023-01-22 20:07:13.931285: step: 588/530, loss: 5.6341796152992174e-05 2023-01-22 20:07:14.994277: step: 592/530, loss: 0.004009477328509092 2023-01-22 20:07:16.092954: step: 596/530, loss: 0.0024920590221881866 2023-01-22 20:07:17.181924: step: 600/530, loss: 0.00015841968706808984 2023-01-22 20:07:18.263973: step: 604/530, loss: 6.668202701121118e-08 2023-01-22 20:07:19.365334: step: 608/530, loss: 0.009033799171447754 2023-01-22 20:07:20.479870: step: 612/530, loss: 0.010294109582901001 2023-01-22 20:07:21.580738: step: 616/530, loss: 0.005923269782215357 2023-01-22 20:07:22.667255: step: 620/530, loss: 0.0005148897180333734 2023-01-22 20:07:23.751736: step: 624/530, loss: 0.004174213390797377 2023-01-22 20:07:24.818202: step: 628/530, loss: 4.9260168452747166e-05 2023-01-22 20:07:25.894482: step: 632/530, loss: 0.0013204978313297033 2023-01-22 20:07:26.979466: step: 636/530, loss: 0.00033934699604287744 2023-01-22 20:07:28.059532: step: 640/530, loss: 0.01224727276712656 2023-01-22 20:07:29.157973: step: 644/530, loss: 0.00040627815178595483 2023-01-22 20:07:30.272063: step: 648/530, loss: 0.003339530434459448 2023-01-22 20:07:31.382602: step: 652/530, loss: 0.008279840461909771 2023-01-22 20:07:32.460798: step: 656/530, loss: 0.0014663063921034336 2023-01-22 20:07:33.544377: step: 660/530, loss: 0.0018453781958669424 2023-01-22 20:07:34.642036: step: 664/530, loss: 0.004806226585060358 2023-01-22 20:07:35.726992: step: 668/530, loss: 0.008879673667252064 2023-01-22 20:07:36.822527: step: 672/530, loss: 0.0009397105895914137 2023-01-22 20:07:37.903372: step: 676/530, loss: 0.004249256569892168 2023-01-22 20:07:38.986881: step: 680/530, loss: 0.019687814638018608 2023-01-22 20:07:40.079505: step: 684/530, loss: 0.006677149794995785 2023-01-22 20:07:41.155564: step: 688/530, loss: 0.0019105913816019893 2023-01-22 20:07:42.257085: step: 692/530, loss: 0.001259146723896265 2023-01-22 20:07:43.342207: step: 696/530, loss: 4.184913632343523e-05 2023-01-22 20:07:44.432833: step: 700/530, loss: 0.0009217371698468924 2023-01-22 20:07:45.516681: step: 704/530, loss: 0.00031716443481855094 2023-01-22 20:07:46.594706: step: 708/530, loss: 0.012752840295433998 2023-01-22 20:07:47.681669: step: 712/530, loss: 0.005632590968161821 2023-01-22 20:07:48.785405: step: 716/530, loss: 6.445802227972308e-06 2023-01-22 20:07:49.866266: step: 720/530, loss: 0.0025948206894099712 2023-01-22 20:07:50.974405: step: 724/530, loss: 0.002619817154482007 2023-01-22 20:07:52.056495: step: 728/530, loss: 0.0004861385968979448 2023-01-22 20:07:53.149422: step: 732/530, loss: 0.0024453115183860064 2023-01-22 20:07:54.241311: step: 736/530, loss: 0.004731861874461174 2023-01-22 20:07:55.334244: step: 740/530, loss: 0.0013162607792764902 2023-01-22 20:07:56.431412: step: 744/530, loss: 0.000495178101118654 2023-01-22 20:07:57.491079: step: 748/530, loss: 2.0115919596719323e-07 2023-01-22 20:07:58.618324: step: 752/530, loss: 0.0007767449715174735 2023-01-22 20:07:59.720072: step: 756/530, loss: 0.0012465323088690639 2023-01-22 20:08:00.798359: step: 760/530, loss: 0.0005242686602286994 2023-01-22 20:08:01.879014: step: 764/530, loss: 0.0011807344853878021 2023-01-22 20:08:02.992897: step: 768/530, loss: 0.010948910377919674 2023-01-22 20:08:04.083638: step: 772/530, loss: 0.004480754490941763 2023-01-22 20:08:05.137592: step: 776/530, loss: 0.001311618136242032 2023-01-22 20:08:06.213561: step: 780/530, loss: 0.0002680454927030951 2023-01-22 20:08:07.302751: step: 784/530, loss: 0.0008214745903387666 2023-01-22 20:08:08.413420: step: 788/530, loss: 0.00015548574447166175 2023-01-22 20:08:09.521572: step: 792/530, loss: 0.000394105794839561 2023-01-22 20:08:10.616767: step: 796/530, loss: 0.004533532075583935 2023-01-22 20:08:11.707331: step: 800/530, loss: 0.0007221539854072034 2023-01-22 20:08:12.811105: step: 804/530, loss: 0.004022045060992241 2023-01-22 20:08:13.891492: step: 808/530, loss: 0.015345017425715923 2023-01-22 20:08:14.972910: step: 812/530, loss: 0.001496016513556242 2023-01-22 20:08:16.061546: step: 816/530, loss: 0.002786329947412014 2023-01-22 20:08:17.192593: step: 820/530, loss: 0.0059187584556639194 2023-01-22 20:08:18.264185: step: 824/530, loss: 0.0009018850978463888 2023-01-22 20:08:19.369887: step: 828/530, loss: 0.00019411362882237881 2023-01-22 20:08:20.446361: step: 832/530, loss: 0.0045598577708005905 2023-01-22 20:08:21.538168: step: 836/530, loss: 0.005649175029247999 2023-01-22 20:08:22.618496: step: 840/530, loss: 0.0059195104986429214 2023-01-22 20:08:23.690634: step: 844/530, loss: 0.00266664638184011 2023-01-22 20:08:24.785266: step: 848/530, loss: 0.006456125061959028 2023-01-22 20:08:25.858723: step: 852/530, loss: 0.0012606477830559015 2023-01-22 20:08:26.928896: step: 856/530, loss: 9.023839083965868e-05 2023-01-22 20:08:28.030396: step: 860/530, loss: 0.00177907501347363 2023-01-22 20:08:29.107906: step: 864/530, loss: 0.0024248322006314993 2023-01-22 20:08:30.200557: step: 868/530, loss: 0.0034812274388968945 2023-01-22 20:08:31.301859: step: 872/530, loss: 0.005492594558745623 2023-01-22 20:08:32.409669: step: 876/530, loss: 0.003532568458467722 2023-01-22 20:08:33.483721: step: 880/530, loss: 0.00010047259274870157 2023-01-22 20:08:34.572958: step: 884/530, loss: 0.0021263943053781986 2023-01-22 20:08:35.634379: step: 888/530, loss: 0.010426861234009266 2023-01-22 20:08:36.731496: step: 892/530, loss: 0.06476103514432907 2023-01-22 20:08:37.822597: step: 896/530, loss: 0.00402695732191205 2023-01-22 20:08:38.920129: step: 900/530, loss: 0.0034620303194969893 2023-01-22 20:08:40.027318: step: 904/530, loss: 0.0016567535931244493 2023-01-22 20:08:41.095723: step: 908/530, loss: 0.0008701797924004495 2023-01-22 20:08:42.189329: step: 912/530, loss: 0.0005422146059572697 2023-01-22 20:08:43.295041: step: 916/530, loss: 0.009410968981683254 2023-01-22 20:08:44.374779: step: 920/530, loss: 0.00418858602643013 2023-01-22 20:08:45.460239: step: 924/530, loss: 0.00023712597612757236 2023-01-22 20:08:46.549206: step: 928/530, loss: 0.00026911086752079427 2023-01-22 20:08:47.654774: step: 932/530, loss: 0.0010811963584274054 2023-01-22 20:08:48.750195: step: 936/530, loss: 0.005770714487880468 2023-01-22 20:08:49.816461: step: 940/530, loss: 0.0009019781136885285 2023-01-22 20:08:50.902031: step: 944/530, loss: 0.006315905135124922 2023-01-22 20:08:52.013733: step: 948/530, loss: 2.6591626010485925e-05 2023-01-22 20:08:53.104763: step: 952/530, loss: 0.003705458017066121 2023-01-22 20:08:54.203286: step: 956/530, loss: 0.0031867579091340303 2023-01-22 20:08:55.329665: step: 960/530, loss: 0.00012549081293400377 2023-01-22 20:08:56.412024: step: 964/530, loss: 0.00026949579478241503 2023-01-22 20:08:57.494925: step: 968/530, loss: 0.003759004408493638 2023-01-22 20:08:58.577914: step: 972/530, loss: 2.0215552467561793e-06 2023-01-22 20:08:59.644457: step: 976/530, loss: 0.001552699482999742 2023-01-22 20:09:00.742823: step: 980/530, loss: 1.6033138308557682e-05 2023-01-22 20:09:01.804084: step: 984/530, loss: 0.002237774431705475 2023-01-22 20:09:02.862003: step: 988/530, loss: 3.3042865652532782e-06 2023-01-22 20:09:03.958646: step: 992/530, loss: 0.010879520326852798 2023-01-22 20:09:05.031494: step: 996/530, loss: 0.010834017768502235 2023-01-22 20:09:06.109914: step: 1000/530, loss: 0.002442287979647517 2023-01-22 20:09:07.215739: step: 1004/530, loss: 0.011311542242765427 2023-01-22 20:09:08.290302: step: 1008/530, loss: 0.0002734313893597573 2023-01-22 20:09:09.381812: step: 1012/530, loss: 0.0036937897093594074 2023-01-22 20:09:10.453577: step: 1016/530, loss: 0.002512504579499364 2023-01-22 20:09:11.514651: step: 1020/530, loss: 0.0012993746204301715 2023-01-22 20:09:12.641464: step: 1024/530, loss: 0.002023993758484721 2023-01-22 20:09:13.714376: step: 1028/530, loss: 0.005852619186043739 2023-01-22 20:09:14.784138: step: 1032/530, loss: 4.5952849177410826e-05 2023-01-22 20:09:15.875282: step: 1036/530, loss: 0.0045895446091890335 2023-01-22 20:09:16.949746: step: 1040/530, loss: 0.0009423495503142476 2023-01-22 20:09:18.022475: step: 1044/530, loss: 0.0021403960417956114 2023-01-22 20:09:19.111262: step: 1048/530, loss: 0.005640462040901184 2023-01-22 20:09:20.204132: step: 1052/530, loss: 5.1703432291105855e-06 2023-01-22 20:09:21.293078: step: 1056/530, loss: 0.009345858357846737 2023-01-22 20:09:22.361831: step: 1060/530, loss: 0.0018892979715019464 2023-01-22 20:09:23.447805: step: 1064/530, loss: 0.005363785196095705 2023-01-22 20:09:24.533132: step: 1068/530, loss: 0.0011568197514861822 2023-01-22 20:09:25.631771: step: 1072/530, loss: 0.0003025837941095233 2023-01-22 20:09:26.754231: step: 1076/530, loss: 0.006940390449017286 2023-01-22 20:09:27.848940: step: 1080/530, loss: 2.688643871806562e-05 2023-01-22 20:09:28.920202: step: 1084/530, loss: 0.008109815418720245 2023-01-22 20:09:30.012228: step: 1088/530, loss: 0.0033530257642269135 2023-01-22 20:09:31.098692: step: 1092/530, loss: 0.0062082624062895775 2023-01-22 20:09:32.170242: step: 1096/530, loss: 0.0001378083397867158 2023-01-22 20:09:33.254401: step: 1100/530, loss: 0.0022450617980211973 2023-01-22 20:09:34.350919: step: 1104/530, loss: 0.002642890438437462 2023-01-22 20:09:35.469045: step: 1108/530, loss: 0.010595089755952358 2023-01-22 20:09:36.562695: step: 1112/530, loss: 0.0003634699387475848 2023-01-22 20:09:37.646618: step: 1116/530, loss: 0.006039982661604881 2023-01-22 20:09:38.748690: step: 1120/530, loss: 0.005501694045960903 2023-01-22 20:09:39.825644: step: 1124/530, loss: 0.00172157003544271 2023-01-22 20:09:40.908419: step: 1128/530, loss: 0.008069985546171665 2023-01-22 20:09:42.020785: step: 1132/530, loss: 0.003147716401144862 2023-01-22 20:09:43.098910: step: 1136/530, loss: 0.005004453007131815 2023-01-22 20:09:44.177890: step: 1140/530, loss: 0.002055081073194742 2023-01-22 20:09:45.255225: step: 1144/530, loss: 0.000731030770111829 2023-01-22 20:09:46.352717: step: 1148/530, loss: 9.636824688641354e-05 2023-01-22 20:09:47.421273: step: 1152/530, loss: 0.0017672054236754775 2023-01-22 20:09:48.530736: step: 1156/530, loss: 0.003239114535972476 2023-01-22 20:09:49.618458: step: 1160/530, loss: 0.02174297720193863 2023-01-22 20:09:50.682238: step: 1164/530, loss: 0.00011597121192608029 2023-01-22 20:09:51.773855: step: 1168/530, loss: 0.001182210398837924 2023-01-22 20:09:52.883713: step: 1172/530, loss: 0.0026390645653009415 2023-01-22 20:09:53.957525: step: 1176/530, loss: 0.0038202961441129446 2023-01-22 20:09:55.072186: step: 1180/530, loss: 0.0021490994840860367 2023-01-22 20:09:56.151478: step: 1184/530, loss: 0.001816555974073708 2023-01-22 20:09:57.232539: step: 1188/530, loss: 0.004720339085906744 2023-01-22 20:09:58.310438: step: 1192/530, loss: 0.0010220394469797611 2023-01-22 20:09:59.393071: step: 1196/530, loss: 0.0024166754446923733 2023-01-22 20:10:00.496297: step: 1200/530, loss: 0.004676496144384146 2023-01-22 20:10:01.579573: step: 1204/530, loss: 0.0033705593086779118 2023-01-22 20:10:02.669529: step: 1208/530, loss: 0.0032190699130296707 2023-01-22 20:10:03.761108: step: 1212/530, loss: 7.603576523251832e-05 2023-01-22 20:10:04.840397: step: 1216/530, loss: 0.010298809967935085 2023-01-22 20:10:05.936211: step: 1220/530, loss: 0.0012661231448873878 2023-01-22 20:10:07.030968: step: 1224/530, loss: 0.002544811926782131 2023-01-22 20:10:08.104418: step: 1228/530, loss: 0.0006274183979257941 2023-01-22 20:10:09.192471: step: 1232/530, loss: 0.0069658467546105385 2023-01-22 20:10:10.262791: step: 1236/530, loss: 0.00265141692943871 2023-01-22 20:10:11.361032: step: 1240/530, loss: 0.0022913615684956312 2023-01-22 20:10:12.453514: step: 1244/530, loss: 0.02095579355955124 2023-01-22 20:10:13.527141: step: 1248/530, loss: 0.0019135121256113052 2023-01-22 20:10:14.618502: step: 1252/530, loss: 0.0001453147706342861 2023-01-22 20:10:15.713462: step: 1256/530, loss: 0.005594421643763781 2023-01-22 20:10:16.819870: step: 1260/530, loss: 0.006734446622431278 2023-01-22 20:10:17.903721: step: 1264/530, loss: 0.0046421983279287815 2023-01-22 20:10:18.999584: step: 1268/530, loss: 0.007329718209803104 2023-01-22 20:10:20.082285: step: 1272/530, loss: 8.12764628790319e-05 2023-01-22 20:10:21.169691: step: 1276/530, loss: 5.270047768135555e-05 2023-01-22 20:10:22.257912: step: 1280/530, loss: 0.0004227318277116865 2023-01-22 20:10:23.337126: step: 1284/530, loss: 0.006260464433580637 2023-01-22 20:10:24.432080: step: 1288/530, loss: 0.005704643204808235 2023-01-22 20:10:25.518209: step: 1292/530, loss: 8.435212657786906e-05 2023-01-22 20:10:26.599394: step: 1296/530, loss: 0.0003714327176567167 2023-01-22 20:10:27.694731: step: 1300/530, loss: 0.004081703722476959 2023-01-22 20:10:28.774080: step: 1304/530, loss: 0.002183932112529874 2023-01-22 20:10:29.856436: step: 1308/530, loss: 0.002861962653696537 2023-01-22 20:10:30.927485: step: 1312/530, loss: 0.002355008153244853 2023-01-22 20:10:32.024149: step: 1316/530, loss: 0.0013220246182754636 2023-01-22 20:10:33.116831: step: 1320/530, loss: 0.0032330371905118227 2023-01-22 20:10:34.217928: step: 1324/530, loss: 0.009310531429946423 2023-01-22 20:10:35.316483: step: 1328/530, loss: 0.010981257073581219 2023-01-22 20:10:36.409577: step: 1332/530, loss: 0.013804920949041843 2023-01-22 20:10:37.466916: step: 1336/530, loss: 0.012152074836194515 2023-01-22 20:10:38.531617: step: 1340/530, loss: 0.0008176719420589507 2023-01-22 20:10:39.599348: step: 1344/530, loss: 2.639052581798751e-05 2023-01-22 20:10:40.699802: step: 1348/530, loss: 2.1447528979479102e-06 2023-01-22 20:10:41.799198: step: 1352/530, loss: 0.0005587259074673057 2023-01-22 20:10:42.877621: step: 1356/530, loss: 0.0034455277491360903 2023-01-22 20:10:43.974226: step: 1360/530, loss: 0.0007288409979082644 2023-01-22 20:10:45.057296: step: 1364/530, loss: 2.9353806894505396e-05 2023-01-22 20:10:46.157842: step: 1368/530, loss: 0.0013934716116636992 2023-01-22 20:10:47.223242: step: 1372/530, loss: 0.0023119293618947268 2023-01-22 20:10:48.300469: step: 1376/530, loss: 2.198658876295667e-05 2023-01-22 20:10:49.389837: step: 1380/530, loss: 0.006924602203071117 2023-01-22 20:10:50.475872: step: 1384/530, loss: 0.005602176766842604 2023-01-22 20:10:51.562559: step: 1388/530, loss: 1.759415135893505e-05 2023-01-22 20:10:52.632331: step: 1392/530, loss: 0.001758261932991445 2023-01-22 20:10:53.728526: step: 1396/530, loss: 0.001229122281074524 2023-01-22 20:10:54.819677: step: 1400/530, loss: 0.0002035643847193569 2023-01-22 20:10:55.936465: step: 1404/530, loss: 0.00043837804696522653 2023-01-22 20:10:57.032197: step: 1408/530, loss: 0.00032678412389941514 2023-01-22 20:10:58.143160: step: 1412/530, loss: 0.0036443667486310005 2023-01-22 20:10:59.206422: step: 1416/530, loss: 0.0004399028839543462 2023-01-22 20:11:00.283643: step: 1420/530, loss: 0.00015647706459276378 2023-01-22 20:11:01.375525: step: 1424/530, loss: 0.002332886680960655 2023-01-22 20:11:02.461555: step: 1428/530, loss: 0.00021565385395660996 2023-01-22 20:11:03.540899: step: 1432/530, loss: 0.007475203834474087 2023-01-22 20:11:04.643384: step: 1436/530, loss: 0.0044013927690684795 2023-01-22 20:11:05.726547: step: 1440/530, loss: 4.1806215449469164e-05 2023-01-22 20:11:06.821617: step: 1444/530, loss: 0.0011703333584591746 2023-01-22 20:11:07.912122: step: 1448/530, loss: 0.0015794051578268409 2023-01-22 20:11:09.013250: step: 1452/530, loss: 0.00033551757223904133 2023-01-22 20:11:10.120993: step: 1456/530, loss: 9.213612793246284e-05 2023-01-22 20:11:11.201521: step: 1460/530, loss: 0.012634302489459515 2023-01-22 20:11:12.294128: step: 1464/530, loss: 0.005126113537698984 2023-01-22 20:11:13.395401: step: 1468/530, loss: 9.689124271972105e-05 2023-01-22 20:11:14.485680: step: 1472/530, loss: 0.0019329937640577555 2023-01-22 20:11:15.551557: step: 1476/530, loss: 0.008387736976146698 2023-01-22 20:11:16.631647: step: 1480/530, loss: 0.0017540312837809324 2023-01-22 20:11:17.720996: step: 1484/530, loss: 0.0008437251090072095 2023-01-22 20:11:18.803918: step: 1488/530, loss: 0.003939060959964991 2023-01-22 20:11:19.875260: step: 1492/530, loss: 0.0045392257161438465 2023-01-22 20:11:20.976776: step: 1496/530, loss: 0.008384022861719131 2023-01-22 20:11:22.068007: step: 1500/530, loss: 0.00045957029215060174 2023-01-22 20:11:23.148183: step: 1504/530, loss: 9.275861521018669e-05 2023-01-22 20:11:24.233713: step: 1508/530, loss: 0.00700340885668993 2023-01-22 20:11:25.328047: step: 1512/530, loss: 0.0007242744322866201 2023-01-22 20:11:26.397268: step: 1516/530, loss: 0.0008526495075784624 2023-01-22 20:11:27.486693: step: 1520/530, loss: 0.006042341701686382 2023-01-22 20:11:28.604858: step: 1524/530, loss: 0.016548385843634605 2023-01-22 20:11:29.717367: step: 1528/530, loss: 0.00233745900914073 2023-01-22 20:11:30.793746: step: 1532/530, loss: 0.0005690492107532918 2023-01-22 20:11:31.879653: step: 1536/530, loss: 0.00019722001161426306 2023-01-22 20:11:32.971342: step: 1540/530, loss: 0.005244697909802198 2023-01-22 20:11:34.054809: step: 1544/530, loss: 0.0006843619630672038 2023-01-22 20:11:35.156248: step: 1548/530, loss: 0.0026567126624286175 2023-01-22 20:11:36.244104: step: 1552/530, loss: 0.007519073318690062 2023-01-22 20:11:37.321394: step: 1556/530, loss: 0.0020052820909768343 2023-01-22 20:11:38.448363: step: 1560/530, loss: 1.000175871013198e-06 2023-01-22 20:11:39.526318: step: 1564/530, loss: 0.0036371080204844475 2023-01-22 20:11:40.637479: step: 1568/530, loss: 0.0001614685170352459 2023-01-22 20:11:41.746072: step: 1572/530, loss: 0.003568487474694848 2023-01-22 20:11:42.817844: step: 1576/530, loss: 0.0001279938587686047 2023-01-22 20:11:43.933846: step: 1580/530, loss: 0.005685790907591581 2023-01-22 20:11:45.015216: step: 1584/530, loss: 0.00011141136201331392 2023-01-22 20:11:46.097276: step: 1588/530, loss: 0.0003209089918527752 2023-01-22 20:11:47.205522: step: 1592/530, loss: 0.00011579424608498812 2023-01-22 20:11:48.298649: step: 1596/530, loss: 0.005333163775503635 2023-01-22 20:11:49.387944: step: 1600/530, loss: 0.0013128520222380757 2023-01-22 20:11:50.496611: step: 1604/530, loss: 0.0004314040415920317 2023-01-22 20:11:51.600622: step: 1608/530, loss: 0.0031901539769023657 2023-01-22 20:11:52.710278: step: 1612/530, loss: 0.0036830303724855185 2023-01-22 20:11:53.792977: step: 1616/530, loss: 0.00030810883617959917 2023-01-22 20:11:54.881972: step: 1620/530, loss: 0.0025271351914852858 2023-01-22 20:11:55.979678: step: 1624/530, loss: 0.00015104500926099718 2023-01-22 20:11:57.053816: step: 1628/530, loss: 0.0009225932881236076 2023-01-22 20:11:58.134813: step: 1632/530, loss: 0.006921342574059963 2023-01-22 20:11:59.226037: step: 1636/530, loss: 0.012433944270014763 2023-01-22 20:12:00.304708: step: 1640/530, loss: 0.002472271677106619 2023-01-22 20:12:01.401146: step: 1644/530, loss: 0.01649395376443863 2023-01-22 20:12:02.477475: step: 1648/530, loss: 0.0005079595721326768 2023-01-22 20:12:03.554321: step: 1652/530, loss: 0.001471898751333356 2023-01-22 20:12:04.627602: step: 1656/530, loss: 0.0005140473367646337 2023-01-22 20:12:05.699470: step: 1660/530, loss: 7.484033267246559e-05 2023-01-22 20:12:06.768388: step: 1664/530, loss: 0.006606653332710266 2023-01-22 20:12:07.864278: step: 1668/530, loss: 0.0032492068130522966 2023-01-22 20:12:08.942763: step: 1672/530, loss: 7.73825649957871e-06 2023-01-22 20:12:10.040431: step: 1676/530, loss: 0.014332698658108711 2023-01-22 20:12:11.123122: step: 1680/530, loss: 0.015233784914016724 2023-01-22 20:12:12.207802: step: 1684/530, loss: 0.010254183784127235 2023-01-22 20:12:13.271011: step: 1688/530, loss: 0.00034514759317971766 2023-01-22 20:12:14.367935: step: 1692/530, loss: 0.00027492354274727404 2023-01-22 20:12:15.447137: step: 1696/530, loss: 0.0005268744425848126 2023-01-22 20:12:16.541522: step: 1700/530, loss: 3.061047027586028e-05 2023-01-22 20:12:17.633649: step: 1704/530, loss: 0.004546803887933493 2023-01-22 20:12:18.719996: step: 1708/530, loss: 0.0007081169751472771 2023-01-22 20:12:19.795345: step: 1712/530, loss: 0.000974190654233098 2023-01-22 20:12:20.884084: step: 1716/530, loss: 0.002233486855402589 2023-01-22 20:12:21.969186: step: 1720/530, loss: 0.00027596502332016826 2023-01-22 20:12:23.057582: step: 1724/530, loss: 0.0012686955742537975 2023-01-22 20:12:24.167596: step: 1728/530, loss: 0.011882033199071884 2023-01-22 20:12:25.273313: step: 1732/530, loss: 0.0016740866703912616 2023-01-22 20:12:26.380348: step: 1736/530, loss: 0.0036670188419520855 2023-01-22 20:12:27.467981: step: 1740/530, loss: 0.0006247829296626151 2023-01-22 20:12:28.561668: step: 1744/530, loss: 0.0002302930224686861 2023-01-22 20:12:29.639591: step: 1748/530, loss: 0.004521691240370274 2023-01-22 20:12:30.720841: step: 1752/530, loss: 6.992492853896692e-05 2023-01-22 20:12:31.810558: step: 1756/530, loss: 0.0025664132554084063 2023-01-22 20:12:32.894062: step: 1760/530, loss: 0.0001788092777132988 2023-01-22 20:12:33.986214: step: 1764/530, loss: 0.0027129855006933212 2023-01-22 20:12:35.075190: step: 1768/530, loss: 0.0022424794733524323 2023-01-22 20:12:36.160542: step: 1772/530, loss: 0.014447060413658619 2023-01-22 20:12:37.250657: step: 1776/530, loss: 0.015384789556264877 2023-01-22 20:12:38.365279: step: 1780/530, loss: 0.0037047071382403374 2023-01-22 20:12:39.468449: step: 1784/530, loss: 0.0019358344143256545 2023-01-22 20:12:40.535434: step: 1788/530, loss: 0.0011915653012692928 2023-01-22 20:12:41.628543: step: 1792/530, loss: 0.0050245351158082485 2023-01-22 20:12:42.707450: step: 1796/530, loss: 0.0036216562148183584 2023-01-22 20:12:43.778140: step: 1800/530, loss: 0.00040984529186971486 2023-01-22 20:12:44.864199: step: 1804/530, loss: 0.003871543100103736 2023-01-22 20:12:45.959654: step: 1808/530, loss: 0.001043385243974626 2023-01-22 20:12:47.020050: step: 1812/530, loss: 0.0014169103233143687 2023-01-22 20:12:48.106263: step: 1816/530, loss: 0.0010335597908124328 2023-01-22 20:12:49.202786: step: 1820/530, loss: 0.00853751227259636 2023-01-22 20:12:50.289509: step: 1824/530, loss: 0.001902538351714611 2023-01-22 20:12:51.393939: step: 1828/530, loss: 0.005769925657659769 2023-01-22 20:12:52.470049: step: 1832/530, loss: 0.00010788224608404562 2023-01-22 20:12:53.551281: step: 1836/530, loss: 0.0002556719118729234 2023-01-22 20:12:54.629293: step: 1840/530, loss: 0.0023373058065772057 2023-01-22 20:12:55.717937: step: 1844/530, loss: 0.0018819218967109919 2023-01-22 20:12:56.830940: step: 1848/530, loss: 0.0053341928869485855 2023-01-22 20:12:57.907831: step: 1852/530, loss: 0.0010817032307386398 2023-01-22 20:12:58.996543: step: 1856/530, loss: 0.004029288422316313 2023-01-22 20:13:00.091588: step: 1860/530, loss: 0.0005967693869024515 2023-01-22 20:13:01.167720: step: 1864/530, loss: 0.012114092707633972 2023-01-22 20:13:02.246224: step: 1868/530, loss: 0.00201412639580667 2023-01-22 20:13:03.322194: step: 1872/530, loss: 0.0019678636454045773 2023-01-22 20:13:04.386287: step: 1876/530, loss: 0.004111373797059059 2023-01-22 20:13:05.467189: step: 1880/530, loss: 0.007007824257016182 2023-01-22 20:13:06.541042: step: 1884/530, loss: 0.00036227283999323845 2023-01-22 20:13:07.629368: step: 1888/530, loss: 0.004348426591604948 2023-01-22 20:13:08.689524: step: 1892/530, loss: 0.001902793999761343 2023-01-22 20:13:09.793596: step: 1896/530, loss: 0.0016491325804963708 2023-01-22 20:13:10.849098: step: 1900/530, loss: 0.003511815331876278 2023-01-22 20:13:11.927166: step: 1904/530, loss: 0.002622359897941351 2023-01-22 20:13:13.016856: step: 1908/530, loss: 0.0013616224750876427 2023-01-22 20:13:14.095479: step: 1912/530, loss: 0.0017233459511771798 2023-01-22 20:13:15.189572: step: 1916/530, loss: 0.01039955485612154 2023-01-22 20:13:16.267550: step: 1920/530, loss: 0.003541199490427971 2023-01-22 20:13:17.354021: step: 1924/530, loss: 0.004119502380490303 2023-01-22 20:13:18.429305: step: 1928/530, loss: 0.00024195419973693788 2023-01-22 20:13:19.500016: step: 1932/530, loss: 0.01525817159563303 2023-01-22 20:13:20.571982: step: 1936/530, loss: 0.00019643902487587184 2023-01-22 20:13:21.667030: step: 1940/530, loss: 0.0038997665978968143 2023-01-22 20:13:22.737802: step: 1944/530, loss: 0.00576160941272974 2023-01-22 20:13:23.796958: step: 1948/530, loss: 5.638922448270023e-05 2023-01-22 20:13:24.893010: step: 1952/530, loss: 0.007332270033657551 2023-01-22 20:13:25.986109: step: 1956/530, loss: 0.001038927468471229 2023-01-22 20:13:27.091645: step: 1960/530, loss: 0.0007676129462197423 2023-01-22 20:13:28.178792: step: 1964/530, loss: 0.0017081722617149353 2023-01-22 20:13:29.256815: step: 1968/530, loss: 0.001446377718821168 2023-01-22 20:13:30.325649: step: 1972/530, loss: 7.40698233130388e-05 2023-01-22 20:13:31.430134: step: 1976/530, loss: 0.015186567790806293 2023-01-22 20:13:32.532393: step: 1980/530, loss: 0.004140587989240885 2023-01-22 20:13:33.612327: step: 1984/530, loss: 0.0013683964498341084 2023-01-22 20:13:34.704641: step: 1988/530, loss: 0.004019567742943764 2023-01-22 20:13:35.780427: step: 1992/530, loss: 0.00021876940445508808 2023-01-22 20:13:36.893654: step: 1996/530, loss: 0.0026058435905724764 2023-01-22 20:13:37.973465: step: 2000/530, loss: 3.5194450902054086e-05 2023-01-22 20:13:39.053489: step: 2004/530, loss: 0.0012629564153030515 2023-01-22 20:13:40.148846: step: 2008/530, loss: 0.003418681211769581 2023-01-22 20:13:41.229805: step: 2012/530, loss: 0.00518101267516613 2023-01-22 20:13:42.311270: step: 2016/530, loss: 0.001349366852082312 2023-01-22 20:13:43.399295: step: 2020/530, loss: 0.0004321894666645676 2023-01-22 20:13:44.475106: step: 2024/530, loss: 0.0030992792453616858 2023-01-22 20:13:45.573716: step: 2028/530, loss: 0.003331840503960848 2023-01-22 20:13:46.659764: step: 2032/530, loss: 0.000894597265869379 2023-01-22 20:13:47.722789: step: 2036/530, loss: 0.007164007984101772 2023-01-22 20:13:48.809888: step: 2040/530, loss: 0.009799154475331306 2023-01-22 20:13:49.901397: step: 2044/530, loss: 0.0047544799745082855 2023-01-22 20:13:51.014815: step: 2048/530, loss: 0.007946967147290707 2023-01-22 20:13:52.089437: step: 2052/530, loss: 0.0020527716260403395 2023-01-22 20:13:53.167627: step: 2056/530, loss: 0.0022000509779900312 2023-01-22 20:13:54.245396: step: 2060/530, loss: 5.367500762076816e-06 2023-01-22 20:13:55.333082: step: 2064/530, loss: 0.0034030878450721502 2023-01-22 20:13:56.415482: step: 2068/530, loss: 0.011891954578459263 2023-01-22 20:13:57.504405: step: 2072/530, loss: 0.0049121929332613945 2023-01-22 20:13:58.585615: step: 2076/530, loss: 0.00882336962968111 2023-01-22 20:13:59.658819: step: 2080/530, loss: 0.0031558808404952288 2023-01-22 20:14:00.740289: step: 2084/530, loss: 0.006491594482213259 2023-01-22 20:14:01.838418: step: 2088/530, loss: 0.0003341978008393198 2023-01-22 20:14:02.938050: step: 2092/530, loss: 0.008969110436737537 2023-01-22 20:14:04.041925: step: 2096/530, loss: 0.0 2023-01-22 20:14:05.114560: step: 2100/530, loss: 0.00013284842134453356 2023-01-22 20:14:06.184850: step: 2104/530, loss: 0.00024358122027479112 2023-01-22 20:14:07.288605: step: 2108/530, loss: 0.0021814615465700626 2023-01-22 20:14:08.378487: step: 2112/530, loss: 0.01966274343430996 2023-01-22 20:14:09.465781: step: 2116/530, loss: 0.006108695175498724 2023-01-22 20:14:10.548607: step: 2120/530, loss: 5.6259759730892256e-05 ================================================== Loss: 0.004 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3383751927029805, 'r': 0.3569954594741122, 'f1': 0.34743602427120435}, 'combined': 0.2560054915682558, 'stategy': 1, 'epoch': 15} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33633573932523514, 'r': 0.2907590862218155, 'f1': 0.31189117896048324}, 'combined': 0.19370083745966854, 'stategy': 1, 'epoch': 15} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34571716045783474, 'r': 0.3417811017049941, 'f1': 0.3437378637376563}, 'combined': 0.2532805311751152, 'stategy': 1, 'epoch': 15} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.319360688989712, 'r': 0.28808798057232177, 'f1': 0.30291934306668467}, 'combined': 0.18812885516773048, 'stategy': 1, 'epoch': 15} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3439301841882813, 'r': 0.3308778052817052, 'f1': 0.3372777628306743}, 'combined': 0.2485204568226021, 'stategy': 1, 'epoch': 15} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3495400277691648, 'r': 0.2988170424956533, 'f1': 0.3221944268739721}, 'combined': 0.2000996966901511, 'stategy': 1, 'epoch': 15} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 15} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.38636363636363635, 'r': 0.5543478260869565, 'f1': 0.4553571428571429}, 'combined': 0.22767857142857145, 'stategy': 1, 'epoch': 15} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 15} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 16 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 20:16:40.536916: step: 4/530, loss: 0.002954723546281457 2023-01-22 20:16:41.604519: step: 8/530, loss: 0.00044845815864391625 2023-01-22 20:16:42.696085: step: 12/530, loss: 0.0005227226647548378 2023-01-22 20:16:43.783381: step: 16/530, loss: 2.8173930331831798e-05 2023-01-22 20:16:44.856205: step: 20/530, loss: 0.0005631744861602783 2023-01-22 20:16:45.951889: step: 24/530, loss: 0.007691206876188517 2023-01-22 20:16:47.056065: step: 28/530, loss: 0.0017431259620934725 2023-01-22 20:16:48.134879: step: 32/530, loss: 0.0006445638136938214 2023-01-22 20:16:49.211029: step: 36/530, loss: 0.0014654003316536546 2023-01-22 20:16:50.290036: step: 40/530, loss: 0.00032433445448987186 2023-01-22 20:16:51.377470: step: 44/530, loss: 0.0045589879155159 2023-01-22 20:16:52.474164: step: 48/530, loss: 0.004568952135741711 2023-01-22 20:16:53.549502: step: 52/530, loss: 0.0020693992264568806 2023-01-22 20:16:54.619560: step: 56/530, loss: 0.00017161820142064244 2023-01-22 20:16:55.688258: step: 60/530, loss: 0.001358807203359902 2023-01-22 20:16:56.785632: step: 64/530, loss: 0.001410193624906242 2023-01-22 20:16:57.867492: step: 68/530, loss: 0.00045735028106719255 2023-01-22 20:16:58.947150: step: 72/530, loss: 0.0002586637856438756 2023-01-22 20:17:00.037045: step: 76/530, loss: 0.000398591801058501 2023-01-22 20:17:01.129796: step: 80/530, loss: 0.02035372145473957 2023-01-22 20:17:02.212696: step: 84/530, loss: 0.013444044627249241 2023-01-22 20:17:03.307583: step: 88/530, loss: 3.883817043970339e-05 2023-01-22 20:17:04.403962: step: 92/530, loss: 0.007603918202221394 2023-01-22 20:17:05.486599: step: 96/530, loss: 0.0008910742471925914 2023-01-22 20:17:06.604660: step: 100/530, loss: 0.0016997241182252765 2023-01-22 20:17:07.696669: step: 104/530, loss: 0.001665754010900855 2023-01-22 20:17:08.760764: step: 108/530, loss: 0.0003134464204777032 2023-01-22 20:17:09.863698: step: 112/530, loss: 0.005385173484683037 2023-01-22 20:17:10.930310: step: 116/530, loss: 0.0028875747229903936 2023-01-22 20:17:12.040346: step: 120/530, loss: 0.022701019421219826 2023-01-22 20:17:13.157072: step: 124/530, loss: 0.002913362579420209 2023-01-22 20:17:14.236606: step: 128/530, loss: 0.0007831230759620667 2023-01-22 20:17:15.324527: step: 132/530, loss: 0.0004321267770137638 2023-01-22 20:17:16.415096: step: 136/530, loss: 0.001030613319016993 2023-01-22 20:17:17.505465: step: 140/530, loss: 0.002651211805641651 2023-01-22 20:17:18.627476: step: 144/530, loss: 1.0803332450848302e-08 2023-01-22 20:17:19.699123: step: 148/530, loss: 0.004252434242516756 2023-01-22 20:17:20.773407: step: 152/530, loss: 0.005296775139868259 2023-01-22 20:17:21.863788: step: 156/530, loss: 0.00017949669563677162 2023-01-22 20:17:22.946538: step: 160/530, loss: 6.435580417019082e-06 2023-01-22 20:17:24.041528: step: 164/530, loss: 0.00034122608485631645 2023-01-22 20:17:25.123163: step: 168/530, loss: 0.0010028555989265442 2023-01-22 20:17:26.204424: step: 172/530, loss: 0.0027353032492101192 2023-01-22 20:17:27.285964: step: 176/530, loss: 0.00256900442764163 2023-01-22 20:17:28.375580: step: 180/530, loss: 0.01153743639588356 2023-01-22 20:17:29.440237: step: 184/530, loss: 0.0011792861623689532 2023-01-22 20:17:30.522217: step: 188/530, loss: 0.0007198047824203968 2023-01-22 20:17:31.619816: step: 192/530, loss: 0.006728826556354761 2023-01-22 20:17:32.704780: step: 196/530, loss: 0.0003828633052762598 2023-01-22 20:17:33.778127: step: 200/530, loss: 0.002646331675350666 2023-01-22 20:17:34.858809: step: 204/530, loss: 0.001077571650967002 2023-01-22 20:17:35.945201: step: 208/530, loss: 0.000652323302347213 2023-01-22 20:17:37.065633: step: 212/530, loss: 0.0030014568474143744 2023-01-22 20:17:38.185957: step: 216/530, loss: 0.003260666271671653 2023-01-22 20:17:39.280235: step: 220/530, loss: 0.001680352259427309 2023-01-22 20:17:40.369162: step: 224/530, loss: 0.0008825248805806041 2023-01-22 20:17:41.431583: step: 228/530, loss: 0.0011361065553501248 2023-01-22 20:17:42.537912: step: 232/530, loss: 0.005784417502582073 2023-01-22 20:17:43.611209: step: 236/530, loss: 0.007462788838893175 2023-01-22 20:17:44.698618: step: 240/530, loss: 0.0007599100354127586 2023-01-22 20:17:45.797965: step: 244/530, loss: 0.004313374403864145 2023-01-22 20:17:46.862651: step: 248/530, loss: 6.927909453224856e-06 2023-01-22 20:17:47.967725: step: 252/530, loss: 0.0004326468624640256 2023-01-22 20:17:49.053203: step: 256/530, loss: 0.008995186537504196 2023-01-22 20:17:50.148681: step: 260/530, loss: 0.00029355150763876736 2023-01-22 20:17:51.249525: step: 264/530, loss: 0.00486218836158514 2023-01-22 20:17:52.326616: step: 268/530, loss: 0.0048637669533491135 2023-01-22 20:17:53.402071: step: 272/530, loss: 0.0021844892762601376 2023-01-22 20:17:54.500347: step: 276/530, loss: 0.002423346508294344 2023-01-22 20:17:55.588565: step: 280/530, loss: 0.0022170129232108593 2023-01-22 20:17:56.687407: step: 284/530, loss: 0.0038028659764677286 2023-01-22 20:17:57.777942: step: 288/530, loss: 0.00030519781284965575 2023-01-22 20:17:58.839392: step: 292/530, loss: 0.0012181508354842663 2023-01-22 20:17:59.938720: step: 296/530, loss: 0.0001642900169827044 2023-01-22 20:18:01.029648: step: 300/530, loss: 0.0016337765846401453 2023-01-22 20:18:02.118332: step: 304/530, loss: 2.640813727339264e-05 2023-01-22 20:18:03.216070: step: 308/530, loss: 0.005103096831589937 2023-01-22 20:18:04.309433: step: 312/530, loss: 4.338818325777538e-05 2023-01-22 20:18:05.392978: step: 316/530, loss: 0.007284747902303934 2023-01-22 20:18:06.477276: step: 320/530, loss: 0.01187017373740673 2023-01-22 20:18:07.566751: step: 324/530, loss: 0.003390074707567692 2023-01-22 20:18:08.675932: step: 328/530, loss: 0.007587057538330555 2023-01-22 20:18:09.752619: step: 332/530, loss: 0.005341880023479462 2023-01-22 20:18:10.830805: step: 336/530, loss: 0.0011350206332281232 2023-01-22 20:18:11.920617: step: 340/530, loss: 0.0025320881977677345 2023-01-22 20:18:13.039853: step: 344/530, loss: 0.0008874781779013574 2023-01-22 20:18:14.132730: step: 348/530, loss: 0.002052400493994355 2023-01-22 20:18:15.216336: step: 352/530, loss: 0.0024771452881395817 2023-01-22 20:18:16.325824: step: 356/530, loss: 0.00033059160341508687 2023-01-22 20:18:17.401794: step: 360/530, loss: 0.00028168834978714585 2023-01-22 20:18:18.473075: step: 364/530, loss: 0.0006801236886531115 2023-01-22 20:18:19.570276: step: 368/530, loss: 0.006793640088289976 2023-01-22 20:18:20.665045: step: 372/530, loss: 1.2780573342752177e-05 2023-01-22 20:18:21.749470: step: 376/530, loss: 0.0005107701290398836 2023-01-22 20:18:22.812621: step: 380/530, loss: 0.00029774016002193093 2023-01-22 20:18:23.890070: step: 384/530, loss: 0.00011703440395649523 2023-01-22 20:18:24.967522: step: 388/530, loss: 2.059024882328231e-05 2023-01-22 20:18:26.045218: step: 392/530, loss: 0.0007314326358027756 2023-01-22 20:18:27.124817: step: 396/530, loss: 0.0009269976289942861 2023-01-22 20:18:28.208266: step: 400/530, loss: 0.0008016666979528964 2023-01-22 20:18:29.284871: step: 404/530, loss: 0.00016452903219033033 2023-01-22 20:18:30.369539: step: 408/530, loss: 0.005205125547945499 2023-01-22 20:18:31.469890: step: 412/530, loss: 0.0025602970272302628 2023-01-22 20:18:32.548348: step: 416/530, loss: 0.0008605541661381721 2023-01-22 20:18:33.639918: step: 420/530, loss: 3.0510685974149965e-05 2023-01-22 20:18:34.722295: step: 424/530, loss: 0.006701792124658823 2023-01-22 20:18:35.810784: step: 428/530, loss: 0.0014641211600974202 2023-01-22 20:18:36.925128: step: 432/530, loss: 1.4339184417622164e-05 2023-01-22 20:18:38.021031: step: 436/530, loss: 0.0010109801078215241 2023-01-22 20:18:39.102882: step: 440/530, loss: 0.0006940175080671906 2023-01-22 20:18:40.187765: step: 444/530, loss: 0.00990916509181261 2023-01-22 20:18:41.280888: step: 448/530, loss: 0.0008067302405834198 2023-01-22 20:18:42.375891: step: 452/530, loss: 0.004962479695677757 2023-01-22 20:18:43.461388: step: 456/530, loss: 0.0002970180648844689 2023-01-22 20:18:44.537344: step: 460/530, loss: 0.009171870537102222 2023-01-22 20:18:45.635887: step: 464/530, loss: 0.00016788435459602624 2023-01-22 20:18:46.747857: step: 468/530, loss: 0.005036230199038982 2023-01-22 20:18:47.872096: step: 472/530, loss: 0.003540154080837965 2023-01-22 20:18:48.964394: step: 476/530, loss: 0.009947326965630054 2023-01-22 20:18:50.042859: step: 480/530, loss: 9.142982889898121e-06 2023-01-22 20:18:51.121365: step: 484/530, loss: 0.01023060828447342 2023-01-22 20:18:52.193570: step: 488/530, loss: 0.001469960785470903 2023-01-22 20:18:53.268065: step: 492/530, loss: 0.000816535553894937 2023-01-22 20:18:54.364058: step: 496/530, loss: 0.006719451863318682 2023-01-22 20:18:55.444422: step: 500/530, loss: 0.0034260135143995285 2023-01-22 20:18:56.526041: step: 504/530, loss: 0.0031876498833298683 2023-01-22 20:18:57.632806: step: 508/530, loss: 0.0005767729016952217 2023-01-22 20:18:58.717640: step: 512/530, loss: 0.0016765849431976676 2023-01-22 20:18:59.796071: step: 516/530, loss: 0.00012110883835703135 2023-01-22 20:19:00.906873: step: 520/530, loss: 0.0004973490140400827 2023-01-22 20:19:01.960355: step: 524/530, loss: 0.00018373607599642128 2023-01-22 20:19:03.053494: step: 528/530, loss: 0.004958410281687975 2023-01-22 20:19:04.139444: step: 532/530, loss: 0.0017065670108422637 2023-01-22 20:19:05.228070: step: 536/530, loss: 0.0040092021226882935 2023-01-22 20:19:06.302588: step: 540/530, loss: 0.03397200256586075 2023-01-22 20:19:07.385467: step: 544/530, loss: 0.0008486725273542106 2023-01-22 20:19:08.466306: step: 548/530, loss: 2.9967008231324144e-05 2023-01-22 20:19:09.557851: step: 552/530, loss: 0.0010432637063786387 2023-01-22 20:19:10.655708: step: 556/530, loss: 0.0027807482983917 2023-01-22 20:19:11.740067: step: 560/530, loss: 6.872442463645712e-05 2023-01-22 20:19:12.834773: step: 564/530, loss: 0.0013290123315528035 2023-01-22 20:19:13.905741: step: 568/530, loss: 0.006641450338065624 2023-01-22 20:19:14.994043: step: 572/530, loss: 0.003023469587787986 2023-01-22 20:19:16.087773: step: 576/530, loss: 0.002972981659695506 2023-01-22 20:19:17.184100: step: 580/530, loss: 3.284886770416051e-05 2023-01-22 20:19:18.272031: step: 584/530, loss: 0.0031865399796515703 2023-01-22 20:19:19.365427: step: 588/530, loss: 0.007889127358794212 2023-01-22 20:19:20.448184: step: 592/530, loss: 0.0038619008846580982 2023-01-22 20:19:21.506473: step: 596/530, loss: 0.0009821607964113355 2023-01-22 20:19:22.600157: step: 600/530, loss: 6.619410851271823e-05 2023-01-22 20:19:23.680181: step: 604/530, loss: 0.002822831505909562 2023-01-22 20:19:24.773928: step: 608/530, loss: 0.005496440455317497 2023-01-22 20:19:25.856331: step: 612/530, loss: 0.009657280519604683 2023-01-22 20:19:26.950003: step: 616/530, loss: 0.0016709959600120783 2023-01-22 20:19:28.053049: step: 620/530, loss: 0.0014983081491664052 2023-01-22 20:19:29.140385: step: 624/530, loss: 0.004068445414304733 2023-01-22 20:19:30.226086: step: 628/530, loss: 8.508070550306002e-07 2023-01-22 20:19:31.323334: step: 632/530, loss: 5.519353726413101e-05 2023-01-22 20:19:32.411366: step: 636/530, loss: 0.0001397411251673475 2023-01-22 20:19:33.498851: step: 640/530, loss: 0.0014539090916514397 2023-01-22 20:19:34.591602: step: 644/530, loss: 3.7332079955376685e-05 2023-01-22 20:19:35.662412: step: 648/530, loss: 0.00031373254023492336 2023-01-22 20:19:36.766077: step: 652/530, loss: 0.0017929950263351202 2023-01-22 20:19:37.847724: step: 656/530, loss: 1.528276357021241e-06 2023-01-22 20:19:38.955463: step: 660/530, loss: 1.6391229706869126e-08 2023-01-22 20:19:40.032396: step: 664/530, loss: 2.3388469344354235e-05 2023-01-22 20:19:41.110070: step: 668/530, loss: 0.0 2023-01-22 20:19:42.205327: step: 672/530, loss: 0.005200324580073357 2023-01-22 20:19:43.270630: step: 676/530, loss: 4.359983722679317e-05 2023-01-22 20:19:44.357325: step: 680/530, loss: 1.058614429894078e-06 2023-01-22 20:19:45.440040: step: 684/530, loss: 1.3914585679231095e-06 2023-01-22 20:19:46.522179: step: 688/530, loss: 0.001755238277837634 2023-01-22 20:19:47.605516: step: 692/530, loss: 5.841856818733504e-06 2023-01-22 20:19:48.694712: step: 696/530, loss: 0.00015238371270243078 2023-01-22 20:19:49.777334: step: 700/530, loss: 0.0034832616802304983 2023-01-22 20:19:50.876458: step: 704/530, loss: 0.0026851161383092403 2023-01-22 20:19:51.951031: step: 708/530, loss: 0.00034477890585549176 2023-01-22 20:19:53.031762: step: 712/530, loss: 0.0001400583132635802 2023-01-22 20:19:54.116035: step: 716/530, loss: 0.000933889125008136 2023-01-22 20:19:55.192204: step: 720/530, loss: 0.0009453259408473969 2023-01-22 20:19:56.296337: step: 724/530, loss: 0.0011413487372919917 2023-01-22 20:19:57.401082: step: 728/530, loss: 0.006688188295811415 2023-01-22 20:19:58.515475: step: 732/530, loss: 0.003394009545445442 2023-01-22 20:19:59.610178: step: 736/530, loss: 0.0033763854298740625 2023-01-22 20:20:00.722553: step: 740/530, loss: 0.0028470607940107584 2023-01-22 20:20:01.809260: step: 744/530, loss: 0.0010789900552481413 2023-01-22 20:20:02.927249: step: 748/530, loss: 0.0006434411625377834 2023-01-22 20:20:04.017457: step: 752/530, loss: 0.0030373719055205584 2023-01-22 20:20:05.094001: step: 756/530, loss: 0.0013517733896151185 2023-01-22 20:20:06.176519: step: 760/530, loss: 0.0007551456801593304 2023-01-22 20:20:07.275072: step: 764/530, loss: 0.011850315146148205 2023-01-22 20:20:08.362983: step: 768/530, loss: 0.0019961909856647253 2023-01-22 20:20:09.457071: step: 772/530, loss: 0.0007041761418804526 2023-01-22 20:20:10.559542: step: 776/530, loss: 0.00309159979224205 2023-01-22 20:20:11.662310: step: 780/530, loss: 0.0011339497286826372 2023-01-22 20:20:12.763764: step: 784/530, loss: 6.161235432955436e-06 2023-01-22 20:20:13.859244: step: 788/530, loss: 0.0005244814674369991 2023-01-22 20:20:14.945712: step: 792/530, loss: 0.005705093964934349 2023-01-22 20:20:16.016121: step: 796/530, loss: 0.0037209982983767986 2023-01-22 20:20:17.093508: step: 800/530, loss: 5.357477493816987e-05 2023-01-22 20:20:18.177700: step: 804/530, loss: 0.007990230806171894 2023-01-22 20:20:19.253534: step: 808/530, loss: 0.0004635354853235185 2023-01-22 20:20:20.349104: step: 812/530, loss: 0.002716107526794076 2023-01-22 20:20:21.418067: step: 816/530, loss: 0.005373099353164434 2023-01-22 20:20:22.523353: step: 820/530, loss: 0.0042391931638121605 2023-01-22 20:20:23.585865: step: 824/530, loss: 0.0003886620106641203 2023-01-22 20:20:24.697996: step: 828/530, loss: 0.0003630721475929022 2023-01-22 20:20:25.780485: step: 832/530, loss: 0.0016245156293734908 2023-01-22 20:20:26.857279: step: 836/530, loss: 0.0016663596034049988 2023-01-22 20:20:27.950114: step: 840/530, loss: 4.6407927584368736e-05 2023-01-22 20:20:29.049068: step: 844/530, loss: 0.03343836963176727 2023-01-22 20:20:30.130577: step: 848/530, loss: 0.0015235901810228825 2023-01-22 20:20:31.220791: step: 852/530, loss: 2.3184093151940033e-05 2023-01-22 20:20:32.317974: step: 856/530, loss: 0.000152737382450141 2023-01-22 20:20:33.420903: step: 860/530, loss: 0.008834323845803738 2023-01-22 20:20:34.520926: step: 864/530, loss: 0.0021855863742530346 2023-01-22 20:20:35.604771: step: 868/530, loss: 1.8849797925213352e-05 2023-01-22 20:20:36.717663: step: 872/530, loss: 4.739106589113362e-05 2023-01-22 20:20:37.791827: step: 876/530, loss: 4.2123956518480554e-05 2023-01-22 20:20:38.889378: step: 880/530, loss: 0.00017269035743083805 2023-01-22 20:20:39.968256: step: 884/530, loss: 0.000481678667711094 2023-01-22 20:20:41.038406: step: 888/530, loss: 0.0017502587288618088 2023-01-22 20:20:42.135826: step: 892/530, loss: 0.010046809911727905 2023-01-22 20:20:43.223514: step: 896/530, loss: 0.004912385251373053 2023-01-22 20:20:44.308812: step: 900/530, loss: 0.0021108752116560936 2023-01-22 20:20:45.376502: step: 904/530, loss: 0.00012018627603538334 2023-01-22 20:20:46.478413: step: 908/530, loss: 0.0019957348704338074 2023-01-22 20:20:47.555616: step: 912/530, loss: 0.0006939433515071869 2023-01-22 20:20:48.638217: step: 916/530, loss: 0.0043212249875068665 2023-01-22 20:20:49.746659: step: 920/530, loss: 0.006252510938793421 2023-01-22 20:20:50.830316: step: 924/530, loss: 0.0007723422022536397 2023-01-22 20:20:51.914471: step: 928/530, loss: 0.0011998937698081136 2023-01-22 20:20:52.987042: step: 932/530, loss: 0.006741023156791925 2023-01-22 20:20:54.068358: step: 936/530, loss: 3.805392043432221e-05 2023-01-22 20:20:55.162033: step: 940/530, loss: 0.00033521157456561923 2023-01-22 20:20:56.269978: step: 944/530, loss: 0.007296199444681406 2023-01-22 20:20:57.367135: step: 948/530, loss: 0.0022839608136564493 2023-01-22 20:20:58.438347: step: 952/530, loss: 0.0009386551682837307 2023-01-22 20:20:59.525162: step: 956/530, loss: 0.002275177976116538 2023-01-22 20:21:00.609085: step: 960/530, loss: 0.00646181171759963 2023-01-22 20:21:01.719061: step: 964/530, loss: 0.0026393351145088673 2023-01-22 20:21:02.788253: step: 968/530, loss: 0.0013786256313323975 2023-01-22 20:21:03.870277: step: 972/530, loss: 3.009774218298844e-06 2023-01-22 20:21:04.979390: step: 976/530, loss: 0.005927097983658314 2023-01-22 20:21:06.077167: step: 980/530, loss: 0.00010646599548636004 2023-01-22 20:21:07.156044: step: 984/530, loss: 0.0033073725644499063 2023-01-22 20:21:08.248513: step: 988/530, loss: 8.717246964806691e-05 2023-01-22 20:21:09.321157: step: 992/530, loss: 0.0015189225086942315 2023-01-22 20:21:10.403791: step: 996/530, loss: 0.0008218188886530697 2023-01-22 20:21:11.491241: step: 1000/530, loss: 0.01095456350594759 2023-01-22 20:21:12.564005: step: 1004/530, loss: 0.004398738499730825 2023-01-22 20:21:13.659721: step: 1008/530, loss: 0.004040711093693972 2023-01-22 20:21:14.742019: step: 1012/530, loss: 0.0013462050119414926 2023-01-22 20:21:15.828091: step: 1016/530, loss: 0.018077151849865913 2023-01-22 20:21:16.912772: step: 1020/530, loss: 0.0008204568293876946 2023-01-22 20:21:18.008508: step: 1024/530, loss: 0.008758884854614735 2023-01-22 20:21:19.096078: step: 1028/530, loss: 0.007381300907582045 2023-01-22 20:21:20.182339: step: 1032/530, loss: 0.0020989899057894945 2023-01-22 20:21:21.277032: step: 1036/530, loss: 0.005010779947042465 2023-01-22 20:21:22.357743: step: 1040/530, loss: 1.5025427273940295e-05 2023-01-22 20:21:23.441802: step: 1044/530, loss: 0.010882746428251266 2023-01-22 20:21:24.546732: step: 1048/530, loss: 0.0030730734579265118 2023-01-22 20:21:25.605778: step: 1052/530, loss: 1.9689518012455665e-05 2023-01-22 20:21:26.688973: step: 1056/530, loss: 1.5188254110398702e-05 2023-01-22 20:21:27.768645: step: 1060/530, loss: 0.0003083275514654815 2023-01-22 20:21:28.854234: step: 1064/530, loss: 0.005573458969593048 2023-01-22 20:21:29.963060: step: 1068/530, loss: 0.022893719375133514 2023-01-22 20:21:31.048206: step: 1072/530, loss: 0.0025528757832944393 2023-01-22 20:21:32.112694: step: 1076/530, loss: 0.00040614043246023357 2023-01-22 20:21:33.189648: step: 1080/530, loss: 0.0025634909979999065 2023-01-22 20:21:34.277845: step: 1084/530, loss: 0.0006221125368028879 2023-01-22 20:21:35.373071: step: 1088/530, loss: 0.006092137191444635 2023-01-22 20:21:36.451825: step: 1092/530, loss: 0.00023583446454722434 2023-01-22 20:21:37.532146: step: 1096/530, loss: 0.0018546071369200945 2023-01-22 20:21:38.632647: step: 1100/530, loss: 0.001455626799724996 2023-01-22 20:21:39.722701: step: 1104/530, loss: 0.0009344169520772994 2023-01-22 20:21:40.822389: step: 1108/530, loss: 0.001996472245082259 2023-01-22 20:21:41.911824: step: 1112/530, loss: 0.00409529497846961 2023-01-22 20:21:43.007373: step: 1116/530, loss: 0.011121563613414764 2023-01-22 20:21:44.097087: step: 1120/530, loss: 0.0013962743105366826 2023-01-22 20:21:45.192969: step: 1124/530, loss: 0.004220105707645416 2023-01-22 20:21:46.251752: step: 1128/530, loss: 0.0031265011057257652 2023-01-22 20:21:47.327666: step: 1132/530, loss: 0.006375927943736315 2023-01-22 20:21:48.401334: step: 1136/530, loss: 0.0009379417169839144 2023-01-22 20:21:49.458875: step: 1140/530, loss: 9.866567415883765e-05 2023-01-22 20:21:50.555225: step: 1144/530, loss: 0.0006635566824115813 2023-01-22 20:21:51.626538: step: 1148/530, loss: 0.003601459553465247 2023-01-22 20:21:52.691074: step: 1152/530, loss: 0.0013722165022045374 2023-01-22 20:21:53.764950: step: 1156/530, loss: 0.0333854965865612 2023-01-22 20:21:54.872200: step: 1160/530, loss: 0.0010874661384150386 2023-01-22 20:21:55.976283: step: 1164/530, loss: 0.00022803246974945068 2023-01-22 20:21:57.056788: step: 1168/530, loss: 5.935566605330678e-06 2023-01-22 20:21:58.142100: step: 1172/530, loss: 0.0023388874251395464 2023-01-22 20:21:59.229078: step: 1176/530, loss: 0.0008275939617305994 2023-01-22 20:22:00.325591: step: 1180/530, loss: 0.00235777092166245 2023-01-22 20:22:01.416253: step: 1184/530, loss: 0.003099546767771244 2023-01-22 20:22:02.500818: step: 1188/530, loss: 0.007683195639401674 2023-01-22 20:22:03.604271: step: 1192/530, loss: 0.01222831942141056 2023-01-22 20:22:04.700075: step: 1196/530, loss: 0.0015453894156962633 2023-01-22 20:22:05.782886: step: 1200/530, loss: 0.0022118159104138613 2023-01-22 20:22:06.865810: step: 1204/530, loss: 0.006718839053064585 2023-01-22 20:22:07.968258: step: 1208/530, loss: 0.002990497974678874 2023-01-22 20:22:09.051637: step: 1212/530, loss: 0.0012237633345648646 2023-01-22 20:22:10.142675: step: 1216/530, loss: 0.01069978903979063 2023-01-22 20:22:11.239815: step: 1220/530, loss: 0.0003575255977921188 2023-01-22 20:22:12.379917: step: 1224/530, loss: 0.0004864147340413183 2023-01-22 20:22:13.463475: step: 1228/530, loss: 0.0006158277974463999 2023-01-22 20:22:14.532346: step: 1232/530, loss: 0.008188759908080101 2023-01-22 20:22:15.616850: step: 1236/530, loss: 0.006146847270429134 2023-01-22 20:22:16.733807: step: 1240/530, loss: 0.0022965569514781237 2023-01-22 20:22:17.800678: step: 1244/530, loss: 0.001639484311453998 2023-01-22 20:22:18.873785: step: 1248/530, loss: 0.006271504797041416 2023-01-22 20:22:19.970923: step: 1252/530, loss: 0.0011681526666507125 2023-01-22 20:22:21.042130: step: 1256/530, loss: 0.007113034371286631 2023-01-22 20:22:22.147064: step: 1260/530, loss: 0.005143363960087299 2023-01-22 20:22:23.239243: step: 1264/530, loss: 0.0004639250983018428 2023-01-22 20:22:24.361034: step: 1268/530, loss: 0.0005338076734915376 2023-01-22 20:22:25.437644: step: 1272/530, loss: 8.12380385468714e-05 2023-01-22 20:22:26.534503: step: 1276/530, loss: 0.0009575830190442502 2023-01-22 20:22:27.618397: step: 1280/530, loss: 0.0010877613676711917 2023-01-22 20:22:28.707793: step: 1284/530, loss: 0.0023875616025179625 2023-01-22 20:22:29.791126: step: 1288/530, loss: 0.0004638465470634401 2023-01-22 20:22:30.889971: step: 1292/530, loss: 0.002524861367419362 2023-01-22 20:22:31.973040: step: 1296/530, loss: 7.034824375296012e-05 2023-01-22 20:22:33.063759: step: 1300/530, loss: 0.004284720867872238 2023-01-22 20:22:34.148823: step: 1304/530, loss: 0.012702934443950653 2023-01-22 20:22:35.237131: step: 1308/530, loss: 0.0013486533425748348 2023-01-22 20:22:36.301935: step: 1312/530, loss: 8.894842176232487e-05 2023-01-22 20:22:37.403562: step: 1316/530, loss: 0.004712602589279413 2023-01-22 20:22:38.471917: step: 1320/530, loss: 0.001283988356590271 2023-01-22 20:22:39.541808: step: 1324/530, loss: 2.7795958885690197e-05 2023-01-22 20:22:40.630182: step: 1328/530, loss: 0.0005046577425673604 2023-01-22 20:22:41.712834: step: 1332/530, loss: 0.0006284591509029269 2023-01-22 20:22:42.778225: step: 1336/530, loss: 0.003634740598499775 2023-01-22 20:22:43.864550: step: 1340/530, loss: 7.278336124727502e-05 2023-01-22 20:22:44.971064: step: 1344/530, loss: 0.0007392282132059336 2023-01-22 20:22:46.067272: step: 1348/530, loss: 0.000643865903839469 2023-01-22 20:22:47.126718: step: 1352/530, loss: 3.5265742326373584e-07 2023-01-22 20:22:48.199120: step: 1356/530, loss: 0.0022137747146189213 2023-01-22 20:22:49.298818: step: 1360/530, loss: 0.00041922854143194854 2023-01-22 20:22:50.378980: step: 1364/530, loss: 0.0040763677097857 2023-01-22 20:22:51.471278: step: 1368/530, loss: 0.009680839255452156 2023-01-22 20:22:52.556600: step: 1372/530, loss: 0.008086957037448883 2023-01-22 20:22:53.648057: step: 1376/530, loss: 0.004043171647936106 2023-01-22 20:22:54.722146: step: 1380/530, loss: 0.0018598099704831839 2023-01-22 20:22:55.811602: step: 1384/530, loss: 0.0006758856470696628 2023-01-22 20:22:56.920454: step: 1388/530, loss: 0.0037887301295995712 2023-01-22 20:22:57.989859: step: 1392/530, loss: 0.0052274675108492374 2023-01-22 20:22:59.085968: step: 1396/530, loss: 0.004116029478609562 2023-01-22 20:23:00.158732: step: 1400/530, loss: 9.88139581750147e-05 2023-01-22 20:23:01.236787: step: 1404/530, loss: 6.6203047026647255e-06 2023-01-22 20:23:02.317686: step: 1408/530, loss: 0.002617774996906519 2023-01-22 20:23:03.412009: step: 1412/530, loss: 0.001070051803253591 2023-01-22 20:23:04.490200: step: 1416/530, loss: 0.0008536711102351546 2023-01-22 20:23:05.553394: step: 1420/530, loss: 0.01228385791182518 2023-01-22 20:23:06.634242: step: 1424/530, loss: 0.0018940340960398316 2023-01-22 20:23:07.715498: step: 1428/530, loss: 6.663881504209712e-05 2023-01-22 20:23:08.803177: step: 1432/530, loss: 0.0033455672673881054 2023-01-22 20:23:09.875114: step: 1436/530, loss: 1.7605614630156197e-05 2023-01-22 20:23:10.971956: step: 1440/530, loss: 0.001410569646395743 2023-01-22 20:23:12.052217: step: 1444/530, loss: 0.006385213695466518 2023-01-22 20:23:13.110283: step: 1448/530, loss: 0.001963956281542778 2023-01-22 20:23:14.184608: step: 1452/530, loss: 0.0007068910053931177 2023-01-22 20:23:15.280083: step: 1456/530, loss: 0.0016609654994681478 2023-01-22 20:23:16.360276: step: 1460/530, loss: 0.002481671515852213 2023-01-22 20:23:17.462129: step: 1464/530, loss: 0.0023920934181660414 2023-01-22 20:23:18.532039: step: 1468/530, loss: 0.0003659272624645382 2023-01-22 20:23:19.598990: step: 1472/530, loss: 0.0005528698093257844 2023-01-22 20:23:20.675622: step: 1476/530, loss: 0.00032423148513771594 2023-01-22 20:23:21.754414: step: 1480/530, loss: 0.0002946548629552126 2023-01-22 20:23:22.829226: step: 1484/530, loss: 0.0008898377418518066 2023-01-22 20:23:23.898646: step: 1488/530, loss: 0.0024196216836571693 2023-01-22 20:23:24.994290: step: 1492/530, loss: 0.013456962071359158 2023-01-22 20:23:26.055257: step: 1496/530, loss: 0.0010293158702552319 2023-01-22 20:23:27.125793: step: 1500/530, loss: 0.0020077268127352 2023-01-22 20:23:28.200430: step: 1504/530, loss: 0.013075864873826504 2023-01-22 20:23:29.299815: step: 1508/530, loss: 5.658302325173281e-05 2023-01-22 20:23:30.388461: step: 1512/530, loss: 0.0009153262944892049 2023-01-22 20:23:31.488233: step: 1516/530, loss: 0.004963977262377739 2023-01-22 20:23:32.582911: step: 1520/530, loss: 0.0036875337827950716 2023-01-22 20:23:33.652509: step: 1524/530, loss: 0.002731300424784422 2023-01-22 20:23:34.729810: step: 1528/530, loss: 0.012656821869313717 2023-01-22 20:23:35.798854: step: 1532/530, loss: 0.0008387502748519182 2023-01-22 20:23:36.885421: step: 1536/530, loss: 0.0032218273263424635 2023-01-22 20:23:37.983592: step: 1540/530, loss: 0.00024911388754844666 2023-01-22 20:23:39.079046: step: 1544/530, loss: 0.023877687752246857 2023-01-22 20:23:40.155026: step: 1548/530, loss: 0.00823256280273199 2023-01-22 20:23:41.235855: step: 1552/530, loss: 0.02221542038023472 2023-01-22 20:23:42.337386: step: 1556/530, loss: 0.005809667985886335 2023-01-22 20:23:43.415153: step: 1560/530, loss: 0.0027239446062594652 2023-01-22 20:23:44.517920: step: 1564/530, loss: 0.022694837301969528 2023-01-22 20:23:45.602168: step: 1568/530, loss: 0.014259930700063705 2023-01-22 20:23:46.694201: step: 1572/530, loss: 0.00015027608606033027 2023-01-22 20:23:47.799544: step: 1576/530, loss: 0.005722373723983765 2023-01-22 20:23:48.873529: step: 1580/530, loss: 0.00357958790846169 2023-01-22 20:23:49.979982: step: 1584/530, loss: 0.0043758824467659 2023-01-22 20:23:51.066369: step: 1588/530, loss: 0.003674211213365197 2023-01-22 20:23:52.160107: step: 1592/530, loss: 2.4529456368327374e-06 2023-01-22 20:23:53.266132: step: 1596/530, loss: 0.0031450423412024975 2023-01-22 20:23:54.351844: step: 1600/530, loss: 0.003242489416152239 2023-01-22 20:23:55.467850: step: 1604/530, loss: 0.0006098906742408872 2023-01-22 20:23:56.574349: step: 1608/530, loss: 0.0019877140875905752 2023-01-22 20:23:57.653826: step: 1612/530, loss: 0.001345456694252789 2023-01-22 20:23:58.750701: step: 1616/530, loss: 0.002948288805782795 2023-01-22 20:23:59.818702: step: 1620/530, loss: 8.273212301901367e-07 2023-01-22 20:24:00.925484: step: 1624/530, loss: 0.0038146143779158592 2023-01-22 20:24:02.033216: step: 1628/530, loss: 0.00317201460711658 2023-01-22 20:24:03.114358: step: 1632/530, loss: 0.0015082353493198752 2023-01-22 20:24:04.212567: step: 1636/530, loss: 0.0003809299669228494 2023-01-22 20:24:05.298082: step: 1640/530, loss: 0.013876257464289665 2023-01-22 20:24:06.369139: step: 1644/530, loss: 0.00010343162284698337 2023-01-22 20:24:07.457811: step: 1648/530, loss: 0.0009813953656703234 2023-01-22 20:24:08.553615: step: 1652/530, loss: 2.960980054922402e-05 2023-01-22 20:24:09.651273: step: 1656/530, loss: 0.0052544656209647655 2023-01-22 20:24:10.737663: step: 1660/530, loss: 1.619407703401521e-05 2023-01-22 20:24:11.831183: step: 1664/530, loss: 0.001400230685248971 2023-01-22 20:24:12.931937: step: 1668/530, loss: 0.0016509218839928508 2023-01-22 20:24:14.011815: step: 1672/530, loss: 0.001079654903151095 2023-01-22 20:24:15.110188: step: 1676/530, loss: 0.004524801392108202 2023-01-22 20:24:16.183746: step: 1680/530, loss: 0.0010629636235535145 2023-01-22 20:24:17.268890: step: 1684/530, loss: 0.00010164112609345466 2023-01-22 20:24:18.364143: step: 1688/530, loss: 0.00247724587097764 2023-01-22 20:24:19.446753: step: 1692/530, loss: 0.005047983024269342 2023-01-22 20:24:20.519846: step: 1696/530, loss: 0.0013642992125824094 2023-01-22 20:24:21.597808: step: 1700/530, loss: 0.0004914554883725941 2023-01-22 20:24:22.727944: step: 1704/530, loss: 0.005199359729886055 2023-01-22 20:24:23.823423: step: 1708/530, loss: 0.0060662259347736835 2023-01-22 20:24:24.913900: step: 1712/530, loss: 0.0009265231783501804 2023-01-22 20:24:26.009838: step: 1716/530, loss: 0.0 2023-01-22 20:24:27.121447: step: 1720/530, loss: 0.0019822362810373306 2023-01-22 20:24:28.211686: step: 1724/530, loss: 3.788025787798688e-05 2023-01-22 20:24:29.317624: step: 1728/530, loss: 0.005469823721796274 2023-01-22 20:24:30.408605: step: 1732/530, loss: 0.004149814136326313 2023-01-22 20:24:31.498489: step: 1736/530, loss: 0.0017180907307192683 2023-01-22 20:24:32.572817: step: 1740/530, loss: 0.00011590938083827496 2023-01-22 20:24:33.674815: step: 1744/530, loss: 0.0024439338594675064 2023-01-22 20:24:34.767455: step: 1748/530, loss: 0.0024968907237052917 2023-01-22 20:24:35.873533: step: 1752/530, loss: 0.005898426752537489 2023-01-22 20:24:36.963618: step: 1756/530, loss: 0.002481900155544281 2023-01-22 20:24:38.049169: step: 1760/530, loss: 0.0011037297081202269 2023-01-22 20:24:39.153116: step: 1764/530, loss: 0.0024954553227871656 2023-01-22 20:24:40.220207: step: 1768/530, loss: 0.0024645228404551744 2023-01-22 20:24:41.318580: step: 1772/530, loss: 0.0009285281994380057 2023-01-22 20:24:42.391980: step: 1776/530, loss: 0.003900257172062993 2023-01-22 20:24:43.496275: step: 1780/530, loss: 0.003312863875180483 2023-01-22 20:24:44.591602: step: 1784/530, loss: 0.003721606684848666 2023-01-22 20:24:45.663225: step: 1788/530, loss: 3.9572481909999624e-05 2023-01-22 20:24:46.751248: step: 1792/530, loss: 0.014231804758310318 2023-01-22 20:24:47.834779: step: 1796/530, loss: 0.0001211568815051578 2023-01-22 20:24:48.934306: step: 1800/530, loss: 0.02522517926990986 2023-01-22 20:24:50.011252: step: 1804/530, loss: 0.0030734154861420393 2023-01-22 20:24:51.105251: step: 1808/530, loss: 0.0008686508517712355 2023-01-22 20:24:52.208704: step: 1812/530, loss: 0.0011809499701485038 2023-01-22 20:24:53.292458: step: 1816/530, loss: 0.0007994048064574599 2023-01-22 20:24:54.363619: step: 1820/530, loss: 0.002967127598822117 2023-01-22 20:24:55.447558: step: 1824/530, loss: 9.524337656330317e-06 2023-01-22 20:24:56.526932: step: 1828/530, loss: 0.004406691994518042 2023-01-22 20:24:57.621622: step: 1832/530, loss: 0.0013986529083922505 2023-01-22 20:24:58.732393: step: 1836/530, loss: 0.0016440274193882942 2023-01-22 20:24:59.808765: step: 1840/530, loss: 0.009066744707524776 2023-01-22 20:25:00.865039: step: 1844/530, loss: 0.0002761918876785785 2023-01-22 20:25:01.940793: step: 1848/530, loss: 0.0011494659120216966 2023-01-22 20:25:03.015863: step: 1852/530, loss: 0.0006082436884753406 2023-01-22 20:25:04.099092: step: 1856/530, loss: 0.005805442109704018 2023-01-22 20:25:05.212579: step: 1860/530, loss: 0.0016728354385122657 2023-01-22 20:25:06.269498: step: 1864/530, loss: 0.0005908252205699682 2023-01-22 20:25:07.349969: step: 1868/530, loss: 0.0031077589374035597 2023-01-22 20:25:08.431544: step: 1872/530, loss: 0.0036844387650489807 2023-01-22 20:25:09.510330: step: 1876/530, loss: 0.0021285268012434244 2023-01-22 20:25:10.589439: step: 1880/530, loss: 0.006949524860829115 2023-01-22 20:25:11.682835: step: 1884/530, loss: 0.002678863937035203 2023-01-22 20:25:12.799653: step: 1888/530, loss: 0.004842081572860479 2023-01-22 20:25:13.865392: step: 1892/530, loss: 0.0006235690088942647 2023-01-22 20:25:14.960749: step: 1896/530, loss: 0.0004585866117849946 2023-01-22 20:25:16.050436: step: 1900/530, loss: 0.008985369466245174 2023-01-22 20:25:17.122558: step: 1904/530, loss: 0.0001941321970662102 2023-01-22 20:25:18.188763: step: 1908/530, loss: 0.009316373616456985 2023-01-22 20:25:19.264391: step: 1912/530, loss: 0.0 2023-01-22 20:25:20.364762: step: 1916/530, loss: 0.006425163708627224 2023-01-22 20:25:21.454409: step: 1920/530, loss: 0.0010336049599573016 2023-01-22 20:25:22.548954: step: 1924/530, loss: 0.0001332381652900949 2023-01-22 20:25:23.623175: step: 1928/530, loss: 0.013687378726899624 2023-01-22 20:25:24.708845: step: 1932/530, loss: 0.0021381631959229708 2023-01-22 20:25:25.798267: step: 1936/530, loss: 0.00012012131628580391 2023-01-22 20:25:26.880020: step: 1940/530, loss: 0.00014436228957492858 2023-01-22 20:25:27.972380: step: 1944/530, loss: 0.015538678504526615 2023-01-22 20:25:29.046257: step: 1948/530, loss: 0.0001945592084666714 2023-01-22 20:25:30.141337: step: 1952/530, loss: 0.0036120894365012646 2023-01-22 20:25:31.226884: step: 1956/530, loss: 8.194353540602606e-06 2023-01-22 20:25:32.324149: step: 1960/530, loss: 0.005616932641714811 2023-01-22 20:25:33.430767: step: 1964/530, loss: 0.005948303733021021 2023-01-22 20:25:34.523823: step: 1968/530, loss: 0.00020649051293730736 2023-01-22 20:25:35.591205: step: 1972/530, loss: 0.0004324015462771058 2023-01-22 20:25:36.697767: step: 1976/530, loss: 8.814790635369718e-05 2023-01-22 20:25:37.780491: step: 1980/530, loss: 0.00025432216352783144 2023-01-22 20:25:38.872631: step: 1984/530, loss: 0.00011884964624186978 2023-01-22 20:25:39.952306: step: 1988/530, loss: 0.00917538907378912 2023-01-22 20:25:41.013510: step: 1992/530, loss: 0.0002176128327846527 2023-01-22 20:25:42.115890: step: 1996/530, loss: 0.004938729107379913 2023-01-22 20:25:43.209950: step: 2000/530, loss: 0.000126317361718975 2023-01-22 20:25:44.290142: step: 2004/530, loss: 0.017990481108427048 2023-01-22 20:25:45.374256: step: 2008/530, loss: 0.003084475640207529 2023-01-22 20:25:46.460329: step: 2012/530, loss: 0.005482024978846312 2023-01-22 20:25:47.548485: step: 2016/530, loss: 0.006015224382281303 2023-01-22 20:25:48.692199: step: 2020/530, loss: 0.001774609205313027 2023-01-22 20:25:49.766616: step: 2024/530, loss: 0.005875098519027233 2023-01-22 20:25:50.844196: step: 2028/530, loss: 0.0021836848463863134 2023-01-22 20:25:51.937735: step: 2032/530, loss: 0.002014268422499299 2023-01-22 20:25:53.001972: step: 2036/530, loss: 0.0021670558489859104 2023-01-22 20:25:54.096480: step: 2040/530, loss: 0.003708336967974901 2023-01-22 20:25:55.186378: step: 2044/530, loss: 0.0014673734549432993 2023-01-22 20:25:56.281273: step: 2048/530, loss: 0.0003642119700089097 2023-01-22 20:25:57.383447: step: 2052/530, loss: 0.008844273164868355 2023-01-22 20:25:58.485245: step: 2056/530, loss: 0.0008772752480581403 2023-01-22 20:25:59.580440: step: 2060/530, loss: 0.0020840431097894907 2023-01-22 20:26:00.677945: step: 2064/530, loss: 0.00027094673714600503 2023-01-22 20:26:01.759300: step: 2068/530, loss: 0.000147123821079731 2023-01-22 20:26:02.839218: step: 2072/530, loss: 0.006090828217566013 2023-01-22 20:26:03.938400: step: 2076/530, loss: 0.009165171533823013 2023-01-22 20:26:05.000328: step: 2080/530, loss: 0.0060962350107729435 2023-01-22 20:26:06.085941: step: 2084/530, loss: 5.152806352271e-06 2023-01-22 20:26:07.149272: step: 2088/530, loss: 0.007182287517935038 2023-01-22 20:26:08.226099: step: 2092/530, loss: 0.004165596794337034 2023-01-22 20:26:09.302533: step: 2096/530, loss: 0.001052184379659593 2023-01-22 20:26:10.381826: step: 2100/530, loss: 0.007389001548290253 2023-01-22 20:26:11.468137: step: 2104/530, loss: 0.0018403733847662807 2023-01-22 20:26:12.528144: step: 2108/530, loss: 1.4677470971946605e-07 2023-01-22 20:26:13.604006: step: 2112/530, loss: 0.00014616147382184863 2023-01-22 20:26:14.680548: step: 2116/530, loss: 0.000502644048538059 2023-01-22 20:26:15.750694: step: 2120/530, loss: 0.002124864375218749 ================================================== Loss: 0.003 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3405777502606882, 'r': 0.35414915966386556, 'f1': 0.3472308970099668}, 'combined': 0.2558543451652387, 'stategy': 1, 'epoch': 16} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33241601408594385, 'r': 0.28408252835831405, 'f1': 0.3063545985816058}, 'combined': 0.19026232964541834, 'stategy': 1, 'epoch': 16} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3489662268453928, 'r': 0.3403579517998708, 'f1': 0.3446083392863245}, 'combined': 0.2539219342109759, 'stategy': 1, 'epoch': 16} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3189445718257113, 'r': 0.28487334160100625, 'f1': 0.30094769943429184}, 'combined': 0.18690436070129704, 'stategy': 1, 'epoch': 16} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3418776959829853, 'r': 0.3256595889629196, 'f1': 0.3335716295110954}, 'combined': 0.24578962174501767, 'stategy': 1, 'epoch': 16} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34412984191639157, 'r': 0.29215366638509055, 'f1': 0.3160188617705251}, 'combined': 0.19626434573116822, 'stategy': 1, 'epoch': 16} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 16} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.38636363636363635, 'r': 0.5543478260869565, 'f1': 0.4553571428571429}, 'combined': 0.22767857142857145, 'stategy': 1, 'epoch': 16} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 16} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 17 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 20:28:43.275888: step: 4/530, loss: 0.0034808169584721327 2023-01-22 20:28:44.368525: step: 8/530, loss: 0.0018997406587004662 2023-01-22 20:28:45.451265: step: 12/530, loss: 0.002144439844414592 2023-01-22 20:28:46.523279: step: 16/530, loss: 3.552175985532813e-05 2023-01-22 20:28:47.621240: step: 20/530, loss: 0.015589152462780476 2023-01-22 20:28:48.712224: step: 24/530, loss: 0.0011679998133331537 2023-01-22 20:28:49.809153: step: 28/530, loss: 0.0056754183024168015 2023-01-22 20:28:50.923957: step: 32/530, loss: 0.0048375255428254604 2023-01-22 20:28:51.996811: step: 36/530, loss: 0.0049126893281936646 2023-01-22 20:28:53.089889: step: 40/530, loss: 0.008735156618058681 2023-01-22 20:28:54.202528: step: 44/530, loss: 0.000172492626006715 2023-01-22 20:28:55.302795: step: 48/530, loss: 0.0001775828714016825 2023-01-22 20:28:56.403483: step: 52/530, loss: 0.0001304171746596694 2023-01-22 20:28:57.501875: step: 56/530, loss: 6.779382965760306e-05 2023-01-22 20:28:58.624292: step: 60/530, loss: 0.0010022937785834074 2023-01-22 20:28:59.719345: step: 64/530, loss: 0.0010771224042400718 2023-01-22 20:29:00.800973: step: 68/530, loss: 1.5661638826713897e-05 2023-01-22 20:29:01.906234: step: 72/530, loss: 0.001393350656144321 2023-01-22 20:29:03.008526: step: 76/530, loss: 0.002266770461574197 2023-01-22 20:29:04.113640: step: 80/530, loss: 1.681139474385418e-05 2023-01-22 20:29:05.196815: step: 84/530, loss: 0.0007144093397073448 2023-01-22 20:29:06.275350: step: 88/530, loss: 0.001190351671539247 2023-01-22 20:29:07.357105: step: 92/530, loss: 0.0004423519130796194 2023-01-22 20:29:08.450958: step: 96/530, loss: 0.0002996137482114136 2023-01-22 20:29:09.527339: step: 100/530, loss: 0.010776826180517673 2023-01-22 20:29:10.607885: step: 104/530, loss: 0.0009892707457765937 2023-01-22 20:29:11.724938: step: 108/530, loss: 0.003703233553096652 2023-01-22 20:29:12.805219: step: 112/530, loss: 0.004948604851961136 2023-01-22 20:29:13.881721: step: 116/530, loss: 3.733527762506128e-07 2023-01-22 20:29:14.952887: step: 120/530, loss: 0.004020960070192814 2023-01-22 20:29:16.033401: step: 124/530, loss: 0.0008976784883998334 2023-01-22 20:29:17.118333: step: 128/530, loss: 0.0017104309517890215 2023-01-22 20:29:18.215854: step: 132/530, loss: 0.0011665651109069586 2023-01-22 20:29:19.294117: step: 136/530, loss: 7.510670548072085e-05 2023-01-22 20:29:20.389936: step: 140/530, loss: 0.006148394662886858 2023-01-22 20:29:21.475380: step: 144/530, loss: 0.003674423089250922 2023-01-22 20:29:22.540666: step: 148/530, loss: 0.005385248456150293 2023-01-22 20:29:23.638378: step: 152/530, loss: 0.006293687969446182 2023-01-22 20:29:24.716745: step: 156/530, loss: 0.0004134675255045295 2023-01-22 20:29:25.795160: step: 160/530, loss: 0.0027773447800427675 2023-01-22 20:29:26.879823: step: 164/530, loss: 0.03866887837648392 2023-01-22 20:29:27.979662: step: 168/530, loss: 0.0017375019378960133 2023-01-22 20:29:29.065513: step: 172/530, loss: 0.001592339831404388 2023-01-22 20:29:30.161440: step: 176/530, loss: 0.012710786424577236 2023-01-22 20:29:31.259586: step: 180/530, loss: 0.02182740904390812 2023-01-22 20:29:32.351691: step: 184/530, loss: 7.350520900217816e-05 2023-01-22 20:29:33.443065: step: 188/530, loss: 0.007247790694236755 2023-01-22 20:29:34.528293: step: 192/530, loss: 0.0032906096894294024 2023-01-22 20:29:35.618801: step: 196/530, loss: 0.0011998474365100265 2023-01-22 20:29:36.691823: step: 200/530, loss: 0.002117785392329097 2023-01-22 20:29:37.779259: step: 204/530, loss: 0.0002837668580468744 2023-01-22 20:29:38.893571: step: 208/530, loss: 0.0007688378682360053 2023-01-22 20:29:39.996678: step: 212/530, loss: 7.450579597723106e-10 2023-01-22 20:29:41.085937: step: 216/530, loss: 0.0013182366965338588 2023-01-22 20:29:42.150890: step: 220/530, loss: 0.0015739495866000652 2023-01-22 20:29:43.228083: step: 224/530, loss: 0.00012653223529923707 2023-01-22 20:29:44.329326: step: 228/530, loss: 0.0036604790948331356 2023-01-22 20:29:45.414452: step: 232/530, loss: 0.0034920531325042248 2023-01-22 20:29:46.485705: step: 236/530, loss: 0.00047044819802977145 2023-01-22 20:29:47.563078: step: 240/530, loss: 0.0003440014261286706 2023-01-22 20:29:48.636372: step: 244/530, loss: 0.006319877225905657 2023-01-22 20:29:49.727683: step: 248/530, loss: 0.0071740709245204926 2023-01-22 20:29:50.826837: step: 252/530, loss: 0.006342435721307993 2023-01-22 20:29:51.906800: step: 256/530, loss: 8.749008884478826e-06 2023-01-22 20:29:52.998490: step: 260/530, loss: 0.0001330746745225042 2023-01-22 20:29:54.069958: step: 264/530, loss: 0.001663908245973289 2023-01-22 20:29:55.187679: step: 268/530, loss: 0.0046469164080917835 2023-01-22 20:29:56.289868: step: 272/530, loss: 0.0023898312356323004 2023-01-22 20:29:57.380033: step: 276/530, loss: 0.0023684173356741667 2023-01-22 20:29:58.462039: step: 280/530, loss: 0.004610610194504261 2023-01-22 20:29:59.526749: step: 284/530, loss: 4.1727969801286235e-05 2023-01-22 20:30:00.621078: step: 288/530, loss: 0.0047868299297988415 2023-01-22 20:30:01.719022: step: 292/530, loss: 0.0014362818328663707 2023-01-22 20:30:02.834759: step: 296/530, loss: 0.013098294846713543 2023-01-22 20:30:03.934218: step: 300/530, loss: 0.000280734762782231 2023-01-22 20:30:05.029243: step: 304/530, loss: 0.0012219070922583342 2023-01-22 20:30:06.101910: step: 308/530, loss: 0.0007669119513593614 2023-01-22 20:30:07.204404: step: 312/530, loss: 1.3020689038967248e-05 2023-01-22 20:30:08.293303: step: 316/530, loss: 0.009945424273610115 2023-01-22 20:30:09.366877: step: 320/530, loss: 0.0043518198654055595 2023-01-22 20:30:10.451957: step: 324/530, loss: 0.00011538516264408827 2023-01-22 20:30:11.519119: step: 328/530, loss: 9.029215289046988e-05 2023-01-22 20:30:12.621219: step: 332/530, loss: 0.0002399556979071349 2023-01-22 20:30:13.700930: step: 336/530, loss: 0.007572166156023741 2023-01-22 20:30:14.763447: step: 340/530, loss: 0.0001940718648256734 2023-01-22 20:30:15.840813: step: 344/530, loss: 0.0036341894883662462 2023-01-22 20:30:16.925231: step: 348/530, loss: 0.000201019603991881 2023-01-22 20:30:18.016488: step: 352/530, loss: 0.0007032624562270939 2023-01-22 20:30:19.101813: step: 356/530, loss: 0.000679805816616863 2023-01-22 20:30:20.198704: step: 360/530, loss: 0.002421688986942172 2023-01-22 20:30:21.303841: step: 364/530, loss: 0.015139338560402393 2023-01-22 20:30:22.382926: step: 368/530, loss: 0.0007957784691825509 2023-01-22 20:30:23.463359: step: 372/530, loss: 0.0026553990319371223 2023-01-22 20:30:24.558319: step: 376/530, loss: 0.0024460679851472378 2023-01-22 20:30:25.666281: step: 380/530, loss: 0.0027359339874237776 2023-01-22 20:30:26.757869: step: 384/530, loss: 0.005867304280400276 2023-01-22 20:30:27.876508: step: 388/530, loss: 0.004757972899824381 2023-01-22 20:30:28.940445: step: 392/530, loss: 4.183263808954507e-05 2023-01-22 20:30:30.026005: step: 396/530, loss: 2.556456092861481e-05 2023-01-22 20:30:31.115331: step: 400/530, loss: 0.0015227266121655703 2023-01-22 20:30:32.217604: step: 404/530, loss: 6.342248525470495e-05 2023-01-22 20:30:33.290292: step: 408/530, loss: 0.0014097301755100489 2023-01-22 20:30:34.360537: step: 412/530, loss: 0.00048197878641076386 2023-01-22 20:30:35.443430: step: 416/530, loss: 0.002813866129145026 2023-01-22 20:30:36.542302: step: 420/530, loss: 2.2102161892689764e-05 2023-01-22 20:30:37.626358: step: 424/530, loss: 0.0030066766776144505 2023-01-22 20:30:38.704094: step: 428/530, loss: 0.00028449707315303385 2023-01-22 20:30:39.797042: step: 432/530, loss: 0.0026070221792906523 2023-01-22 20:30:40.881920: step: 436/530, loss: 0.0037741651758551598 2023-01-22 20:30:41.949804: step: 440/530, loss: 0.002109530149027705 2023-01-22 20:30:43.010927: step: 444/530, loss: 0.002431826665997505 2023-01-22 20:30:44.106631: step: 448/530, loss: 0.0010731664951890707 2023-01-22 20:30:45.174417: step: 452/530, loss: 0.0021129047963768244 2023-01-22 20:30:46.278899: step: 456/530, loss: 0.004795182030647993 2023-01-22 20:30:47.369202: step: 460/530, loss: 0.00022948479454498738 2023-01-22 20:30:48.477046: step: 464/530, loss: 0.0052319359965622425 2023-01-22 20:30:49.568331: step: 468/530, loss: 0.0003693769103847444 2023-01-22 20:30:50.665290: step: 472/530, loss: 0.017211947590112686 2023-01-22 20:30:51.746872: step: 476/530, loss: 0.01170080341398716 2023-01-22 20:30:52.859133: step: 480/530, loss: 0.0010586120188236237 2023-01-22 20:30:53.923244: step: 484/530, loss: 0.00043138189357705414 2023-01-22 20:30:54.983450: step: 488/530, loss: 0.003336365567520261 2023-01-22 20:30:56.104049: step: 492/530, loss: 0.0015763710252940655 2023-01-22 20:30:57.204872: step: 496/530, loss: 0.0006782274576835334 2023-01-22 20:30:58.282486: step: 500/530, loss: 2.6213465389446355e-05 2023-01-22 20:30:59.381846: step: 504/530, loss: 0.003002919489517808 2023-01-22 20:31:00.463707: step: 508/530, loss: 0.0065875910222530365 2023-01-22 20:31:01.542323: step: 512/530, loss: 0.0010819419985637069 2023-01-22 20:31:02.642561: step: 516/530, loss: 0.0004035773454234004 2023-01-22 20:31:03.726477: step: 520/530, loss: 0.0004645856097340584 2023-01-22 20:31:04.836444: step: 524/530, loss: 0.0009050294174812734 2023-01-22 20:31:05.922053: step: 528/530, loss: 3.505948552628979e-05 2023-01-22 20:31:06.998953: step: 532/530, loss: 0.0036793684121221304 2023-01-22 20:31:08.097989: step: 536/530, loss: 0.011716824024915695 2023-01-22 20:31:09.200975: step: 540/530, loss: 0.007206967566162348 2023-01-22 20:31:10.281819: step: 544/530, loss: 0.009051250293850899 2023-01-22 20:31:11.375770: step: 548/530, loss: 0.00013011842384003103 2023-01-22 20:31:12.471914: step: 552/530, loss: 5.353549113351619e-06 2023-01-22 20:31:13.554156: step: 556/530, loss: 0.0006024892209097743 2023-01-22 20:31:14.671526: step: 560/530, loss: 0.004242273513227701 2023-01-22 20:31:15.762143: step: 564/530, loss: 0.00017575321544427425 2023-01-22 20:31:16.844421: step: 568/530, loss: 0.00044714190880768 2023-01-22 20:31:17.935890: step: 572/530, loss: 0.0032757045701146126 2023-01-22 20:31:19.009788: step: 576/530, loss: 0.000928366556763649 2023-01-22 20:31:20.095833: step: 580/530, loss: 0.0011983714066445827 2023-01-22 20:31:21.172344: step: 584/530, loss: 0.0004430399276316166 2023-01-22 20:31:22.244224: step: 588/530, loss: 0.003928348422050476 2023-01-22 20:31:23.322706: step: 592/530, loss: 3.2033615298132645e-06 2023-01-22 20:31:24.387853: step: 596/530, loss: 0.0027793985791504383 2023-01-22 20:31:25.462682: step: 600/530, loss: 0.003533866023644805 2023-01-22 20:31:26.557981: step: 604/530, loss: 0.0006644558743573725 2023-01-22 20:31:27.631396: step: 608/530, loss: 0.00011873383482452482 2023-01-22 20:31:28.726472: step: 612/530, loss: 0.0005890467436984181 2023-01-22 20:31:29.836444: step: 616/530, loss: 0.004688585177063942 2023-01-22 20:31:30.934633: step: 620/530, loss: 0.0012207345571368933 2023-01-22 20:31:32.022473: step: 624/530, loss: 0.0003617858747020364 2023-01-22 20:31:33.106386: step: 628/530, loss: 0.0005774375167675316 2023-01-22 20:31:34.185716: step: 632/530, loss: 0.00032479382934980094 2023-01-22 20:31:35.267952: step: 636/530, loss: 0.00042347575072199106 2023-01-22 20:31:36.348025: step: 640/530, loss: 0.0021121923346072435 2023-01-22 20:31:37.417147: step: 644/530, loss: 2.1308244413376087e-06 2023-01-22 20:31:38.493560: step: 648/530, loss: 0.0008518691174685955 2023-01-22 20:31:39.580566: step: 652/530, loss: 0.006940099410712719 2023-01-22 20:31:40.682924: step: 656/530, loss: 0.0061613707803189754 2023-01-22 20:31:41.801468: step: 660/530, loss: 0.0011795359896495938 2023-01-22 20:31:42.867841: step: 664/530, loss: 0.0006289535667747259 2023-01-22 20:31:43.961581: step: 668/530, loss: 0.020524267107248306 2023-01-22 20:31:45.041397: step: 672/530, loss: 0.0005878504598513246 2023-01-22 20:31:46.109914: step: 676/530, loss: 0.00021731419838033617 2023-01-22 20:31:47.188411: step: 680/530, loss: 0.0005742923240177333 2023-01-22 20:31:48.261061: step: 684/530, loss: 0.0007030502310954034 2023-01-22 20:31:49.363532: step: 688/530, loss: 0.003954659681767225 2023-01-22 20:31:50.437691: step: 692/530, loss: 0.00017020836821757257 2023-01-22 20:31:51.510075: step: 696/530, loss: 0.0005727845709770918 2023-01-22 20:31:52.624661: step: 700/530, loss: 0.0015427382895722985 2023-01-22 20:31:53.705158: step: 704/530, loss: 0.0013018085155636072 2023-01-22 20:31:54.804865: step: 708/530, loss: 0.0025435348507016897 2023-01-22 20:31:55.907270: step: 712/530, loss: 0.001990637741982937 2023-01-22 20:31:57.011583: step: 716/530, loss: 0.0019166427664458752 2023-01-22 20:31:58.111263: step: 720/530, loss: 0.001076818909496069 2023-01-22 20:31:59.203691: step: 724/530, loss: 0.0005725253722630441 2023-01-22 20:32:00.292557: step: 728/530, loss: 0.0002605449699331075 2023-01-22 20:32:01.378916: step: 732/530, loss: 0.004124950151890516 2023-01-22 20:32:02.479953: step: 736/530, loss: 0.004425158724188805 2023-01-22 20:32:03.568813: step: 740/530, loss: 0.0020203827880322933 2023-01-22 20:32:04.665394: step: 744/530, loss: 0.0019976019393652678 2023-01-22 20:32:05.728395: step: 748/530, loss: 2.617143400129862e-05 2023-01-22 20:32:06.781041: step: 752/530, loss: 0.0009109968086704612 2023-01-22 20:32:07.869377: step: 756/530, loss: 0.007275097072124481 2023-01-22 20:32:08.977247: step: 760/530, loss: 0.005125010851770639 2023-01-22 20:32:10.093467: step: 764/530, loss: 0.010058313608169556 2023-01-22 20:32:11.173886: step: 768/530, loss: 0.0005352284642867744 2023-01-22 20:32:12.274661: step: 772/530, loss: 1.1774956874432974e-05 2023-01-22 20:32:13.382138: step: 776/530, loss: 0.012429129332304 2023-01-22 20:32:14.474596: step: 780/530, loss: 0.001796990865841508 2023-01-22 20:32:15.573267: step: 784/530, loss: 0.0007893404690548778 2023-01-22 20:32:16.664136: step: 788/530, loss: 0.00015968702791724354 2023-01-22 20:32:17.730302: step: 792/530, loss: 0.00026670395163819194 2023-01-22 20:32:18.840292: step: 796/530, loss: 3.1496165320277214e-05 2023-01-22 20:32:19.904783: step: 800/530, loss: 0.002667137887328863 2023-01-22 20:32:20.979311: step: 804/530, loss: 0.00022116818581707776 2023-01-22 20:32:22.065191: step: 808/530, loss: 0.0009400615817867219 2023-01-22 20:32:23.142395: step: 812/530, loss: 0.002219259273260832 2023-01-22 20:32:24.230097: step: 816/530, loss: 0.007406312972307205 2023-01-22 20:32:25.310128: step: 820/530, loss: 0.0002881985856220126 2023-01-22 20:32:26.388545: step: 824/530, loss: 0.0003620398638304323 2023-01-22 20:32:27.466376: step: 828/530, loss: 0.0003469117218628526 2023-01-22 20:32:28.567650: step: 832/530, loss: 0.0004634088254533708 2023-01-22 20:32:29.666817: step: 836/530, loss: 0.0006332676275633276 2023-01-22 20:32:30.738189: step: 840/530, loss: 0.0031147710978984833 2023-01-22 20:32:31.816557: step: 844/530, loss: 0.0006185956299304962 2023-01-22 20:32:32.896184: step: 848/530, loss: 0.0004379435849841684 2023-01-22 20:32:33.980343: step: 852/530, loss: 1.5504343537031673e-05 2023-01-22 20:32:35.054722: step: 856/530, loss: 0.00041991108446381986 2023-01-22 20:32:36.134808: step: 860/530, loss: 0.0004991637542843819 2023-01-22 20:32:37.234114: step: 864/530, loss: 0.006516980938613415 2023-01-22 20:32:38.302431: step: 868/530, loss: 0.0015845214948058128 2023-01-22 20:32:39.367428: step: 872/530, loss: 3.6916717363055795e-05 2023-01-22 20:32:40.458224: step: 876/530, loss: 0.001291735447011888 2023-01-22 20:32:41.552918: step: 880/530, loss: 0.0018934139516204596 2023-01-22 20:32:42.647136: step: 884/530, loss: 0.0011029306333512068 2023-01-22 20:32:43.755529: step: 888/530, loss: 0.00016446737572550774 2023-01-22 20:32:44.860164: step: 892/530, loss: 0.0022822474129498005 2023-01-22 20:32:45.953391: step: 896/530, loss: 0.0025672889314591885 2023-01-22 20:32:47.057594: step: 900/530, loss: 0.0005073066568002105 2023-01-22 20:32:48.143440: step: 904/530, loss: 0.002016980666667223 2023-01-22 20:32:49.213141: step: 908/530, loss: 0.0032625554595142603 2023-01-22 20:32:50.286268: step: 912/530, loss: 0.0012266021221876144 2023-01-22 20:32:51.369662: step: 916/530, loss: 0.010914864018559456 2023-01-22 20:32:52.453819: step: 920/530, loss: 0.005537052173167467 2023-01-22 20:32:53.566756: step: 924/530, loss: 0.0038829047698527575 2023-01-22 20:32:54.651475: step: 928/530, loss: 0.0007737540872767568 2023-01-22 20:32:55.733319: step: 932/530, loss: 0.0021450240164995193 2023-01-22 20:32:56.842593: step: 936/530, loss: 0.010253152810037136 2023-01-22 20:32:57.933914: step: 940/530, loss: 0.0017688992666080594 2023-01-22 20:32:59.012407: step: 944/530, loss: 0.00901026651263237 2023-01-22 20:33:00.099151: step: 948/530, loss: 0.001152405864559114 2023-01-22 20:33:01.193646: step: 952/530, loss: 0.0035532780457288027 2023-01-22 20:33:02.287372: step: 956/530, loss: 0.006383465602993965 2023-01-22 20:33:03.382833: step: 960/530, loss: 0.0009306279825977981 2023-01-22 20:33:04.446523: step: 964/530, loss: 0.00040455852285958827 2023-01-22 20:33:05.531752: step: 968/530, loss: 0.00017179954738821834 2023-01-22 20:33:06.622694: step: 972/530, loss: 0.0007859966717660427 2023-01-22 20:33:07.715674: step: 976/530, loss: 2.7183359634364024e-05 2023-01-22 20:33:08.796309: step: 980/530, loss: 8.094224540400319e-06 2023-01-22 20:33:09.878292: step: 984/530, loss: 0.007210175506770611 2023-01-22 20:33:10.957406: step: 988/530, loss: 0.0008191528613679111 2023-01-22 20:33:12.040708: step: 992/530, loss: 0.003515303134918213 2023-01-22 20:33:13.148015: step: 996/530, loss: 0.0017188818892464042 2023-01-22 20:33:14.253560: step: 1000/530, loss: 0.0029762466438114643 2023-01-22 20:33:15.344042: step: 1004/530, loss: 5.2656214393209666e-05 2023-01-22 20:33:16.434365: step: 1008/530, loss: 0.0002444193232804537 2023-01-22 20:33:17.519369: step: 1012/530, loss: 0.009162704460322857 2023-01-22 20:33:18.606297: step: 1016/530, loss: 0.005453592631965876 2023-01-22 20:33:19.694287: step: 1020/530, loss: 0.0015048424247652292 2023-01-22 20:33:20.765319: step: 1024/530, loss: 0.005734096746891737 2023-01-22 20:33:21.837302: step: 1028/530, loss: 0.017995981499552727 2023-01-22 20:33:22.915914: step: 1032/530, loss: 0.004703155253082514 2023-01-22 20:33:23.989488: step: 1036/530, loss: 0.005158161278814077 2023-01-22 20:33:25.084891: step: 1040/530, loss: 0.00500600878149271 2023-01-22 20:33:26.183065: step: 1044/530, loss: 0.0024152242112904787 2023-01-22 20:33:27.255915: step: 1048/530, loss: 0.01518117357045412 2023-01-22 20:33:28.339211: step: 1052/530, loss: 0.007749086711555719 2023-01-22 20:33:29.436296: step: 1056/530, loss: 0.0002087807224597782 2023-01-22 20:33:30.541663: step: 1060/530, loss: 0.00011596120020840317 2023-01-22 20:33:31.623098: step: 1064/530, loss: 0.014991536736488342 2023-01-22 20:33:32.719280: step: 1068/530, loss: 0.0021489278879016638 2023-01-22 20:33:33.784444: step: 1072/530, loss: 0.0007681234274059534 2023-01-22 20:33:34.855114: step: 1076/530, loss: 0.0020727748051285744 2023-01-22 20:33:35.934333: step: 1080/530, loss: 0.0010961415246129036 2023-01-22 20:33:37.014598: step: 1084/530, loss: 7.461431778210681e-06 2023-01-22 20:33:38.103072: step: 1088/530, loss: 0.00016314793901983649 2023-01-22 20:33:39.199476: step: 1092/530, loss: 0.007404114585369825 2023-01-22 20:33:40.277418: step: 1096/530, loss: 0.004782171454280615 2023-01-22 20:33:41.381068: step: 1100/530, loss: 1.4867505342408549e-05 2023-01-22 20:33:42.476077: step: 1104/530, loss: 0.0091378940269351 2023-01-22 20:33:43.573883: step: 1108/530, loss: 0.016494134441018105 2023-01-22 20:33:44.681511: step: 1112/530, loss: 0.006772821303457022 2023-01-22 20:33:45.767450: step: 1116/530, loss: 0.0002630894596222788 2023-01-22 20:33:46.838864: step: 1120/530, loss: 0.0004232735082041472 2023-01-22 20:33:47.928059: step: 1124/530, loss: 0.0010103174718096852 2023-01-22 20:33:48.997412: step: 1128/530, loss: 0.002713279565796256 2023-01-22 20:33:50.083230: step: 1132/530, loss: 0.006466195452958345 2023-01-22 20:33:51.183932: step: 1136/530, loss: 0.0029782913625240326 2023-01-22 20:33:52.258096: step: 1140/530, loss: 0.00022127982811070979 2023-01-22 20:33:53.346162: step: 1144/530, loss: 0.009942966513335705 2023-01-22 20:33:54.421713: step: 1148/530, loss: 0.012226640246808529 2023-01-22 20:33:55.516415: step: 1152/530, loss: 0.0041862293146550655 2023-01-22 20:33:56.594466: step: 1156/530, loss: 0.018717629835009575 2023-01-22 20:33:57.678592: step: 1160/530, loss: 0.001450053765438497 2023-01-22 20:33:58.758648: step: 1164/530, loss: 0.0034925302024930716 2023-01-22 20:33:59.840356: step: 1168/530, loss: 0.003703951369971037 2023-01-22 20:34:00.949721: step: 1172/530, loss: 0.0004603114794008434 2023-01-22 20:34:02.024804: step: 1176/530, loss: 5.0427173846401274e-05 2023-01-22 20:34:03.100393: step: 1180/530, loss: 0.003371449885889888 2023-01-22 20:34:04.187194: step: 1184/530, loss: 0.0032470007427036762 2023-01-22 20:34:05.299105: step: 1188/530, loss: 0.0021416267845779657 2023-01-22 20:34:06.362282: step: 1192/530, loss: 0.0005429533775895834 2023-01-22 20:34:07.440944: step: 1196/530, loss: 0.00465348968282342 2023-01-22 20:34:08.534225: step: 1200/530, loss: 0.001009253435768187 2023-01-22 20:34:09.634081: step: 1204/530, loss: 0.030110033228993416 2023-01-22 20:34:10.715326: step: 1208/530, loss: 0.00037223813706077635 2023-01-22 20:34:11.810215: step: 1212/530, loss: 0.0025553249288350344 2023-01-22 20:34:12.897754: step: 1216/530, loss: 0.006032499950379133 2023-01-22 20:34:13.985447: step: 1220/530, loss: 4.047404581797309e-05 2023-01-22 20:34:15.080206: step: 1224/530, loss: 0.000852379307616502 2023-01-22 20:34:16.172428: step: 1228/530, loss: 7.200497930170968e-05 2023-01-22 20:34:17.281316: step: 1232/530, loss: 0.0014304049545899034 2023-01-22 20:34:18.360386: step: 1236/530, loss: 0.004008917603641748 2023-01-22 20:34:19.445791: step: 1240/530, loss: 0.007127148099243641 2023-01-22 20:34:20.544898: step: 1244/530, loss: 0.01821468025445938 2023-01-22 20:34:21.616038: step: 1248/530, loss: 1.0921195098489989e-05 2023-01-22 20:34:22.690620: step: 1252/530, loss: 0.028740478679537773 2023-01-22 20:34:23.776520: step: 1256/530, loss: 1.7588701666682027e-05 2023-01-22 20:34:24.863866: step: 1260/530, loss: 0.002110525267198682 2023-01-22 20:34:25.948721: step: 1264/530, loss: 0.001676070154644549 2023-01-22 20:34:27.054692: step: 1268/530, loss: 0.004911639727652073 2023-01-22 20:34:28.135750: step: 1272/530, loss: 0.001979612745344639 2023-01-22 20:34:29.211422: step: 1276/530, loss: 0.000550492259208113 2023-01-22 20:34:30.315721: step: 1280/530, loss: 0.004401945509016514 2023-01-22 20:34:31.397664: step: 1284/530, loss: 0.004540633875876665 2023-01-22 20:34:32.493816: step: 1288/530, loss: 0.0009680314688012004 2023-01-22 20:34:33.571165: step: 1292/530, loss: 0.003358195535838604 2023-01-22 20:34:34.630691: step: 1296/530, loss: 0.00045573891839012504 2023-01-22 20:34:35.744464: step: 1300/530, loss: 0.0012548742815852165 2023-01-22 20:34:36.825481: step: 1304/530, loss: 0.010721873492002487 2023-01-22 20:34:37.887467: step: 1308/530, loss: 0.00015493064711336046 2023-01-22 20:34:38.974514: step: 1312/530, loss: 0.0010917402105405927 2023-01-22 20:34:40.064602: step: 1316/530, loss: 0.0031570803839713335 2023-01-22 20:34:41.160006: step: 1320/530, loss: 0.008043994195759296 2023-01-22 20:34:42.252986: step: 1324/530, loss: 0.0012500904267653823 2023-01-22 20:34:43.325016: step: 1328/530, loss: 0.018676310777664185 2023-01-22 20:34:44.406028: step: 1332/530, loss: 4.9612197472015396e-05 2023-01-22 20:34:45.469844: step: 1336/530, loss: 0.006168786436319351 2023-01-22 20:34:46.552061: step: 1340/530, loss: 0.0004904735833406448 2023-01-22 20:34:47.633461: step: 1344/530, loss: 0.012654002755880356 2023-01-22 20:34:48.718165: step: 1348/530, loss: 0.0017332867719233036 2023-01-22 20:34:49.804688: step: 1352/530, loss: 0.005420266184955835 2023-01-22 20:34:50.882971: step: 1356/530, loss: 0.002804506104439497 2023-01-22 20:34:51.956791: step: 1360/530, loss: 0.005558534525334835 2023-01-22 20:34:53.061179: step: 1364/530, loss: 0.0014608752680942416 2023-01-22 20:34:54.138550: step: 1368/530, loss: 0.0015148414531722665 2023-01-22 20:34:55.220368: step: 1372/530, loss: 0.010762615129351616 2023-01-22 20:34:56.312610: step: 1376/530, loss: 0.002828380558639765 2023-01-22 20:34:57.408970: step: 1380/530, loss: 0.0029202981386333704 2023-01-22 20:34:58.476067: step: 1384/530, loss: 0.00023294426500797272 2023-01-22 20:34:59.573873: step: 1388/530, loss: 8.773962326813489e-05 2023-01-22 20:35:00.661851: step: 1392/530, loss: 0.003974469378590584 2023-01-22 20:35:01.742839: step: 1396/530, loss: 0.0005275339353829622 2023-01-22 20:35:02.837169: step: 1400/530, loss: 0.027599824592471123 2023-01-22 20:35:03.921872: step: 1404/530, loss: 0.0002456007932778448 2023-01-22 20:35:05.010051: step: 1408/530, loss: 0.00014337974425870925 2023-01-22 20:35:06.086679: step: 1412/530, loss: 0.0002336033940082416 2023-01-22 20:35:07.161828: step: 1416/530, loss: 3.7831738154636696e-05 2023-01-22 20:35:08.288621: step: 1420/530, loss: 0.005172450095415115 2023-01-22 20:35:09.367889: step: 1424/530, loss: 0.0027136385906487703 2023-01-22 20:35:10.468869: step: 1428/530, loss: 0.002548440359532833 2023-01-22 20:35:11.568016: step: 1432/530, loss: 0.04339786246418953 2023-01-22 20:35:12.649366: step: 1436/530, loss: 0.008410529233515263 2023-01-22 20:35:13.719005: step: 1440/530, loss: 0.008311120793223381 2023-01-22 20:35:14.807294: step: 1444/530, loss: 0.005648605991154909 2023-01-22 20:35:15.889602: step: 1448/530, loss: 0.00011642611934803426 2023-01-22 20:35:17.007134: step: 1452/530, loss: 0.0015221787616610527 2023-01-22 20:35:18.099794: step: 1456/530, loss: 0.002900173654779792 2023-01-22 20:35:19.199763: step: 1460/530, loss: 0.006394024472683668 2023-01-22 20:35:20.294592: step: 1464/530, loss: 0.0012230782303959131 2023-01-22 20:35:21.358882: step: 1468/530, loss: 0.001762936357408762 2023-01-22 20:35:22.436515: step: 1472/530, loss: 8.360754577552143e-07 2023-01-22 20:35:23.527619: step: 1476/530, loss: 0.002977677620947361 2023-01-22 20:35:24.604911: step: 1480/530, loss: 0.0016329261707141995 2023-01-22 20:35:25.685926: step: 1484/530, loss: 0.00017170999490190297 2023-01-22 20:35:26.764302: step: 1488/530, loss: 0.0024347316939383745 2023-01-22 20:35:27.824558: step: 1492/530, loss: 6.549506360897794e-05 2023-01-22 20:35:28.921637: step: 1496/530, loss: 0.0002729482657741755 2023-01-22 20:35:30.002401: step: 1500/530, loss: 0.012052626349031925 2023-01-22 20:35:31.084824: step: 1504/530, loss: 0.014203791506588459 2023-01-22 20:35:32.155912: step: 1508/530, loss: 0.0004855323350057006 2023-01-22 20:35:33.250417: step: 1512/530, loss: 8.177094423444942e-05 2023-01-22 20:35:34.337586: step: 1516/530, loss: 0.007196275983005762 2023-01-22 20:35:35.435387: step: 1520/530, loss: 0.0009334517526440322 2023-01-22 20:35:36.518577: step: 1524/530, loss: 0.0005425841081887484 2023-01-22 20:35:37.576899: step: 1528/530, loss: 0.0008515716763213277 2023-01-22 20:35:38.654321: step: 1532/530, loss: 0.0029152731876820326 2023-01-22 20:35:39.719647: step: 1536/530, loss: 0.0028622474055737257 2023-01-22 20:35:40.814582: step: 1540/530, loss: 0.0027356904465705156 2023-01-22 20:35:41.904957: step: 1544/530, loss: 0.0036398330703377724 2023-01-22 20:35:42.987334: step: 1548/530, loss: 0.00200962508097291 2023-01-22 20:35:44.065183: step: 1552/530, loss: 0.00031526293605566025 2023-01-22 20:35:45.162309: step: 1556/530, loss: 0.0007602398400194943 2023-01-22 20:35:46.247774: step: 1560/530, loss: 0.009113945998251438 2023-01-22 20:35:47.337175: step: 1564/530, loss: 0.004607424605637789 2023-01-22 20:35:48.425290: step: 1568/530, loss: 9.279806545237079e-05 2023-01-22 20:35:49.491780: step: 1572/530, loss: 0.0029641669243574142 2023-01-22 20:35:50.603378: step: 1576/530, loss: 0.00010851237311726436 2023-01-22 20:35:51.698469: step: 1580/530, loss: 0.003018486313521862 2023-01-22 20:35:52.767674: step: 1584/530, loss: 0.0002792272134684026 2023-01-22 20:35:53.889844: step: 1588/530, loss: 0.00010053430742118508 2023-01-22 20:35:54.979668: step: 1592/530, loss: 0.0003937681613024324 2023-01-22 20:35:56.058949: step: 1596/530, loss: 0.010704144835472107 2023-01-22 20:35:57.143762: step: 1600/530, loss: 5.881514880456962e-05 2023-01-22 20:35:58.244843: step: 1604/530, loss: 0.005205592606216669 2023-01-22 20:35:59.343466: step: 1608/530, loss: 0.0027847348246723413 2023-01-22 20:36:00.440410: step: 1612/530, loss: 0.00018132803961634636 2023-01-22 20:36:01.528969: step: 1616/530, loss: 0.009442429058253765 2023-01-22 20:36:02.612224: step: 1620/530, loss: 0.02821452170610428 2023-01-22 20:36:03.699207: step: 1624/530, loss: 0.00038336883881129324 2023-01-22 20:36:04.786150: step: 1628/530, loss: 1.556850111228414e-05 2023-01-22 20:36:05.867718: step: 1632/530, loss: 0.00011915427603526041 2023-01-22 20:36:06.974237: step: 1636/530, loss: 0.0033786995336413383 2023-01-22 20:36:08.050187: step: 1640/530, loss: 9.686307021183893e-05 2023-01-22 20:36:09.121614: step: 1644/530, loss: 0.0009107019286602736 2023-01-22 20:36:10.235902: step: 1648/530, loss: 0.010780328884720802 2023-01-22 20:36:11.332625: step: 1652/530, loss: 1.4698194718221202e-05 2023-01-22 20:36:12.430035: step: 1656/530, loss: 0.007394067943096161 2023-01-22 20:36:13.530861: step: 1660/530, loss: 0.0023417857009917498 2023-01-22 20:36:14.621500: step: 1664/530, loss: 0.004217495210468769 2023-01-22 20:36:15.707305: step: 1668/530, loss: 0.00412709079682827 2023-01-22 20:36:16.779170: step: 1672/530, loss: 0.0012540417956188321 2023-01-22 20:36:17.850076: step: 1676/530, loss: 0.0008241914911195636 2023-01-22 20:36:18.918409: step: 1680/530, loss: 0.0010481151985004544 2023-01-22 20:36:19.999142: step: 1684/530, loss: 0.0022604179102927446 2023-01-22 20:36:21.092271: step: 1688/530, loss: 0.0007706551696173847 2023-01-22 20:36:22.177594: step: 1692/530, loss: 0.001371414284221828 2023-01-22 20:36:23.287663: step: 1696/530, loss: 0.00046042041503824294 2023-01-22 20:36:24.356523: step: 1700/530, loss: 0.005168757401406765 2023-01-22 20:36:25.438261: step: 1704/530, loss: 4.6169079723767936e-05 2023-01-22 20:36:26.522188: step: 1708/530, loss: 0.0008091203635558486 2023-01-22 20:36:27.591175: step: 1712/530, loss: 0.001225824817083776 2023-01-22 20:36:28.687831: step: 1716/530, loss: 0.002943438710644841 2023-01-22 20:36:29.770769: step: 1720/530, loss: 0.0019306633621454239 2023-01-22 20:36:30.844704: step: 1724/530, loss: 0.0006289273151196539 2023-01-22 20:36:31.936000: step: 1728/530, loss: 0.0004547074204310775 2023-01-22 20:36:33.019996: step: 1732/530, loss: 0.003432940226048231 2023-01-22 20:36:34.093989: step: 1736/530, loss: 0.011345287784934044 2023-01-22 20:36:35.185640: step: 1740/530, loss: 0.0021766044665127993 2023-01-22 20:36:36.270061: step: 1744/530, loss: 0.0003303492267150432 2023-01-22 20:36:37.370050: step: 1748/530, loss: 0.00245128502137959 2023-01-22 20:36:38.468277: step: 1752/530, loss: 0.00047326594358310103 2023-01-22 20:36:39.567632: step: 1756/530, loss: 0.00010543585813138634 2023-01-22 20:36:40.647076: step: 1760/530, loss: 0.00010827576625160873 2023-01-22 20:36:41.727971: step: 1764/530, loss: 0.0006188526167534292 2023-01-22 20:36:42.804782: step: 1768/530, loss: 0.003043142845854163 2023-01-22 20:36:43.895229: step: 1772/530, loss: 0.0006010145880281925 2023-01-22 20:36:45.017874: step: 1776/530, loss: 0.006816300563514233 2023-01-22 20:36:46.096495: step: 1780/530, loss: 0.0022533806040883064 2023-01-22 20:36:47.180897: step: 1784/530, loss: 0.0029185237362980843 2023-01-22 20:36:48.254474: step: 1788/530, loss: 0.0009701751987449825 2023-01-22 20:36:49.334547: step: 1792/530, loss: 2.095879153785063e-06 2023-01-22 20:36:50.427912: step: 1796/530, loss: 0.0026495042257010937 2023-01-22 20:36:51.517556: step: 1800/530, loss: 0.001783812534995377 2023-01-22 20:36:52.593535: step: 1804/530, loss: 0.004000787157565355 2023-01-22 20:36:53.683633: step: 1808/530, loss: 0.02174878492951393 2023-01-22 20:36:54.746251: step: 1812/530, loss: 2.2332524167723022e-05 2023-01-22 20:36:55.842607: step: 1816/530, loss: 0.011863541789352894 2023-01-22 20:36:56.933327: step: 1820/530, loss: 0.005531518720090389 2023-01-22 20:36:58.017118: step: 1824/530, loss: 0.0023476574569940567 2023-01-22 20:36:59.130099: step: 1828/530, loss: 0.0008948675240390003 2023-01-22 20:37:00.222023: step: 1832/530, loss: 0.0019338495330885053 2023-01-22 20:37:01.284537: step: 1836/530, loss: 5.583491201832658e-06 2023-01-22 20:37:02.361827: step: 1840/530, loss: 0.00016705291636753827 2023-01-22 20:37:03.464528: step: 1844/530, loss: 0.0006547645898535848 2023-01-22 20:37:04.554553: step: 1848/530, loss: 7.919600466266274e-05 2023-01-22 20:37:05.643194: step: 1852/530, loss: 0.002055986085906625 2023-01-22 20:37:06.786283: step: 1856/530, loss: 0.0033276185858994722 2023-01-22 20:37:07.874920: step: 1860/530, loss: 9.616312308935449e-05 2023-01-22 20:37:08.978558: step: 1864/530, loss: 0.00048755662282928824 2023-01-22 20:37:10.058348: step: 1868/530, loss: 0.005983664188534021 2023-01-22 20:37:11.155342: step: 1872/530, loss: 0.002054516924545169 2023-01-22 20:37:12.295883: step: 1876/530, loss: 0.0007921885699033737 2023-01-22 20:37:13.373646: step: 1880/530, loss: 0.0007027360261417925 2023-01-22 20:37:14.453618: step: 1884/530, loss: 0.0013822525506839156 2023-01-22 20:37:15.558942: step: 1888/530, loss: 0.0022649893071502447 2023-01-22 20:37:16.640393: step: 1892/530, loss: 0.0004750127554871142 2023-01-22 20:37:17.717921: step: 1896/530, loss: 7.53599942981964e-06 2023-01-22 20:37:18.791763: step: 1900/530, loss: 0.0015178367029875517 2023-01-22 20:37:19.898083: step: 1904/530, loss: 0.00015136870206333697 2023-01-22 20:37:20.965330: step: 1908/530, loss: 4.3332940549589694e-05 2023-01-22 20:37:22.039936: step: 1912/530, loss: 7.711160492362978e-07 2023-01-22 20:37:23.102495: step: 1916/530, loss: 0.004623178858309984 2023-01-22 20:37:24.167839: step: 1920/530, loss: 1.5363431884907186e-05 2023-01-22 20:37:25.251693: step: 1924/530, loss: 0.0028751862701028585 2023-01-22 20:37:26.323463: step: 1928/530, loss: 0.00360312731936574 2023-01-22 20:37:27.424385: step: 1932/530, loss: 0.004539411514997482 2023-01-22 20:37:28.526676: step: 1936/530, loss: 0.0032826552633196115 2023-01-22 20:37:29.601570: step: 1940/530, loss: 0.0031021826434880495 2023-01-22 20:37:30.688800: step: 1944/530, loss: 0.003293985966593027 2023-01-22 20:37:31.770890: step: 1948/530, loss: 0.00023466760467272252 2023-01-22 20:37:32.869886: step: 1952/530, loss: 0.010962816886603832 2023-01-22 20:37:33.976541: step: 1956/530, loss: 0.003906755708158016 2023-01-22 20:37:35.051153: step: 1960/530, loss: 0.001585396472364664 2023-01-22 20:37:36.145339: step: 1964/530, loss: 0.0004932558513246477 2023-01-22 20:37:37.251659: step: 1968/530, loss: 0.00801409874111414 2023-01-22 20:37:38.333420: step: 1972/530, loss: 0.002754591405391693 2023-01-22 20:37:39.417150: step: 1976/530, loss: 0.003606868674978614 2023-01-22 20:37:40.525619: step: 1980/530, loss: 0.009220970794558525 2023-01-22 20:37:41.599746: step: 1984/530, loss: 0.0032213402446359396 2023-01-22 20:37:42.681713: step: 1988/530, loss: 0.0016332759987562895 2023-01-22 20:37:43.795984: step: 1992/530, loss: 0.0024386129807680845 2023-01-22 20:37:44.866077: step: 1996/530, loss: 0.006423316430300474 2023-01-22 20:37:45.954530: step: 2000/530, loss: 0.0009003261802718043 2023-01-22 20:37:47.027248: step: 2004/530, loss: 0.0006505006458610296 2023-01-22 20:37:48.123310: step: 2008/530, loss: 0.00021246673713903874 2023-01-22 20:37:49.216419: step: 2012/530, loss: 4.256839474692242e-06 2023-01-22 20:37:50.296219: step: 2016/530, loss: 0.0021003950387239456 2023-01-22 20:37:51.372873: step: 2020/530, loss: 0.011076259426772594 2023-01-22 20:37:52.440575: step: 2024/530, loss: 0.001986247021704912 2023-01-22 20:37:53.504383: step: 2028/530, loss: 2.125672608599416e-06 2023-01-22 20:37:54.594756: step: 2032/530, loss: 0.005149484146386385 2023-01-22 20:37:55.677412: step: 2036/530, loss: 0.004954056814312935 2023-01-22 20:37:56.754819: step: 2040/530, loss: 0.00020679004956036806 2023-01-22 20:37:57.825701: step: 2044/530, loss: 0.0014698265586048365 2023-01-22 20:37:58.910268: step: 2048/530, loss: 0.005000512581318617 2023-01-22 20:38:00.002398: step: 2052/530, loss: 0.002040943130850792 2023-01-22 20:38:01.104879: step: 2056/530, loss: 1.192059789900668e-05 2023-01-22 20:38:02.210690: step: 2060/530, loss: 0.0046931067481637 2023-01-22 20:38:03.291942: step: 2064/530, loss: 5.736005550716072e-05 2023-01-22 20:38:04.392893: step: 2068/530, loss: 0.005970245227217674 2023-01-22 20:38:05.481728: step: 2072/530, loss: 3.0284812964964658e-05 2023-01-22 20:38:06.570386: step: 2076/530, loss: 0.0031871541868895292 2023-01-22 20:38:07.661487: step: 2080/530, loss: 2.6468411306268536e-05 2023-01-22 20:38:08.771749: step: 2084/530, loss: 0.0038185175508260727 2023-01-22 20:38:09.853407: step: 2088/530, loss: 0.0015276194317266345 2023-01-22 20:38:10.947394: step: 2092/530, loss: 0.0023720518220216036 2023-01-22 20:38:12.047141: step: 2096/530, loss: 0.0031994623132050037 2023-01-22 20:38:13.131350: step: 2100/530, loss: 0.0008301698253490031 2023-01-22 20:38:14.236883: step: 2104/530, loss: 0.0036158226430416107 2023-01-22 20:38:15.306329: step: 2108/530, loss: 0.0019475846784189343 2023-01-22 20:38:16.392760: step: 2112/530, loss: 0.004567019175738096 2023-01-22 20:38:17.496259: step: 2116/530, loss: 3.7252898543727042e-09 2023-01-22 20:38:18.576588: step: 2120/530, loss: 0.009466171264648438 ================================================== Loss: 0.003 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3379255524152107, 'r': 0.35652107617240447, 'f1': 0.34697434375412217}, 'combined': 0.25566530592409, 'stategy': 1, 'epoch': 17} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3293799270517206, 'r': 0.28507164804179574, 'f1': 0.30562824620387646}, 'combined': 0.18981122658977592, 'stategy': 1, 'epoch': 17} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34955593205092494, 'r': 0.3455761681186563, 'f1': 0.347554657630786}, 'combined': 0.25609290562268444, 'stategy': 1, 'epoch': 17} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3195131300644146, 'r': 0.2875934207305809, 'f1': 0.3027141575831518}, 'combined': 0.1880014241832206, 'stategy': 1, 'epoch': 17} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34331208590783885, 'r': 0.32898027207487407, 'f1': 0.33599341740980354}, 'combined': 0.2475740970388026, 'stategy': 1, 'epoch': 17} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34614247010149396, 'r': 0.2965959171254657, 'f1': 0.3194595045700125}, 'combined': 0.19840116599611304, 'stategy': 1, 'epoch': 17} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3138888888888889, 'r': 0.4035714285714286, 'f1': 0.35312499999999997}, 'combined': 0.23541666666666664, 'stategy': 1, 'epoch': 17} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.36363636363636365, 'r': 0.5217391304347826, 'f1': 0.42857142857142855}, 'combined': 0.21428571428571427, 'stategy': 1, 'epoch': 17} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 17} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 18 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 20:40:47.908714: step: 4/530, loss: 0.001717277686111629 2023-01-22 20:40:48.983712: step: 8/530, loss: 0.0006986533990129828 2023-01-22 20:40:50.056577: step: 12/530, loss: 0.0038119065575301647 2023-01-22 20:40:51.157220: step: 16/530, loss: 0.0023736669681966305 2023-01-22 20:40:52.243212: step: 20/530, loss: 0.001824354287236929 2023-01-22 20:40:53.329557: step: 24/530, loss: 0.0007617135415785015 2023-01-22 20:40:54.423399: step: 28/530, loss: 0.005846124608069658 2023-01-22 20:40:55.505768: step: 32/530, loss: 0.006003752816468477 2023-01-22 20:40:56.573008: step: 36/530, loss: 0.0019311968935653567 2023-01-22 20:40:57.651429: step: 40/530, loss: 0.004382942337542772 2023-01-22 20:40:58.766775: step: 44/530, loss: 0.02645988017320633 2023-01-22 20:40:59.826455: step: 48/530, loss: 0.0002333256124984473 2023-01-22 20:41:00.910606: step: 52/530, loss: 0.003416206454858184 2023-01-22 20:41:01.968701: step: 56/530, loss: 0.002360232174396515 2023-01-22 20:41:03.046607: step: 60/530, loss: 7.052139699226245e-05 2023-01-22 20:41:04.117366: step: 64/530, loss: 0.006199215538799763 2023-01-22 20:41:05.229047: step: 68/530, loss: 0.004202813375741243 2023-01-22 20:41:06.306649: step: 72/530, loss: 0.00518175819888711 2023-01-22 20:41:07.386966: step: 76/530, loss: 0.00010874445433728397 2023-01-22 20:41:08.453880: step: 80/530, loss: 4.146892752032727e-05 2023-01-22 20:41:09.564066: step: 84/530, loss: 0.014703149907290936 2023-01-22 20:41:10.628944: step: 88/530, loss: 8.461222023470327e-06 2023-01-22 20:41:11.717456: step: 92/530, loss: 0.004158864729106426 2023-01-22 20:41:12.794045: step: 96/530, loss: 0.0002442148106638342 2023-01-22 20:41:13.868212: step: 100/530, loss: 0.0004288915079087019 2023-01-22 20:41:14.975974: step: 104/530, loss: 0.00298251211643219 2023-01-22 20:41:16.087071: step: 108/530, loss: 0.01544266752898693 2023-01-22 20:41:17.168516: step: 112/530, loss: 0.0002007533039432019 2023-01-22 20:41:18.260852: step: 116/530, loss: 0.000407932122470811 2023-01-22 20:41:19.343483: step: 120/530, loss: 0.00021574630227405578 2023-01-22 20:41:20.425979: step: 124/530, loss: 0.005891435779631138 2023-01-22 20:41:21.529863: step: 128/530, loss: 0.0028573423624038696 2023-01-22 20:41:22.610087: step: 132/530, loss: 0.0019811580423265696 2023-01-22 20:41:23.695227: step: 136/530, loss: 0.0011197433341294527 2023-01-22 20:41:24.770409: step: 140/530, loss: 0.005254335701465607 2023-01-22 20:41:25.840769: step: 144/530, loss: 0.0018295374466106296 2023-01-22 20:41:26.923126: step: 148/530, loss: 0.0001792960101738572 2023-01-22 20:41:28.015356: step: 152/530, loss: 0.004178212024271488 2023-01-22 20:41:29.100843: step: 156/530, loss: 0.02185814082622528 2023-01-22 20:41:30.184691: step: 160/530, loss: 0.005147851537913084 2023-01-22 20:41:31.262254: step: 164/530, loss: 0.0003381682909093797 2023-01-22 20:41:32.339777: step: 168/530, loss: 0.005957733374089003 2023-01-22 20:41:33.411797: step: 172/530, loss: 0.00031117681646719575 2023-01-22 20:41:34.481875: step: 176/530, loss: 9.963851880456787e-06 2023-01-22 20:41:35.586807: step: 180/530, loss: 0.011955692432820797 2023-01-22 20:41:36.669799: step: 184/530, loss: 0.0002807419514283538 2023-01-22 20:41:37.720121: step: 188/530, loss: 0.0031959018670022488 2023-01-22 20:41:38.793177: step: 192/530, loss: 0.006584660150110722 2023-01-22 20:41:39.867138: step: 196/530, loss: 0.000583402463234961 2023-01-22 20:41:40.985903: step: 200/530, loss: 0.0044104475528001785 2023-01-22 20:41:42.110597: step: 204/530, loss: 0.0019759235437959433 2023-01-22 20:41:43.199817: step: 208/530, loss: 5.7586716138757765e-05 2023-01-22 20:41:44.286715: step: 212/530, loss: 7.456469029420987e-05 2023-01-22 20:41:45.397654: step: 216/530, loss: 0.004510125610977411 2023-01-22 20:41:46.461812: step: 220/530, loss: 1.1955972695432138e-05 2023-01-22 20:41:47.557873: step: 224/530, loss: 4.097818528947528e-09 2023-01-22 20:41:48.668065: step: 228/530, loss: 0.00011046500731026754 2023-01-22 20:41:49.736467: step: 232/530, loss: 0.0054216464050114155 2023-01-22 20:41:50.833737: step: 236/530, loss: 0.005629874300211668 2023-01-22 20:41:51.901583: step: 240/530, loss: 0.0001685080205788836 2023-01-22 20:41:52.997170: step: 244/530, loss: 0.0012813311768695712 2023-01-22 20:41:54.065886: step: 248/530, loss: 0.0017779003828763962 2023-01-22 20:41:55.171085: step: 252/530, loss: 1.4218800970411394e-05 2023-01-22 20:41:56.257302: step: 256/530, loss: 0.00031449217931367457 2023-01-22 20:41:57.336584: step: 260/530, loss: 0.000883161264937371 2023-01-22 20:41:58.403403: step: 264/530, loss: 0.004566379357129335 2023-01-22 20:41:59.521420: step: 268/530, loss: 0.00648776488378644 2023-01-22 20:42:00.590034: step: 272/530, loss: 0.00039646675577387214 2023-01-22 20:42:01.668819: step: 276/530, loss: 0.00014451795141212642 2023-01-22 20:42:02.783493: step: 280/530, loss: 0.0019416098948568106 2023-01-22 20:42:03.858232: step: 284/530, loss: 0.0011632838286459446 2023-01-22 20:42:04.951420: step: 288/530, loss: 0.0007095273467712104 2023-01-22 20:42:06.030950: step: 292/530, loss: 0.0007614679052494466 2023-01-22 20:42:07.109358: step: 296/530, loss: 0.0002598889986984432 2023-01-22 20:42:08.204630: step: 300/530, loss: 0.0002933721407316625 2023-01-22 20:42:09.280465: step: 304/530, loss: 0.002365187043324113 2023-01-22 20:42:10.397268: step: 308/530, loss: 0.00019210478058084846 2023-01-22 20:42:11.482014: step: 312/530, loss: 0.011270344257354736 2023-01-22 20:42:12.562604: step: 316/530, loss: 0.00019919799524359405 2023-01-22 20:42:13.625256: step: 320/530, loss: 0.001244648010469973 2023-01-22 20:42:14.725350: step: 324/530, loss: 0.00011213490506634116 2023-01-22 20:42:15.808774: step: 328/530, loss: 0.0009468088974244893 2023-01-22 20:42:16.882401: step: 332/530, loss: 2.9115508368704468e-05 2023-01-22 20:42:17.968280: step: 336/530, loss: 0.0029539279639720917 2023-01-22 20:42:19.066892: step: 340/530, loss: 0.0009108154918067157 2023-01-22 20:42:20.149279: step: 344/530, loss: 0.00022972917940933257 2023-01-22 20:42:21.236407: step: 348/530, loss: 2.0186087567708455e-05 2023-01-22 20:42:22.318747: step: 352/530, loss: 0.00953727774322033 2023-01-22 20:42:23.394628: step: 356/530, loss: 0.0020959770772606134 2023-01-22 20:42:24.455559: step: 360/530, loss: 0.001370947458781302 2023-01-22 20:42:25.544419: step: 364/530, loss: 7.094330794643611e-05 2023-01-22 20:42:26.638011: step: 368/530, loss: 0.005751086864620447 2023-01-22 20:42:27.727232: step: 372/530, loss: 0.0019651406910270452 2023-01-22 20:42:28.820305: step: 376/530, loss: 0.0029390938580036163 2023-01-22 20:42:29.905527: step: 380/530, loss: 0.0006309486925601959 2023-01-22 20:42:30.993106: step: 384/530, loss: 0.0006725346902385354 2023-01-22 20:42:32.080779: step: 388/530, loss: 0.000701945973560214 2023-01-22 20:42:33.174706: step: 392/530, loss: 0.0005636418936774135 2023-01-22 20:42:34.288137: step: 396/530, loss: 0.0036305224057286978 2023-01-22 20:42:35.396637: step: 400/530, loss: 0.0026129111647605896 2023-01-22 20:42:36.470962: step: 404/530, loss: 0.0016736896941438317 2023-01-22 20:42:37.560914: step: 408/530, loss: 0.0032366346567869186 2023-01-22 20:42:38.635683: step: 412/530, loss: 0.010163509286940098 2023-01-22 20:42:39.713030: step: 416/530, loss: 0.0008702895138412714 2023-01-22 20:42:40.792957: step: 420/530, loss: 0.01142034586519003 2023-01-22 20:42:41.874691: step: 424/530, loss: 0.00237711681984365 2023-01-22 20:42:42.981470: step: 428/530, loss: 0.00505759147927165 2023-01-22 20:42:44.054084: step: 432/530, loss: 0.006024437490850687 2023-01-22 20:42:45.125657: step: 436/530, loss: 0.008693150244653225 2023-01-22 20:42:46.215477: step: 440/530, loss: 0.00016724682063795626 2023-01-22 20:42:47.297536: step: 444/530, loss: 6.383230356732383e-05 2023-01-22 20:42:48.382101: step: 448/530, loss: 0.0015097310533747077 2023-01-22 20:42:49.481474: step: 452/530, loss: 0.011982501484453678 2023-01-22 20:42:50.560883: step: 456/530, loss: 2.5591793928469997e-07 2023-01-22 20:42:51.650358: step: 460/530, loss: 0.0001620101393200457 2023-01-22 20:42:52.735255: step: 464/530, loss: 8.83015600265935e-05 2023-01-22 20:42:53.823032: step: 468/530, loss: 0.004646714311093092 2023-01-22 20:42:54.914410: step: 472/530, loss: 0.000592630822211504 2023-01-22 20:42:56.002491: step: 476/530, loss: 0.005837602540850639 2023-01-22 20:42:57.098901: step: 480/530, loss: 0.004000914748758078 2023-01-22 20:42:58.178993: step: 484/530, loss: 0.012194002978503704 2023-01-22 20:42:59.251486: step: 488/530, loss: 0.008404335007071495 2023-01-22 20:43:00.342616: step: 492/530, loss: 0.00016589769802521914 2023-01-22 20:43:01.446588: step: 496/530, loss: 6.875131657579914e-05 2023-01-22 20:43:02.526952: step: 500/530, loss: 0.00075691775418818 2023-01-22 20:43:03.636315: step: 504/530, loss: 0.031414587050676346 2023-01-22 20:43:04.740122: step: 508/530, loss: 0.0012252414599061012 2023-01-22 20:43:05.814131: step: 512/530, loss: 0.020032024011015892 2023-01-22 20:43:06.897342: step: 516/530, loss: 0.012250245548784733 2023-01-22 20:43:07.992925: step: 520/530, loss: 0.004050903487950563 2023-01-22 20:43:09.089983: step: 524/530, loss: 0.004247687291353941 2023-01-22 20:43:10.186800: step: 528/530, loss: 0.0035304396878927946 2023-01-22 20:43:11.286629: step: 532/530, loss: 0.007886233739554882 2023-01-22 20:43:12.404776: step: 536/530, loss: 0.006331183947622776 2023-01-22 20:43:13.511945: step: 540/530, loss: 0.013163681142032146 2023-01-22 20:43:14.593216: step: 544/530, loss: 0.0005475817015394568 2023-01-22 20:43:15.658438: step: 548/530, loss: 0.0004599393578246236 2023-01-22 20:43:16.730676: step: 552/530, loss: 0.0010365445632487535 2023-01-22 20:43:17.803943: step: 556/530, loss: 1.4423936590901576e-05 2023-01-22 20:43:18.887324: step: 560/530, loss: 1.5923005776130594e-05 2023-01-22 20:43:19.964060: step: 564/530, loss: 0.0003931539540644735 2023-01-22 20:43:21.076535: step: 568/530, loss: 0.0009414428495801985 2023-01-22 20:43:22.180820: step: 572/530, loss: 4.491058007261017e-06 2023-01-22 20:43:23.324390: step: 576/530, loss: 0.0037829342763870955 2023-01-22 20:43:24.406729: step: 580/530, loss: 8.805045217741281e-05 2023-01-22 20:43:25.478481: step: 584/530, loss: 4.563278821478889e-07 2023-01-22 20:43:26.573221: step: 588/530, loss: 0.00023557775421068072 2023-01-22 20:43:27.681394: step: 592/530, loss: 0.004916893783956766 2023-01-22 20:43:28.770372: step: 596/530, loss: 0.00038089865120127797 2023-01-22 20:43:29.879016: step: 600/530, loss: 0.004265580326318741 2023-01-22 20:43:30.988990: step: 604/530, loss: 0.004831551108509302 2023-01-22 20:43:32.090650: step: 608/530, loss: 0.0020402439404278994 2023-01-22 20:43:33.195768: step: 612/530, loss: 0.0008778349729254842 2023-01-22 20:43:34.275282: step: 616/530, loss: 0.0028767564799636602 2023-01-22 20:43:35.387987: step: 620/530, loss: 0.0036349743604660034 2023-01-22 20:43:36.490174: step: 624/530, loss: 0.0032440037466585636 2023-01-22 20:43:37.572597: step: 628/530, loss: 0.0046727824956178665 2023-01-22 20:43:38.640260: step: 632/530, loss: 0.002169714542105794 2023-01-22 20:43:39.712880: step: 636/530, loss: 0.0023315646685659885 2023-01-22 20:43:40.803805: step: 640/530, loss: 0.0004691978101618588 2023-01-22 20:43:41.903482: step: 644/530, loss: 0.0013867220841348171 2023-01-22 20:43:42.974176: step: 648/530, loss: 3.5058568755630404e-05 2023-01-22 20:43:44.055753: step: 652/530, loss: 0.0002541353169362992 2023-01-22 20:43:45.153949: step: 656/530, loss: 0.0025046151131391525 2023-01-22 20:43:46.233297: step: 660/530, loss: 4.2849565943470225e-05 2023-01-22 20:43:47.337953: step: 664/530, loss: 0.00032935856143012643 2023-01-22 20:43:48.413906: step: 668/530, loss: 0.00035427865805104375 2023-01-22 20:43:49.506251: step: 672/530, loss: 0.007320267613977194 2023-01-22 20:43:50.585676: step: 676/530, loss: 0.0018458595732226968 2023-01-22 20:43:51.655141: step: 680/530, loss: 0.0025820601731538773 2023-01-22 20:43:52.741048: step: 684/530, loss: 0.0017484494019299746 2023-01-22 20:43:53.807876: step: 688/530, loss: 0.0017654402181506157 2023-01-22 20:43:54.884779: step: 692/530, loss: 0.004032533150166273 2023-01-22 20:43:55.940194: step: 696/530, loss: 0.00021393563656602055 2023-01-22 20:43:57.015285: step: 700/530, loss: 0.0020914871711283922 2023-01-22 20:43:58.088778: step: 704/530, loss: 0.0003192913136444986 2023-01-22 20:43:59.151175: step: 708/530, loss: 0.0001073602688848041 2023-01-22 20:44:00.219956: step: 712/530, loss: 0.0015706164995208383 2023-01-22 20:44:01.310718: step: 716/530, loss: 0.002007235074415803 2023-01-22 20:44:02.408601: step: 720/530, loss: 0.0016504325903952122 2023-01-22 20:44:03.515017: step: 724/530, loss: 0.0013440509792417288 2023-01-22 20:44:04.613603: step: 728/530, loss: 0.004388183355331421 2023-01-22 20:44:05.699780: step: 732/530, loss: 0.004481877200305462 2023-01-22 20:44:06.789567: step: 736/530, loss: 0.003275747410953045 2023-01-22 20:44:07.863408: step: 740/530, loss: 4.967485074303113e-05 2023-01-22 20:44:08.949920: step: 744/530, loss: 0.0021200755145400763 2023-01-22 20:44:10.032982: step: 748/530, loss: 5.9789403167087585e-05 2023-01-22 20:44:11.119217: step: 752/530, loss: 0.001000691088847816 2023-01-22 20:44:12.189857: step: 756/530, loss: 0.00037946488009765744 2023-01-22 20:44:13.304957: step: 760/530, loss: 0.000272397039225325 2023-01-22 20:44:14.410617: step: 764/530, loss: 0.005482069682329893 2023-01-22 20:44:15.503500: step: 768/530, loss: 0.0014439367223531008 2023-01-22 20:44:16.599806: step: 772/530, loss: 0.00023551311460323632 2023-01-22 20:44:17.689922: step: 776/530, loss: 0.00016074276936706156 2023-01-22 20:44:18.769429: step: 780/530, loss: 0.00014413455210160464 2023-01-22 20:44:19.849924: step: 784/530, loss: 0.006376531440764666 2023-01-22 20:44:20.936739: step: 788/530, loss: 0.0004619788669515401 2023-01-22 20:44:22.033224: step: 792/530, loss: 5.243196937954053e-05 2023-01-22 20:44:23.118082: step: 796/530, loss: 8.521234121872112e-05 2023-01-22 20:44:24.225631: step: 800/530, loss: 0.001080823945812881 2023-01-22 20:44:25.302474: step: 804/530, loss: 3.813042712863535e-05 2023-01-22 20:44:26.374249: step: 808/530, loss: 0.0030335320625454187 2023-01-22 20:44:27.458358: step: 812/530, loss: 0.0039006578736007214 2023-01-22 20:44:28.560331: step: 816/530, loss: 0.0016806074418127537 2023-01-22 20:44:29.654746: step: 820/530, loss: 0.01914094388484955 2023-01-22 20:44:30.747235: step: 824/530, loss: 0.003452296368777752 2023-01-22 20:44:31.825425: step: 828/530, loss: 0.0002554992097429931 2023-01-22 20:44:32.917152: step: 832/530, loss: 0.0012343236012384295 2023-01-22 20:44:33.991308: step: 836/530, loss: 0.0031420369632542133 2023-01-22 20:44:35.093565: step: 840/530, loss: 0.0022533959709107876 2023-01-22 20:44:36.198020: step: 844/530, loss: 0.0020250931847840548 2023-01-22 20:44:37.302850: step: 848/530, loss: 0.0014053195482119918 2023-01-22 20:44:38.396253: step: 852/530, loss: 0.0019668361637741327 2023-01-22 20:44:39.498766: step: 856/530, loss: 0.001912312232889235 2023-01-22 20:44:40.574125: step: 860/530, loss: 0.002343566855415702 2023-01-22 20:44:41.652051: step: 864/530, loss: 0.0036152235697954893 2023-01-22 20:44:42.726215: step: 868/530, loss: 0.003888618666678667 2023-01-22 20:44:43.804717: step: 872/530, loss: 0.0 2023-01-22 20:44:44.922504: step: 876/530, loss: 0.009707119315862656 2023-01-22 20:44:46.020794: step: 880/530, loss: 0.00782280694693327 2023-01-22 20:44:47.124376: step: 884/530, loss: 0.002724698279052973 2023-01-22 20:44:48.192772: step: 888/530, loss: 5.1082268328173086e-05 2023-01-22 20:44:49.275221: step: 892/530, loss: 0.0023005264811217785 2023-01-22 20:44:50.381319: step: 896/530, loss: 5.8825709857046604e-05 2023-01-22 20:44:51.467587: step: 900/530, loss: 0.0072162458673119545 2023-01-22 20:44:52.565412: step: 904/530, loss: 0.00029325688956305385 2023-01-22 20:44:53.646609: step: 908/530, loss: 0.0022310204803943634 2023-01-22 20:44:54.747336: step: 912/530, loss: 0.000991170178167522 2023-01-22 20:44:55.834002: step: 916/530, loss: 0.002493495587259531 2023-01-22 20:44:56.901533: step: 920/530, loss: 0.006371739786118269 2023-01-22 20:44:57.993822: step: 924/530, loss: 0.01080137025564909 2023-01-22 20:44:59.085905: step: 928/530, loss: 4.840054316446185e-06 2023-01-22 20:45:00.174700: step: 932/530, loss: 0.0035445194225758314 2023-01-22 20:45:01.250441: step: 936/530, loss: 0.0018409241456538439 2023-01-22 20:45:02.331867: step: 940/530, loss: 0.0011638402938842773 2023-01-22 20:45:03.406925: step: 944/530, loss: 0.004288491792976856 2023-01-22 20:45:04.476721: step: 948/530, loss: 0.0004601738473866135 2023-01-22 20:45:05.585465: step: 952/530, loss: 0.0036804615519940853 2023-01-22 20:45:06.664877: step: 956/530, loss: 0.001864671939983964 2023-01-22 20:45:07.757237: step: 960/530, loss: 0.007566457148641348 2023-01-22 20:45:08.850562: step: 964/530, loss: 3.502176332403906e-05 2023-01-22 20:45:09.943949: step: 968/530, loss: 0.011312774382531643 2023-01-22 20:45:11.015576: step: 972/530, loss: 0.006206408608704805 2023-01-22 20:45:12.119046: step: 976/530, loss: 0.0005008551524952054 2023-01-22 20:45:13.228322: step: 980/530, loss: 0.0017643271712586284 2023-01-22 20:45:14.341023: step: 984/530, loss: 0.0022599254734814167 2023-01-22 20:45:15.447313: step: 988/530, loss: 0.0014045790303498507 2023-01-22 20:45:16.513735: step: 992/530, loss: 0.0003754697390832007 2023-01-22 20:45:17.587415: step: 996/530, loss: 0.0025966197717934847 2023-01-22 20:45:18.693490: step: 1000/530, loss: 0.0059115388430655 2023-01-22 20:45:19.763779: step: 1004/530, loss: 0.004008471965789795 2023-01-22 20:45:20.856604: step: 1008/530, loss: 0.006558794528245926 2023-01-22 20:45:21.957041: step: 1012/530, loss: 0.0057535069063305855 2023-01-22 20:45:23.044991: step: 1016/530, loss: 0.0027343512047082186 2023-01-22 20:45:24.143350: step: 1020/530, loss: 0.00018126910435967147 2023-01-22 20:45:25.218688: step: 1024/530, loss: 0.010294582694768906 2023-01-22 20:45:26.295985: step: 1028/530, loss: 0.0003243729879613966 2023-01-22 20:45:27.413592: step: 1032/530, loss: 4.505300967139192e-05 2023-01-22 20:45:28.500019: step: 1036/530, loss: 0.0020992967765778303 2023-01-22 20:45:29.577249: step: 1040/530, loss: 0.001721567357890308 2023-01-22 20:45:30.663385: step: 1044/530, loss: 0.00028687919257208705 2023-01-22 20:45:31.771349: step: 1048/530, loss: 0.0028847442008554935 2023-01-22 20:45:32.867129: step: 1052/530, loss: 0.0002744919911492616 2023-01-22 20:45:33.940948: step: 1056/530, loss: 0.004789954517036676 2023-01-22 20:45:35.041993: step: 1060/530, loss: 0.0001996932114707306 2023-01-22 20:45:36.124818: step: 1064/530, loss: 0.002991387154906988 2023-01-22 20:45:37.213778: step: 1068/530, loss: 0.0013041590573266149 2023-01-22 20:45:38.324290: step: 1072/530, loss: 0.0009976651053875685 2023-01-22 20:45:39.404367: step: 1076/530, loss: 0.0003664449031930417 2023-01-22 20:45:40.490792: step: 1080/530, loss: 0.003211794886738062 2023-01-22 20:45:41.607984: step: 1084/530, loss: 0.0015634378651157022 2023-01-22 20:45:42.677129: step: 1088/530, loss: 0.00016998103819787502 2023-01-22 20:45:43.749254: step: 1092/530, loss: 0.00010231405030936003 2023-01-22 20:45:44.843106: step: 1096/530, loss: 2.615609992062673e-05 2023-01-22 20:45:45.923043: step: 1100/530, loss: 4.504331809584983e-05 2023-01-22 20:45:46.983027: step: 1104/530, loss: 0.00014758470933884382 2023-01-22 20:45:48.063606: step: 1108/530, loss: 0.00011001220991602167 2023-01-22 20:45:49.162755: step: 1112/530, loss: 0.01595516875386238 2023-01-22 20:45:50.234828: step: 1116/530, loss: 0.00031333856168203056 2023-01-22 20:45:51.317364: step: 1120/530, loss: 0.0019532975275069475 2023-01-22 20:45:52.412585: step: 1124/530, loss: 0.002874934347346425 2023-01-22 20:45:53.497510: step: 1128/530, loss: 0.0022516525350511074 2023-01-22 20:45:54.579137: step: 1132/530, loss: 0.0005060546100139618 2023-01-22 20:45:55.673976: step: 1136/530, loss: 0.0005739081534557045 2023-01-22 20:45:56.760548: step: 1140/530, loss: 0.0012365446891635656 2023-01-22 20:45:57.873441: step: 1144/530, loss: 0.019276412203907967 2023-01-22 20:45:58.939586: step: 1148/530, loss: 0.0014636055566370487 2023-01-22 20:46:00.048954: step: 1152/530, loss: 0.003789471462368965 2023-01-22 20:46:01.136021: step: 1156/530, loss: 0.0028425180353224277 2023-01-22 20:46:02.218448: step: 1160/530, loss: 0.0035149287432432175 2023-01-22 20:46:03.314451: step: 1164/530, loss: 0.0031245313584804535 2023-01-22 20:46:04.407085: step: 1168/530, loss: 0.00384851498529315 2023-01-22 20:46:05.500895: step: 1172/530, loss: 0.00021501992887351662 2023-01-22 20:46:06.593850: step: 1176/530, loss: 0.0034433945547789335 2023-01-22 20:46:07.678529: step: 1180/530, loss: 0.007750116754323244 2023-01-22 20:46:08.761467: step: 1184/530, loss: 0.000263664813246578 2023-01-22 20:46:09.878728: step: 1188/530, loss: 0.003954093437641859 2023-01-22 20:46:10.952217: step: 1192/530, loss: 2.8115797249483876e-05 2023-01-22 20:46:12.070483: step: 1196/530, loss: 0.00457800505682826 2023-01-22 20:46:13.129602: step: 1200/530, loss: 0.0010012646671384573 2023-01-22 20:46:14.218795: step: 1204/530, loss: 2.460063797116163e-06 2023-01-22 20:46:15.296828: step: 1208/530, loss: 1.3038495616513046e-08 2023-01-22 20:46:16.386768: step: 1212/530, loss: 8.966604218585417e-05 2023-01-22 20:46:17.457694: step: 1216/530, loss: 3.9777263737050816e-05 2023-01-22 20:46:18.539548: step: 1220/530, loss: 6.475103873526677e-05 2023-01-22 20:46:19.632891: step: 1224/530, loss: 0.003936760127544403 2023-01-22 20:46:20.721603: step: 1228/530, loss: 0.005309733096510172 2023-01-22 20:46:21.793541: step: 1232/530, loss: 3.902622847817838e-05 2023-01-22 20:46:22.888586: step: 1236/530, loss: 0.007171180564910173 2023-01-22 20:46:23.973290: step: 1240/530, loss: 0.0013217878295108676 2023-01-22 20:46:25.050880: step: 1244/530, loss: 0.0026664354372769594 2023-01-22 20:46:26.120244: step: 1248/530, loss: 5.535219679586589e-05 2023-01-22 20:46:27.209312: step: 1252/530, loss: 0.004173062276095152 2023-01-22 20:46:28.299621: step: 1256/530, loss: 0.000889939779881388 2023-01-22 20:46:29.375462: step: 1260/530, loss: 0.001878840266726911 2023-01-22 20:46:30.464808: step: 1264/530, loss: 0.00019303134467918426 2023-01-22 20:46:31.534370: step: 1268/530, loss: 0.0058050015941262245 2023-01-22 20:46:32.611292: step: 1272/530, loss: 0.0011189930373802781 2023-01-22 20:46:33.697879: step: 1276/530, loss: 0.0022181409876793623 2023-01-22 20:46:34.791509: step: 1280/530, loss: 0.0009613332222215831 2023-01-22 20:46:35.873909: step: 1284/530, loss: 0.0007159464876167476 2023-01-22 20:46:36.976932: step: 1288/530, loss: 0.0017143894219771028 2023-01-22 20:46:38.079565: step: 1292/530, loss: 0.006154817063361406 2023-01-22 20:46:39.168966: step: 1296/530, loss: 0.007152739446610212 2023-01-22 20:46:40.289437: step: 1300/530, loss: 0.0021627964451909065 2023-01-22 20:46:41.381488: step: 1304/530, loss: 0.001702772919088602 2023-01-22 20:46:42.462187: step: 1308/530, loss: 6.095332082622917e-06 2023-01-22 20:46:43.563703: step: 1312/530, loss: 0.0044060563668608665 2023-01-22 20:46:44.667137: step: 1316/530, loss: 0.00379826663993299 2023-01-22 20:46:45.745822: step: 1320/530, loss: 0.0015721842646598816 2023-01-22 20:46:46.822353: step: 1324/530, loss: 0.002565699862316251 2023-01-22 20:46:47.923408: step: 1328/530, loss: 0.0025266525335609913 2023-01-22 20:46:49.014886: step: 1332/530, loss: 0.0022809526417404413 2023-01-22 20:46:50.112986: step: 1336/530, loss: 0.0002023878914769739 2023-01-22 20:46:51.177767: step: 1340/530, loss: 0.00039393187034875154 2023-01-22 20:46:52.279699: step: 1344/530, loss: 8.490855179843493e-06 2023-01-22 20:46:53.400450: step: 1348/530, loss: 0.0012715040938928723 2023-01-22 20:46:54.475282: step: 1352/530, loss: 0.0033437812235206366 2023-01-22 20:46:55.609167: step: 1356/530, loss: 0.0026764723006635904 2023-01-22 20:46:56.719790: step: 1360/530, loss: 0.0018067383207380772 2023-01-22 20:46:57.829632: step: 1364/530, loss: 0.0024920664727687836 2023-01-22 20:46:58.918160: step: 1368/530, loss: 7.260068377945572e-05 2023-01-22 20:47:00.018648: step: 1372/530, loss: 0.004392989445477724 2023-01-22 20:47:01.100835: step: 1376/530, loss: 0.007284869905561209 2023-01-22 20:47:02.190805: step: 1380/530, loss: 0.0025853365659713745 2023-01-22 20:47:03.278455: step: 1384/530, loss: 0.0006087161600589752 2023-01-22 20:47:04.353228: step: 1388/530, loss: 2.4609207684989087e-05 2023-01-22 20:47:05.432047: step: 1392/530, loss: 1.7088406821130775e-05 2023-01-22 20:47:06.518616: step: 1396/530, loss: 0.00859412457793951 2023-01-22 20:47:07.598256: step: 1400/530, loss: 0.0019435868598520756 2023-01-22 20:47:08.681108: step: 1404/530, loss: 0.0019388190703466535 2023-01-22 20:47:09.773017: step: 1408/530, loss: 1.255468487215694e-05 2023-01-22 20:47:10.864603: step: 1412/530, loss: 0.00016437396698165685 2023-01-22 20:47:11.949726: step: 1416/530, loss: 0.0015550577081739902 2023-01-22 20:47:13.028067: step: 1420/530, loss: 0.00014448219735641032 2023-01-22 20:47:14.110253: step: 1424/530, loss: 0.0019296086393296719 2023-01-22 20:47:15.193645: step: 1428/530, loss: 0.0006081080064177513 2023-01-22 20:47:16.274159: step: 1432/530, loss: 0.0021067133639007807 2023-01-22 20:47:17.356575: step: 1436/530, loss: 0.002325301757082343 2023-01-22 20:47:18.425126: step: 1440/530, loss: 0.0014245351776480675 2023-01-22 20:47:19.511951: step: 1444/530, loss: 5.2530690481944475e-06 2023-01-22 20:47:20.581764: step: 1448/530, loss: 0.0013785141054540873 2023-01-22 20:47:21.669661: step: 1452/530, loss: 0.00266665150411427 2023-01-22 20:47:22.743945: step: 1456/530, loss: 0.00010153292532777414 2023-01-22 20:47:23.832205: step: 1460/530, loss: 0.010531317442655563 2023-01-22 20:47:24.934899: step: 1464/530, loss: 0.005117565393447876 2023-01-22 20:47:26.035720: step: 1468/530, loss: 0.0026795787271112204 2023-01-22 20:47:27.138882: step: 1472/530, loss: 0.004253399092704058 2023-01-22 20:47:28.236889: step: 1476/530, loss: 0.006138286553323269 2023-01-22 20:47:29.316643: step: 1480/530, loss: 0.001985726645216346 2023-01-22 20:47:30.394224: step: 1484/530, loss: 0.0009818169055506587 2023-01-22 20:47:31.486981: step: 1488/530, loss: 0.0020236035343259573 2023-01-22 20:47:32.571902: step: 1492/530, loss: 0.0019806043710559607 2023-01-22 20:47:33.660406: step: 1496/530, loss: 0.007451156619936228 2023-01-22 20:47:34.736882: step: 1500/530, loss: 0.0007054515881463885 2023-01-22 20:47:35.808778: step: 1504/530, loss: 0.0030755724292248487 2023-01-22 20:47:36.908760: step: 1508/530, loss: 0.005066622514277697 2023-01-22 20:47:38.010156: step: 1512/530, loss: 0.006008957978338003 2023-01-22 20:47:39.079915: step: 1516/530, loss: 0.013087806291878223 2023-01-22 20:47:40.159762: step: 1520/530, loss: 0.001419123844243586 2023-01-22 20:47:41.251691: step: 1524/530, loss: 0.0009964581113308668 2023-01-22 20:47:42.358072: step: 1528/530, loss: 0.00013537734048441052 2023-01-22 20:47:43.424293: step: 1532/530, loss: 0.0027017153333872557 2023-01-22 20:47:44.495300: step: 1536/530, loss: 0.0010289069032296538 2023-01-22 20:47:45.566694: step: 1540/530, loss: 4.0146969695342705e-05 2023-01-22 20:47:46.645673: step: 1544/530, loss: 0.0018527734791859984 2023-01-22 20:47:47.732218: step: 1548/530, loss: 0.00414172001183033 2023-01-22 20:47:48.811877: step: 1552/530, loss: 0.0004370535025373101 2023-01-22 20:47:49.917984: step: 1556/530, loss: 0.0009930988308042288 2023-01-22 20:47:51.016731: step: 1560/530, loss: 0.0015663818921893835 2023-01-22 20:47:52.090180: step: 1564/530, loss: 0.007728134747594595 2023-01-22 20:47:53.175722: step: 1568/530, loss: 0.009619293734431267 2023-01-22 20:47:54.262805: step: 1572/530, loss: 0.00032079138327389956 2023-01-22 20:47:55.327753: step: 1576/530, loss: 0.000599631923250854 2023-01-22 20:47:56.420244: step: 1580/530, loss: 0.005323352292180061 2023-01-22 20:47:57.524734: step: 1584/530, loss: 0.0011103095021098852 2023-01-22 20:47:58.595484: step: 1588/530, loss: 1.4017600733495783e-06 2023-01-22 20:47:59.701556: step: 1592/530, loss: 0.0024874003138393164 2023-01-22 20:48:00.840985: step: 1596/530, loss: 0.005891331937164068 2023-01-22 20:48:01.937176: step: 1600/530, loss: 0.005847080610692501 2023-01-22 20:48:03.010745: step: 1604/530, loss: 0.0019826064817607403 2023-01-22 20:48:04.086165: step: 1608/530, loss: 0.01145973801612854 2023-01-22 20:48:05.186490: step: 1612/530, loss: 0.001424646470695734 2023-01-22 20:48:06.281598: step: 1616/530, loss: 0.003142877947539091 2023-01-22 20:48:07.350746: step: 1620/530, loss: 3.783239299082197e-05 2023-01-22 20:48:08.433901: step: 1624/530, loss: 0.004596029408276081 2023-01-22 20:48:09.521779: step: 1628/530, loss: 0.003456001402810216 2023-01-22 20:48:10.586126: step: 1632/530, loss: 6.610665082007472e-07 2023-01-22 20:48:11.674203: step: 1636/530, loss: 0.0001403927308274433 2023-01-22 20:48:12.795206: step: 1640/530, loss: 0.003840002231299877 2023-01-22 20:48:13.890395: step: 1644/530, loss: 0.0008944791625253856 2023-01-22 20:48:14.980716: step: 1648/530, loss: 0.004717118572443724 2023-01-22 20:48:16.073287: step: 1652/530, loss: 0.00012440640421118587 2023-01-22 20:48:17.159342: step: 1656/530, loss: 0.0014180088182911277 2023-01-22 20:48:18.255540: step: 1660/530, loss: 0.004750819411128759 2023-01-22 20:48:19.349903: step: 1664/530, loss: 0.0017868034774437547 2023-01-22 20:48:20.444735: step: 1668/530, loss: 0.0012775957584381104 2023-01-22 20:48:21.536267: step: 1672/530, loss: 0.0031952436547726393 2023-01-22 20:48:22.601801: step: 1676/530, loss: 2.72011475317413e-05 2023-01-22 20:48:23.697921: step: 1680/530, loss: 0.003033621469512582 2023-01-22 20:48:24.776366: step: 1684/530, loss: 0.00031308206962421536 2023-01-22 20:48:25.831622: step: 1688/530, loss: 4.836493098991923e-05 2023-01-22 20:48:26.941185: step: 1692/530, loss: 7.271373033290729e-05 2023-01-22 20:48:28.029963: step: 1696/530, loss: 0.0001186248628073372 2023-01-22 20:48:29.122340: step: 1700/530, loss: 0.002530114259570837 2023-01-22 20:48:30.207359: step: 1704/530, loss: 0.0020812377333641052 2023-01-22 20:48:31.271959: step: 1708/530, loss: 0.010340622626245022 2023-01-22 20:48:32.353135: step: 1712/530, loss: 0.0002444394340272993 2023-01-22 20:48:33.430246: step: 1716/530, loss: 0.003982409369200468 2023-01-22 20:48:34.522530: step: 1720/530, loss: 3.0109549697954208e-05 2023-01-22 20:48:35.621114: step: 1724/530, loss: 0.0016302644507959485 2023-01-22 20:48:36.711707: step: 1728/530, loss: 0.0005931056221015751 2023-01-22 20:48:37.790981: step: 1732/530, loss: 2.019263547481387e-06 2023-01-22 20:48:38.860232: step: 1736/530, loss: 0.0008689704118296504 2023-01-22 20:48:39.952945: step: 1740/530, loss: 0.0008405217085964978 2023-01-22 20:48:41.022357: step: 1744/530, loss: 2.7922547815251164e-05 2023-01-22 20:48:42.110737: step: 1748/530, loss: 7.264497253345326e-05 2023-01-22 20:48:43.181688: step: 1752/530, loss: 0.00038379195029847324 2023-01-22 20:48:44.270636: step: 1756/530, loss: 0.0009625382372178137 2023-01-22 20:48:45.355122: step: 1760/530, loss: 0.0002641146711539477 2023-01-22 20:48:46.460572: step: 1764/530, loss: 0.009809155017137527 2023-01-22 20:48:47.525559: step: 1768/530, loss: 0.00038203957956284285 2023-01-22 20:48:48.604668: step: 1772/530, loss: 0.010345851071178913 2023-01-22 20:48:49.685467: step: 1776/530, loss: 0.0003978973545599729 2023-01-22 20:48:50.776624: step: 1780/530, loss: 0.003386878641322255 2023-01-22 20:48:51.852244: step: 1784/530, loss: 0.0001284680183744058 2023-01-22 20:48:52.946960: step: 1788/530, loss: 0.0014040580717846751 2023-01-22 20:48:54.024455: step: 1792/530, loss: 6.557555752806365e-05 2023-01-22 20:48:55.120079: step: 1796/530, loss: 0.0044130305759608746 2023-01-22 20:48:56.199757: step: 1800/530, loss: 0.0013103386154398322 2023-01-22 20:48:57.298360: step: 1804/530, loss: 0.0015345969004556537 2023-01-22 20:48:58.377504: step: 1808/530, loss: 0.004855201579630375 2023-01-22 20:48:59.463694: step: 1812/530, loss: 0.016004931181669235 2023-01-22 20:49:00.574944: step: 1816/530, loss: 0.001297872862778604 2023-01-22 20:49:01.676365: step: 1820/530, loss: 0.005055380053818226 2023-01-22 20:49:02.757406: step: 1824/530, loss: 0.00018071664089802653 2023-01-22 20:49:03.864606: step: 1828/530, loss: 0.0075599090196192265 2023-01-22 20:49:04.969872: step: 1832/530, loss: 0.0034981267526745796 2023-01-22 20:49:06.049152: step: 1836/530, loss: 0.0011073533678427339 2023-01-22 20:49:07.134104: step: 1840/530, loss: 0.0015231224242597818 2023-01-22 20:49:08.218505: step: 1844/530, loss: 0.0038231462240219116 2023-01-22 20:49:09.320448: step: 1848/530, loss: 0.0004272600053809583 2023-01-22 20:49:10.399790: step: 1852/530, loss: 0.0017785176169127226 2023-01-22 20:49:11.479844: step: 1856/530, loss: 2.09951735996583e-06 2023-01-22 20:49:12.563495: step: 1860/530, loss: 0.0006456903065554798 2023-01-22 20:49:13.656371: step: 1864/530, loss: 0.00011082401033490896 2023-01-22 20:49:14.755656: step: 1868/530, loss: 0.0009531215182505548 2023-01-22 20:49:15.838626: step: 1872/530, loss: 0.00011759912013076246 2023-01-22 20:49:16.921492: step: 1876/530, loss: 0.006264088209718466 2023-01-22 20:49:18.015725: step: 1880/530, loss: 0.012948942370712757 2023-01-22 20:49:19.089204: step: 1884/530, loss: 0.0030248446855694056 2023-01-22 20:49:20.169755: step: 1888/530, loss: 2.8554763048305176e-05 2023-01-22 20:49:21.240640: step: 1892/530, loss: 1.4335214473248925e-05 2023-01-22 20:49:22.322701: step: 1896/530, loss: 0.004100819118320942 2023-01-22 20:49:23.402642: step: 1900/530, loss: 0.0008017533691599965 2023-01-22 20:49:24.473102: step: 1904/530, loss: 0.0006815269589424133 2023-01-22 20:49:25.563527: step: 1908/530, loss: 0.003955672029405832 2023-01-22 20:49:26.651219: step: 1912/530, loss: 0.005318224895745516 2023-01-22 20:49:27.742707: step: 1916/530, loss: 0.00162272690795362 2023-01-22 20:49:28.827317: step: 1920/530, loss: 0.004056726116687059 2023-01-22 20:49:29.902442: step: 1924/530, loss: 0.005189417861402035 2023-01-22 20:49:30.994835: step: 1928/530, loss: 0.003656966844573617 2023-01-22 20:49:32.094727: step: 1932/530, loss: 0.0036018837708979845 2023-01-22 20:49:33.178883: step: 1936/530, loss: 0.02192796766757965 2023-01-22 20:49:34.246807: step: 1940/530, loss: 5.364325943446602e-07 2023-01-22 20:49:35.338188: step: 1944/530, loss: 0.003181676845997572 2023-01-22 20:49:36.422883: step: 1948/530, loss: 0.004406286869198084 2023-01-22 20:49:37.514976: step: 1952/530, loss: 0.008195783942937851 2023-01-22 20:49:38.616781: step: 1956/530, loss: 0.0002161364973289892 2023-01-22 20:49:39.717362: step: 1960/530, loss: 0.014707427471876144 2023-01-22 20:49:40.788504: step: 1964/530, loss: 0.0008810496656224132 2023-01-22 20:49:41.901639: step: 1968/530, loss: 0.004724032245576382 2023-01-22 20:49:42.985236: step: 1972/530, loss: 0.0021628988906741142 2023-01-22 20:49:44.091404: step: 1976/530, loss: 0.012636066414415836 2023-01-22 20:49:45.171301: step: 1980/530, loss: 0.0006995893199928105 2023-01-22 20:49:46.229288: step: 1984/530, loss: 0.0028340821154415607 2023-01-22 20:49:47.312842: step: 1988/530, loss: 0.0015111678512766957 2023-01-22 20:49:48.407028: step: 1992/530, loss: 0.003040769835934043 2023-01-22 20:49:49.496055: step: 1996/530, loss: 0.0021007449831813574 2023-01-22 20:49:50.559852: step: 2000/530, loss: 6.046826092642732e-05 2023-01-22 20:49:51.620844: step: 2004/530, loss: 0.011318760924041271 2023-01-22 20:49:52.703198: step: 2008/530, loss: 0.0008086036541499197 2023-01-22 20:49:53.803303: step: 2012/530, loss: 0.001626555691473186 2023-01-22 20:49:54.897043: step: 2016/530, loss: 0.0005122142611071467 2023-01-22 20:49:55.966974: step: 2020/530, loss: 0.006633398588746786 2023-01-22 20:49:57.071268: step: 2024/530, loss: 0.005307371262460947 2023-01-22 20:49:58.165006: step: 2028/530, loss: 0.006337102502584457 2023-01-22 20:49:59.273936: step: 2032/530, loss: 0.0022158240899443626 2023-01-22 20:50:00.373381: step: 2036/530, loss: 0.000360160309355706 2023-01-22 20:50:01.455421: step: 2040/530, loss: 0.006802905350923538 2023-01-22 20:50:02.572221: step: 2044/530, loss: 0.0004644159344024956 2023-01-22 20:50:03.665551: step: 2048/530, loss: 0.0007800815510563552 2023-01-22 20:50:04.761659: step: 2052/530, loss: 0.0002871396718546748 2023-01-22 20:50:05.871148: step: 2056/530, loss: 0.00527344923466444 2023-01-22 20:50:06.951931: step: 2060/530, loss: 3.128217485937057e-06 2023-01-22 20:50:08.069836: step: 2064/530, loss: 0.0019845294300466776 2023-01-22 20:50:09.157165: step: 2068/530, loss: 0.0024314215406775475 2023-01-22 20:50:10.252379: step: 2072/530, loss: 0.011278643272817135 2023-01-22 20:50:11.345188: step: 2076/530, loss: 0.014923572540283203 2023-01-22 20:50:12.427479: step: 2080/530, loss: 0.0012695260811597109 2023-01-22 20:50:13.516222: step: 2084/530, loss: 0.0048428867012262344 2023-01-22 20:50:14.603991: step: 2088/530, loss: 7.22408076399006e-05 2023-01-22 20:50:15.687248: step: 2092/530, loss: 1.5640538549632765e-05 2023-01-22 20:50:16.759334: step: 2096/530, loss: 0.000488990219309926 2023-01-22 20:50:17.837584: step: 2100/530, loss: 0.001418329426087439 2023-01-22 20:50:18.937837: step: 2104/530, loss: 9.549040260026231e-05 2023-01-22 20:50:20.027333: step: 2108/530, loss: 0.0009483927278779447 2023-01-22 20:50:21.119678: step: 2112/530, loss: 0.005046523176133633 2023-01-22 20:50:22.198644: step: 2116/530, loss: 0.006434328854084015 2023-01-22 20:50:23.291365: step: 2120/530, loss: 0.002885560505092144 ================================================== Loss: 0.003 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34103149757219525, 'r': 0.36173929249119, 'f1': 0.35108030781373323}, 'combined': 0.25869075312590867, 'stategy': 1, 'epoch': 18} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33559104517907207, 'r': 0.2877917271713704, 'f1': 0.3098588244624659}, 'combined': 0.19243863835037356, 'stategy': 1, 'epoch': 18} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34955593205092494, 'r': 0.3455761681186563, 'f1': 0.347554657630786}, 'combined': 0.25609290562268444, 'stategy': 1, 'epoch': 18} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3206897121656956, 'r': 0.2883352604931922, 'f1': 0.303653071206893}, 'combined': 0.1885845389600704, 'stategy': 1, 'epoch': 18} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34647341941162424, 'r': 0.331352188583413, 'f1': 0.3387441384742165}, 'combined': 0.24960094413889639, 'stategy': 1, 'epoch': 18} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3457871409331371, 'r': 0.2956087502942712, 'f1': 0.3187351400192621}, 'combined': 0.19795129748564702, 'stategy': 1, 'epoch': 18} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 18} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.36363636363636365, 'r': 0.5217391304347826, 'f1': 0.42857142857142855}, 'combined': 0.21428571428571427, 'stategy': 1, 'epoch': 18} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 18} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6} ****************************** Epoch: 19 command: python train.py --model_name coref --xlmr_model_name xlm-roberta-large --batch_size 16 --xlmr_learning_rate 2e-5 --accumulate_step 4 --max_epoch 20 --event_hidden_num 500 --p1_data_weight 0.2 --learning_rate 9e-4 2023-01-22 20:52:52.685787: step: 4/530, loss: 0.00010612226469675079 2023-01-22 20:52:53.769087: step: 8/530, loss: 0.002795103471726179 2023-01-22 20:52:54.830377: step: 12/530, loss: 0.0012319920351728797 2023-01-22 20:52:55.924249: step: 16/530, loss: 0.0014200176810845733 2023-01-22 20:52:56.994325: step: 20/530, loss: 0.0016587760765105486 2023-01-22 20:52:58.134467: step: 24/530, loss: 0.0021934101823717356 2023-01-22 20:52:59.210784: step: 28/530, loss: 0.00047815864672884345 2023-01-22 20:53:00.282649: step: 32/530, loss: 0.0005557241966016591 2023-01-22 20:53:01.382733: step: 36/530, loss: 0.0001829547982197255 2023-01-22 20:53:02.450408: step: 40/530, loss: 0.000904804328456521 2023-01-22 20:53:03.543371: step: 44/530, loss: 0.0018636543536558747 2023-01-22 20:53:04.617688: step: 48/530, loss: 0.0014137588441371918 2023-01-22 20:53:05.703912: step: 52/530, loss: 0.000891570933163166 2023-01-22 20:53:06.756443: step: 56/530, loss: 0.004370993003249168 2023-01-22 20:53:07.837357: step: 60/530, loss: 0.0031751038040965796 2023-01-22 20:53:08.945309: step: 64/530, loss: 0.00010741830919869244 2023-01-22 20:53:10.035585: step: 68/530, loss: 4.526889824774116e-05 2023-01-22 20:53:11.129107: step: 72/530, loss: 0.001225336454808712 2023-01-22 20:53:12.209811: step: 76/530, loss: 0.00047454051673412323 2023-01-22 20:53:13.281119: step: 80/530, loss: 0.00041128124576061964 2023-01-22 20:53:14.362640: step: 84/530, loss: 0.006240918301045895 2023-01-22 20:53:15.430819: step: 88/530, loss: 0.0009851172799244523 2023-01-22 20:53:16.522674: step: 92/530, loss: 0.0006712054600939155 2023-01-22 20:53:17.618855: step: 96/530, loss: 0.0036751648876816034 2023-01-22 20:53:18.734332: step: 100/530, loss: 0.0008558948757126927 2023-01-22 20:53:19.820926: step: 104/530, loss: 6.694487819913775e-05 2023-01-22 20:53:20.902038: step: 108/530, loss: 0.0012892525410279632 2023-01-22 20:53:21.998842: step: 112/530, loss: 6.967418357817223e-06 2023-01-22 20:53:23.085368: step: 116/530, loss: 0.003482397645711899 2023-01-22 20:53:24.171603: step: 120/530, loss: 0.0016791452653706074 2023-01-22 20:53:25.253323: step: 124/530, loss: 0.00023542375129181892 2023-01-22 20:53:26.340542: step: 128/530, loss: 0.00030218009487725794 2023-01-22 20:53:27.402488: step: 132/530, loss: 0.0010352826211601496 2023-01-22 20:53:28.476064: step: 136/530, loss: 0.00018657285545486957 2023-01-22 20:53:29.576244: step: 140/530, loss: 0.00039744420791976154 2023-01-22 20:53:30.672471: step: 144/530, loss: 0.0014532171189785004 2023-01-22 20:53:31.768323: step: 148/530, loss: 0.000477830006275326 2023-01-22 20:53:32.848012: step: 152/530, loss: 0.001896329689770937 2023-01-22 20:53:33.939990: step: 156/530, loss: 0.0035541930701583624 2023-01-22 20:53:35.012719: step: 160/530, loss: 0.00035384896909818053 2023-01-22 20:53:36.122618: step: 164/530, loss: 0.00028528578695841134 2023-01-22 20:53:37.192369: step: 168/530, loss: 0.014234398491680622 2023-01-22 20:53:38.307939: step: 172/530, loss: 0.008148133754730225 2023-01-22 20:53:39.389864: step: 176/530, loss: 0.000363050407031551 2023-01-22 20:53:40.478364: step: 180/530, loss: 0.003651235718280077 2023-01-22 20:53:41.557763: step: 184/530, loss: 0.0013336684787645936 2023-01-22 20:53:42.651614: step: 188/530, loss: 6.017145642545074e-05 2023-01-22 20:53:43.751400: step: 192/530, loss: 0.000127437524497509 2023-01-22 20:53:44.849839: step: 196/530, loss: 9.177709580399096e-05 2023-01-22 20:53:45.923671: step: 200/530, loss: 0.0002827983407769352 2023-01-22 20:53:47.015088: step: 204/530, loss: 0.004648215137422085 2023-01-22 20:53:48.093866: step: 208/530, loss: 0.00022543530212715268 2023-01-22 20:53:49.175374: step: 212/530, loss: 0.007725493051111698 2023-01-22 20:53:50.259524: step: 216/530, loss: 2.5174347683787346e-05 2023-01-22 20:53:51.371344: step: 220/530, loss: 0.00765589065849781 2023-01-22 20:53:52.473943: step: 224/530, loss: 0.0007989535224623978 2023-01-22 20:53:53.563920: step: 228/530, loss: 0.0028176598716527224 2023-01-22 20:53:54.652068: step: 232/530, loss: 0.008448977954685688 2023-01-22 20:53:55.737241: step: 236/530, loss: 2.2463866116595455e-05 2023-01-22 20:53:56.804409: step: 240/530, loss: 0.002177407266572118 2023-01-22 20:53:57.905260: step: 244/530, loss: 0.00027448637410998344 2023-01-22 20:53:59.000506: step: 248/530, loss: 0.001832942827604711 2023-01-22 20:54:00.094243: step: 252/530, loss: 0.0022396331187337637 2023-01-22 20:54:01.183082: step: 256/530, loss: 6.207867409102619e-05 2023-01-22 20:54:02.299382: step: 260/530, loss: 0.0022227142471820116 2023-01-22 20:54:03.395891: step: 264/530, loss: 0.005615370813757181 2023-01-22 20:54:04.513029: step: 268/530, loss: 0.0014066529693081975 2023-01-22 20:54:05.593817: step: 272/530, loss: 0.0015630247071385384 2023-01-22 20:54:06.676442: step: 276/530, loss: 0.002412098227068782 2023-01-22 20:54:07.791263: step: 280/530, loss: 0.00030573393451049924 2023-01-22 20:54:08.889775: step: 284/530, loss: 0.0016775837866589427 2023-01-22 20:54:09.980591: step: 288/530, loss: 0.0005219071172177792 2023-01-22 20:54:11.065214: step: 292/530, loss: 0.00039185353671200573 2023-01-22 20:54:12.140942: step: 296/530, loss: 0.0001350231032120064 2023-01-22 20:54:13.228215: step: 300/530, loss: 4.602426542987814e-06 2023-01-22 20:54:14.330713: step: 304/530, loss: 0.002512165578082204 2023-01-22 20:54:15.404583: step: 308/530, loss: 0.01900053396821022 2023-01-22 20:54:16.480101: step: 312/530, loss: 0.0005610514199361205 2023-01-22 20:54:17.574992: step: 316/530, loss: 0.0025838708970695734 2023-01-22 20:54:18.652524: step: 320/530, loss: 0.007404142525047064 2023-01-22 20:54:19.776876: step: 324/530, loss: 7.23678749636747e-05 2023-01-22 20:54:20.877148: step: 328/530, loss: 0.0027387484442442656 2023-01-22 20:54:21.969296: step: 332/530, loss: 0.001112161437049508 2023-01-22 20:54:23.070458: step: 336/530, loss: 0.0007506462861783803 2023-01-22 20:54:24.174101: step: 340/530, loss: 0.0001530869340058416 2023-01-22 20:54:25.246310: step: 344/530, loss: 0.00020024762488901615 2023-01-22 20:54:26.319770: step: 348/530, loss: 0.0019760737195611 2023-01-22 20:54:27.416662: step: 352/530, loss: 0.0029700316954404116 2023-01-22 20:54:28.515470: step: 356/530, loss: 0.00216482556425035 2023-01-22 20:54:29.589876: step: 360/530, loss: 0.0017006483394652605 2023-01-22 20:54:30.692851: step: 364/530, loss: 6.0551388742169365e-05 2023-01-22 20:54:31.778011: step: 368/530, loss: 0.0011895173229277134 2023-01-22 20:54:32.860137: step: 372/530, loss: 0.00020171467622276396 2023-01-22 20:54:33.937651: step: 376/530, loss: 0.015934865921735764 2023-01-22 20:54:35.035568: step: 380/530, loss: 0.0032380190677940845 2023-01-22 20:54:36.116715: step: 384/530, loss: 0.0030422040726989508 2023-01-22 20:54:37.210697: step: 388/530, loss: 0.0017841702792793512 2023-01-22 20:54:38.320551: step: 392/530, loss: 9.812969801714644e-05 2023-01-22 20:54:39.398677: step: 396/530, loss: 0.019144121557474136 2023-01-22 20:54:40.476715: step: 400/530, loss: 2.2069940314395353e-05 2023-01-22 20:54:41.574405: step: 404/530, loss: 0.005186447408050299 2023-01-22 20:54:42.658599: step: 408/530, loss: 0.0006216090405359864 2023-01-22 20:54:43.736789: step: 412/530, loss: 0.0024480412248522043 2023-01-22 20:54:44.823139: step: 416/530, loss: 2.526305615901947e-05 2023-01-22 20:54:45.878319: step: 420/530, loss: 0.0002451435138937086 2023-01-22 20:54:46.952757: step: 424/530, loss: 0.00018999732856173068 2023-01-22 20:54:48.041323: step: 428/530, loss: 0.00024223285436164588 2023-01-22 20:54:49.111987: step: 432/530, loss: 0.00017848741845227778 2023-01-22 20:54:50.195346: step: 436/530, loss: 8.253068517660722e-05 2023-01-22 20:54:51.305956: step: 440/530, loss: 8.181794692063704e-05 2023-01-22 20:54:52.418134: step: 444/530, loss: 0.0002570562355685979 2023-01-22 20:54:53.518717: step: 448/530, loss: 0.006813338026404381 2023-01-22 20:54:54.609461: step: 452/530, loss: 0.0002035939833149314 2023-01-22 20:54:55.691726: step: 456/530, loss: 9.507857612334192e-05 2023-01-22 20:54:56.757004: step: 460/530, loss: 0.000119017917313613 2023-01-22 20:54:57.838540: step: 464/530, loss: 0.012260710820555687 2023-01-22 20:54:58.903843: step: 468/530, loss: 0.0008721818448975682 2023-01-22 20:54:59.984605: step: 472/530, loss: 0.003999961540102959 2023-01-22 20:55:01.058211: step: 476/530, loss: 0.0023704753257334232 2023-01-22 20:55:02.128753: step: 480/530, loss: 0.0006542131886817515 2023-01-22 20:55:03.211609: step: 484/530, loss: 0.0005305339582264423 2023-01-22 20:55:04.316064: step: 488/530, loss: 0.000548834796063602 2023-01-22 20:55:05.393288: step: 492/530, loss: 9.316128125647083e-05 2023-01-22 20:55:06.461410: step: 496/530, loss: 0.0001876260939752683 2023-01-22 20:55:07.565505: step: 500/530, loss: 0.00029482279205694795 2023-01-22 20:55:08.631294: step: 504/530, loss: 0.0027160996105521917 2023-01-22 20:55:09.732691: step: 508/530, loss: 0.004169796593487263 2023-01-22 20:55:10.832078: step: 512/530, loss: 0.00419542146846652 2023-01-22 20:55:11.933019: step: 516/530, loss: 0.001662172027863562 2023-01-22 20:55:13.012685: step: 520/530, loss: 0.005924543831497431 2023-01-22 20:55:14.100806: step: 524/530, loss: 0.0092924814671278 2023-01-22 20:55:15.183449: step: 528/530, loss: 0.0023686615750193596 2023-01-22 20:55:16.264555: step: 532/530, loss: 5.9015434089815244e-05 2023-01-22 20:55:17.400416: step: 536/530, loss: 0.0017717560986056924 2023-01-22 20:55:18.486994: step: 540/530, loss: 1.6681902707205154e-05 2023-01-22 20:55:19.592850: step: 544/530, loss: 0.00023030232114251703 2023-01-22 20:55:20.689680: step: 548/530, loss: 0.0010691189672797918 2023-01-22 20:55:21.780685: step: 552/530, loss: 7.2947092121467e-05 2023-01-22 20:55:22.875944: step: 556/530, loss: 2.7744817998609506e-06 2023-01-22 20:55:23.982685: step: 560/530, loss: 0.005825372412800789 2023-01-22 20:55:25.071853: step: 564/530, loss: 0.0008699214085936546 2023-01-22 20:55:26.149586: step: 568/530, loss: 0.001545156235806644 2023-01-22 20:55:27.247354: step: 572/530, loss: 0.0002815865445882082 2023-01-22 20:55:28.324799: step: 576/530, loss: 0.00023228765348903835 2023-01-22 20:55:29.394486: step: 580/530, loss: 0.0028442859183996916 2023-01-22 20:55:30.506045: step: 584/530, loss: 0.0023350215051323175 2023-01-22 20:55:31.590550: step: 588/530, loss: 0.0016820277087390423 2023-01-22 20:55:32.673079: step: 592/530, loss: 0.0029673816170543432 2023-01-22 20:55:33.775639: step: 596/530, loss: 0.007681077811866999 2023-01-22 20:55:34.881341: step: 600/530, loss: 0.0013397708535194397 2023-01-22 20:55:35.981223: step: 604/530, loss: 0.009949568659067154 2023-01-22 20:55:37.067049: step: 608/530, loss: 0.0012124726781621575 2023-01-22 20:55:38.153370: step: 612/530, loss: 0.0006463738391175866 2023-01-22 20:55:39.253682: step: 616/530, loss: 0.0006983615458011627 2023-01-22 20:55:40.337320: step: 620/530, loss: 0.0014640305889770389 2023-01-22 20:55:41.427146: step: 624/530, loss: 0.009332627058029175 2023-01-22 20:55:42.539350: step: 628/530, loss: 0.005885405000299215 2023-01-22 20:55:43.612000: step: 632/530, loss: 0.00014350692799780518 2023-01-22 20:55:44.683768: step: 636/530, loss: 0.008285566233098507 2023-01-22 20:55:45.762056: step: 640/530, loss: 0.0022046321537345648 2023-01-22 20:55:46.835297: step: 644/530, loss: 0.0009495335398241878 2023-01-22 20:55:47.905568: step: 648/530, loss: 0.0006517135188914835 2023-01-22 20:55:48.992622: step: 652/530, loss: 0.00010133364412467927 2023-01-22 20:55:50.089736: step: 656/530, loss: 0.0028543220832943916 2023-01-22 20:55:51.185292: step: 660/530, loss: 0.0031247297301888466 2023-01-22 20:55:52.265551: step: 664/530, loss: 0.003758001606911421 2023-01-22 20:55:53.371609: step: 668/530, loss: 0.0018406884046271443 2023-01-22 20:55:54.469500: step: 672/530, loss: 0.0063645802438259125 2023-01-22 20:55:55.559843: step: 676/530, loss: 0.0034332971554249525 2023-01-22 20:55:56.670873: step: 680/530, loss: 0.009605745784938335 2023-01-22 20:55:57.765877: step: 684/530, loss: 0.00012636395695153624 2023-01-22 20:55:58.865270: step: 688/530, loss: 0.0013792074751108885 2023-01-22 20:55:59.940271: step: 692/530, loss: 0.0034518863540142775 2023-01-22 20:56:01.054441: step: 696/530, loss: 0.0015571805415675044 2023-01-22 20:56:02.140583: step: 700/530, loss: 0.002138337818905711 2023-01-22 20:56:03.229160: step: 704/530, loss: 0.0003091080579906702 2023-01-22 20:56:04.317783: step: 708/530, loss: 0.0021379266399890184 2023-01-22 20:56:05.396644: step: 712/530, loss: 0.0001398646563757211 2023-01-22 20:56:06.473029: step: 716/530, loss: 0.0006683410611003637 2023-01-22 20:56:07.577921: step: 720/530, loss: 0.0028443525079637766 2023-01-22 20:56:08.656054: step: 724/530, loss: 0.014140930958092213 2023-01-22 20:56:09.727582: step: 728/530, loss: 6.861837755423039e-05 2023-01-22 20:56:10.827672: step: 732/530, loss: 0.006302974186837673 2023-01-22 20:56:11.911717: step: 736/530, loss: 8.41275614220649e-05 2023-01-22 20:56:13.000216: step: 740/530, loss: 0.0009295594063587487 2023-01-22 20:56:14.103361: step: 744/530, loss: 5.107237370793882e-07 2023-01-22 20:56:15.197122: step: 748/530, loss: 0.017124244943261147 2023-01-22 20:56:16.282856: step: 752/530, loss: 0.0032133159693330526 2023-01-22 20:56:17.373801: step: 756/530, loss: 0.000350703252479434 2023-01-22 20:56:18.486581: step: 760/530, loss: 0.0019325226312503219 2023-01-22 20:56:19.578638: step: 764/530, loss: 1.0375431884313002e-05 2023-01-22 20:56:20.677083: step: 768/530, loss: 0.003244813997298479 2023-01-22 20:56:21.748898: step: 772/530, loss: 0.0023170344065874815 2023-01-22 20:56:22.819553: step: 776/530, loss: 0.0005471422919072211 2023-01-22 20:56:23.888540: step: 780/530, loss: 1.1085880032624118e-05 2023-01-22 20:56:24.966225: step: 784/530, loss: 0.000662175239995122 2023-01-22 20:56:26.044530: step: 788/530, loss: 0.0012159064644947648 2023-01-22 20:56:27.120169: step: 792/530, loss: 0.0001026913887471892 2023-01-22 20:56:28.207152: step: 796/530, loss: 0.00013545122055802494 2023-01-22 20:56:29.289586: step: 800/530, loss: 0.00039481211570091546 2023-01-22 20:56:30.356805: step: 804/530, loss: 1.8506450942368247e-05 2023-01-22 20:56:31.437750: step: 808/530, loss: 0.0007518731872551143 2023-01-22 20:56:32.532550: step: 812/530, loss: 0.005355015397071838 2023-01-22 20:56:33.652588: step: 816/530, loss: 0.009262152016162872 2023-01-22 20:56:34.734699: step: 820/530, loss: 0.002548203570768237 2023-01-22 20:56:35.838388: step: 824/530, loss: 0.002876387210562825 2023-01-22 20:56:36.942315: step: 828/530, loss: 0.0020748015958815813 2023-01-22 20:56:38.027726: step: 832/530, loss: 0.0003181732026860118 2023-01-22 20:56:39.117278: step: 836/530, loss: 0.002926662564277649 2023-01-22 20:56:40.193895: step: 840/530, loss: 0.0003673312603496015 2023-01-22 20:56:41.265669: step: 844/530, loss: 0.0016110616270452738 2023-01-22 20:56:42.367467: step: 848/530, loss: 0.0030272037256509066 2023-01-22 20:56:43.459189: step: 852/530, loss: 0.003720643697306514 2023-01-22 20:56:44.579834: step: 856/530, loss: 0.003420489374548197 2023-01-22 20:56:45.688299: step: 860/530, loss: 0.000681612640619278 2023-01-22 20:56:46.759489: step: 864/530, loss: 0.0010235266527161002 2023-01-22 20:56:47.855886: step: 868/530, loss: 1.1331835594319273e-06 2023-01-22 20:56:48.931397: step: 872/530, loss: 0.008483139798045158 2023-01-22 20:56:50.018186: step: 876/530, loss: 0.0013104387326166034 2023-01-22 20:56:51.124567: step: 880/530, loss: 0.0011970880441367626 2023-01-22 20:56:52.195805: step: 884/530, loss: 6.7724345171882305e-06 2023-01-22 20:56:53.257556: step: 888/530, loss: 0.001854976057074964 2023-01-22 20:56:54.340367: step: 892/530, loss: 2.076085911539849e-05 2023-01-22 20:56:55.472435: step: 896/530, loss: 0.00039890181506052613 2023-01-22 20:56:56.549177: step: 900/530, loss: 0.0029576276428997517 2023-01-22 20:56:57.610941: step: 904/530, loss: 0.00693677319213748 2023-01-22 20:56:58.687407: step: 908/530, loss: 6.96541610523127e-05 2023-01-22 20:56:59.755046: step: 912/530, loss: 0.003066401928663254 2023-01-22 20:57:00.827210: step: 916/530, loss: 0.0022195763885974884 2023-01-22 20:57:01.916007: step: 920/530, loss: 0.006827932316809893 2023-01-22 20:57:03.012272: step: 924/530, loss: 0.0006443933816626668 2023-01-22 20:57:04.090233: step: 928/530, loss: 0.0010862374911084771 2023-01-22 20:57:05.166969: step: 932/530, loss: 0.001978747546672821 2023-01-22 20:57:06.253301: step: 936/530, loss: 0.0017067306907847524 2023-01-22 20:57:07.328041: step: 940/530, loss: 0.0002453155757393688 2023-01-22 20:57:08.423514: step: 944/530, loss: 0.0022631175816059113 2023-01-22 20:57:09.494379: step: 948/530, loss: 0.01073909830302 2023-01-22 20:57:10.568480: step: 952/530, loss: 2.1372539777075872e-05 2023-01-22 20:57:11.654711: step: 956/530, loss: 0.0018166899681091309 2023-01-22 20:57:12.758703: step: 960/530, loss: 0.0018802545964717865 2023-01-22 20:57:13.853713: step: 964/530, loss: 0.00030414227512665093 2023-01-22 20:57:14.946618: step: 968/530, loss: 0.049407340586185455 2023-01-22 20:57:16.037968: step: 972/530, loss: 0.002354665659368038 2023-01-22 20:57:17.114134: step: 976/530, loss: 0.0006467264611274004 2023-01-22 20:57:18.217909: step: 980/530, loss: 0.0002191751846112311 2023-01-22 20:57:19.297097: step: 984/530, loss: 1.0901581845246255e-05 2023-01-22 20:57:20.390339: step: 988/530, loss: 0.010003658942878246 2023-01-22 20:57:21.476280: step: 992/530, loss: 0.0028742491267621517 2023-01-22 20:57:22.580929: step: 996/530, loss: 0.003459608880802989 2023-01-22 20:57:23.674793: step: 1000/530, loss: 0.009734617546200752 2023-01-22 20:57:24.749044: step: 1004/530, loss: 0.004015708342194557 2023-01-22 20:57:25.833025: step: 1008/530, loss: 0.003532921662554145 2023-01-22 20:57:26.907053: step: 1012/530, loss: 0.005811508744955063 2023-01-22 20:57:28.001884: step: 1016/530, loss: 0.00032728290534578264 2023-01-22 20:57:29.102008: step: 1020/530, loss: 0.005041017197072506 2023-01-22 20:57:30.187060: step: 1024/530, loss: 0.000962086021900177 2023-01-22 20:57:31.282606: step: 1028/530, loss: 0.0015051723457872868 2023-01-22 20:57:32.374214: step: 1032/530, loss: 0.004779349081218243 2023-01-22 20:57:33.452272: step: 1036/530, loss: 0.0036869365721940994 2023-01-22 20:57:34.551925: step: 1040/530, loss: 0.004515713546425104 2023-01-22 20:57:35.647526: step: 1044/530, loss: 0.003777437610551715 2023-01-22 20:57:36.737038: step: 1048/530, loss: 0.033518899232149124 2023-01-22 20:57:37.793842: step: 1052/530, loss: 0.011628029868006706 2023-01-22 20:57:38.902686: step: 1056/530, loss: 0.0055001419968903065 2023-01-22 20:57:39.994050: step: 1060/530, loss: 0.00013690949708689004 2023-01-22 20:57:41.050539: step: 1064/530, loss: 0.00268448400311172 2023-01-22 20:57:42.124519: step: 1068/530, loss: 0.0015796461375430226 2023-01-22 20:57:43.216765: step: 1072/530, loss: 0.00010647771705407649 2023-01-22 20:57:44.307429: step: 1076/530, loss: 0.0041709779761731625 2023-01-22 20:57:45.400614: step: 1080/530, loss: 0.006433352828025818 2023-01-22 20:57:46.501528: step: 1084/530, loss: 0.007411969359964132 2023-01-22 20:57:47.597369: step: 1088/530, loss: 0.005055057816207409 2023-01-22 20:57:48.702215: step: 1092/530, loss: 0.0061180428601801395 2023-01-22 20:57:49.831375: step: 1096/530, loss: 0.0036884101573377848 2023-01-22 20:57:50.912278: step: 1100/530, loss: 0.003087639342993498 2023-01-22 20:57:52.029734: step: 1104/530, loss: 0.0006503356853500009 2023-01-22 20:57:53.099997: step: 1108/530, loss: 0.0012748206499963999 2023-01-22 20:57:54.180304: step: 1112/530, loss: 0.015659553930163383 2023-01-22 20:57:55.248723: step: 1116/530, loss: 0.00022522902872879058 2023-01-22 20:57:56.328717: step: 1120/530, loss: 0.00029547931626439095 2023-01-22 20:57:57.408579: step: 1124/530, loss: 0.00232200906611979 2023-01-22 20:57:58.484760: step: 1128/530, loss: 0.0037394037935882807 2023-01-22 20:57:59.558624: step: 1132/530, loss: 0.00022217437799554318 2023-01-22 20:58:00.649249: step: 1136/530, loss: 0.002667974680662155 2023-01-22 20:58:01.748426: step: 1140/530, loss: 6.199646304594353e-05 2023-01-22 20:58:02.828926: step: 1144/530, loss: 0.005206217523664236 2023-01-22 20:58:03.911136: step: 1148/530, loss: 0.0010839808965101838 2023-01-22 20:58:05.003382: step: 1152/530, loss: 0.0003359429829288274 2023-01-22 20:58:06.077543: step: 1156/530, loss: 0.0031326801981776953 2023-01-22 20:58:07.182251: step: 1160/530, loss: 0.0006840827991254628 2023-01-22 20:58:08.280685: step: 1164/530, loss: 5.298924588714726e-05 2023-01-22 20:58:09.348276: step: 1168/530, loss: 0.00036467472091317177 2023-01-22 20:58:10.425576: step: 1172/530, loss: 0.0008015702478587627 2023-01-22 20:58:11.512427: step: 1176/530, loss: 0.001813840470276773 2023-01-22 20:58:12.624740: step: 1180/530, loss: 0.004003350622951984 2023-01-22 20:58:13.710141: step: 1184/530, loss: 3.4948625398101285e-05 2023-01-22 20:58:14.804086: step: 1188/530, loss: 0.001791725168004632 2023-01-22 20:58:15.885919: step: 1192/530, loss: 0.0007922702352516353 2023-01-22 20:58:16.977969: step: 1196/530, loss: 0.15773484110832214 2023-01-22 20:58:18.060742: step: 1200/530, loss: 0.0003773942880798131 2023-01-22 20:58:19.124219: step: 1204/530, loss: 0.002099961508065462 2023-01-22 20:58:20.208966: step: 1208/530, loss: 9.61387122515589e-05 2023-01-22 20:58:21.311062: step: 1212/530, loss: 0.007378213107585907 2023-01-22 20:58:22.420831: step: 1216/530, loss: 0.012547855265438557 2023-01-22 20:58:23.504814: step: 1220/530, loss: 0.003913717810064554 2023-01-22 20:58:24.600355: step: 1224/530, loss: 0.0003519150777719915 2023-01-22 20:58:25.708533: step: 1228/530, loss: 0.005848758388310671 2023-01-22 20:58:26.807449: step: 1232/530, loss: 0.0011302847415208817 2023-01-22 20:58:27.885176: step: 1236/530, loss: 0.00032962014665827155 2023-01-22 20:58:28.996556: step: 1240/530, loss: 0.0030261704232543707 2023-01-22 20:58:30.090609: step: 1244/530, loss: 0.011049726977944374 2023-01-22 20:58:31.197926: step: 1248/530, loss: 0.00032516149803996086 2023-01-22 20:58:32.278219: step: 1252/530, loss: 0.0026952135376632214 2023-01-22 20:58:33.343959: step: 1256/530, loss: 0.004448683466762304 2023-01-22 20:58:34.431008: step: 1260/530, loss: 0.004877091385424137 2023-01-22 20:58:35.498562: step: 1264/530, loss: 0.0021662248764187098 2023-01-22 20:58:36.551332: step: 1268/530, loss: 5.9905862144660205e-05 2023-01-22 20:58:37.636795: step: 1272/530, loss: 9.155741764743652e-08 2023-01-22 20:58:38.736565: step: 1276/530, loss: 0.0010946731781587005 2023-01-22 20:58:39.815356: step: 1280/530, loss: 0.0028232859913259745 2023-01-22 20:58:40.901574: step: 1284/530, loss: 1.7036798453773372e-05 2023-01-22 20:58:42.009653: step: 1288/530, loss: 0.0023632789961993694 2023-01-22 20:58:43.075784: step: 1292/530, loss: 0.0003779674007091671 2023-01-22 20:58:44.176177: step: 1296/530, loss: 0.00283479574136436 2023-01-22 20:58:45.247150: step: 1300/530, loss: 0.0018201533239334822 2023-01-22 20:58:46.329362: step: 1304/530, loss: 0.0012148297391831875 2023-01-22 20:58:47.414489: step: 1308/530, loss: 0.002993691945448518 2023-01-22 20:58:48.510921: step: 1312/530, loss: 0.00023005179536994547 2023-01-22 20:58:49.579472: step: 1316/530, loss: 0.0011218771105632186 2023-01-22 20:58:50.696405: step: 1320/530, loss: 0.021919548511505127 2023-01-22 20:58:51.772498: step: 1324/530, loss: 0.004026548471301794 2023-01-22 20:58:52.851016: step: 1328/530, loss: 0.00016143418906722218 2023-01-22 20:58:53.943169: step: 1332/530, loss: 4.627986811556184e-07 2023-01-22 20:58:55.038867: step: 1336/530, loss: 0.0022843223996460438 2023-01-22 20:58:56.143360: step: 1340/530, loss: 1.7791131540434435e-05 2023-01-22 20:58:57.233418: step: 1344/530, loss: 0.00043966970406472683 2023-01-22 20:58:58.300492: step: 1348/530, loss: 2.274669668622664e-06 2023-01-22 20:58:59.404730: step: 1352/530, loss: 0.0002892041520681232 2023-01-22 20:59:00.501884: step: 1356/530, loss: 0.010213593952357769 2023-01-22 20:59:01.592730: step: 1360/530, loss: 0.0008568572229705751 2023-01-22 20:59:02.690094: step: 1364/530, loss: 0.0035403133369982243 2023-01-22 20:59:03.777244: step: 1368/530, loss: 3.521113467286341e-05 2023-01-22 20:59:04.847032: step: 1372/530, loss: 0.0009181509376503527 2023-01-22 20:59:05.935840: step: 1376/530, loss: 1.4798672054894269e-05 2023-01-22 20:59:07.007853: step: 1380/530, loss: 0.0009366365848109126 2023-01-22 20:59:08.111606: step: 1384/530, loss: 0.004516437649726868 2023-01-22 20:59:09.193188: step: 1388/530, loss: 4.533562605502084e-05 2023-01-22 20:59:10.280851: step: 1392/530, loss: 0.004407972097396851 2023-01-22 20:59:11.352116: step: 1396/530, loss: 0.0036491043865680695 2023-01-22 20:59:12.460699: step: 1400/530, loss: 0.0002919454127550125 2023-01-22 20:59:13.532804: step: 1404/530, loss: 7.566505519207567e-05 2023-01-22 20:59:14.632468: step: 1408/530, loss: 0.0027953805401921272 2023-01-22 20:59:15.714821: step: 1412/530, loss: 0.0008610638324171305 2023-01-22 20:59:16.791426: step: 1416/530, loss: 0.00381405814550817 2023-01-22 20:59:17.879277: step: 1420/530, loss: 0.0026882088277488947 2023-01-22 20:59:18.963349: step: 1424/530, loss: 0.0 2023-01-22 20:59:20.041857: step: 1428/530, loss: 0.0005442898836918175 2023-01-22 20:59:21.131146: step: 1432/530, loss: 6.463371391873807e-05 2023-01-22 20:59:22.215112: step: 1436/530, loss: 0.000184837932465598 2023-01-22 20:59:23.298818: step: 1440/530, loss: 0.009980302304029465 2023-01-22 20:59:24.380690: step: 1444/530, loss: 0.00011968673788942397 2023-01-22 20:59:25.464560: step: 1448/530, loss: 0.00013466255040839314 2023-01-22 20:59:26.558570: step: 1452/530, loss: 0.00279190088622272 2023-01-22 20:59:27.674944: step: 1456/530, loss: 0.006928619928658009 2023-01-22 20:59:28.736186: step: 1460/530, loss: 9.136817311627965e-07 2023-01-22 20:59:29.825807: step: 1464/530, loss: 0.0032755162101238966 2023-01-22 20:59:30.924425: step: 1468/530, loss: 0.0009578948956914246 2023-01-22 20:59:32.032500: step: 1472/530, loss: 0.004956020042300224 2023-01-22 20:59:33.116135: step: 1476/530, loss: 0.0014834189787507057 2023-01-22 20:59:34.191183: step: 1480/530, loss: 0.002009877236559987 2023-01-22 20:59:35.288902: step: 1484/530, loss: 0.0029133677016943693 2023-01-22 20:59:36.384889: step: 1488/530, loss: 0.020586330443620682 2023-01-22 20:59:37.460369: step: 1492/530, loss: 0.0013607380678877234 2023-01-22 20:59:38.542422: step: 1496/530, loss: 0.0030814907513558865 2023-01-22 20:59:39.613879: step: 1500/530, loss: 0.002972833812236786 2023-01-22 20:59:40.693118: step: 1504/530, loss: 0.0015024917665868998 2023-01-22 20:59:41.798727: step: 1508/530, loss: 0.0028529074043035507 2023-01-22 20:59:42.876322: step: 1512/530, loss: 0.002402563113719225 2023-01-22 20:59:43.939691: step: 1516/530, loss: 9.545624197926372e-05 2023-01-22 20:59:45.050109: step: 1520/530, loss: 0.0005605558399111032 2023-01-22 20:59:46.132038: step: 1524/530, loss: 0.002436092123389244 2023-01-22 20:59:47.228594: step: 1528/530, loss: 0.039780210703611374 2023-01-22 20:59:48.301432: step: 1532/530, loss: 0.0001810369867598638 2023-01-22 20:59:49.399776: step: 1536/530, loss: 0.0003175641468260437 2023-01-22 20:59:50.472627: step: 1540/530, loss: 8.467099519293697e-07 2023-01-22 20:59:51.574116: step: 1544/530, loss: 0.000988020095974207 2023-01-22 20:59:52.679193: step: 1548/530, loss: 0.004215283785015345 2023-01-22 20:59:53.751490: step: 1552/530, loss: 1.9923118088627234e-06 2023-01-22 20:59:54.840170: step: 1556/530, loss: 0.0009153741411864758 2023-01-22 20:59:55.928523: step: 1560/530, loss: 0.0030492425430566072 2023-01-22 20:59:57.024737: step: 1564/530, loss: 1.3904646039009094e-06 2023-01-22 20:59:58.131168: step: 1568/530, loss: 0.0020644599571824074 2023-01-22 20:59:59.209989: step: 1572/530, loss: 0.000401181896449998 2023-01-22 21:00:00.284784: step: 1576/530, loss: 0.0018996200524270535 2023-01-22 21:00:01.359983: step: 1580/530, loss: 0.003534716786816716 2023-01-22 21:00:02.445702: step: 1584/530, loss: 6.729322922183201e-05 2023-01-22 21:00:03.522045: step: 1588/530, loss: 0.003328819992020726 2023-01-22 21:00:04.594758: step: 1592/530, loss: 0.04004179313778877 2023-01-22 21:00:05.687518: step: 1596/530, loss: 0.010661550797522068 2023-01-22 21:00:06.757376: step: 1600/530, loss: 0.0017881629755720496 2023-01-22 21:00:07.814221: step: 1604/530, loss: 0.0039047240279614925 2023-01-22 21:00:08.923693: step: 1608/530, loss: 3.2011335861170664e-05 2023-01-22 21:00:10.033400: step: 1612/530, loss: 0.00015045386680867523 2023-01-22 21:00:11.120368: step: 1616/530, loss: 4.442041245056316e-05 2023-01-22 21:00:12.203176: step: 1620/530, loss: 5.109552603244083e-06 2023-01-22 21:00:13.288263: step: 1624/530, loss: 0.0009275132906623185 2023-01-22 21:00:14.377416: step: 1628/530, loss: 0.0034423477482050657 2023-01-22 21:00:15.450673: step: 1632/530, loss: 0.0028966316021978855 2023-01-22 21:00:16.527033: step: 1636/530, loss: 0.000514811894390732 2023-01-22 21:00:17.607322: step: 1640/530, loss: 0.0007470088894478977 2023-01-22 21:00:18.703945: step: 1644/530, loss: 0.008726184256374836 2023-01-22 21:00:19.773957: step: 1648/530, loss: 0.00019980079378001392 2023-01-22 21:00:20.879665: step: 1652/530, loss: 0.006958498619496822 2023-01-22 21:00:21.966736: step: 1656/530, loss: 0.002085222862660885 2023-01-22 21:00:23.051831: step: 1660/530, loss: 0.001445403671823442 2023-01-22 21:00:24.160530: step: 1664/530, loss: 0.0021974630653858185 2023-01-22 21:00:25.225191: step: 1668/530, loss: 0.0 2023-01-22 21:00:26.318230: step: 1672/530, loss: 0.012715769000351429 2023-01-22 21:00:27.421147: step: 1676/530, loss: 0.003582859179005027 2023-01-22 21:00:28.512962: step: 1680/530, loss: 0.005014185793697834 2023-01-22 21:00:29.579932: step: 1684/530, loss: 0.00012731069000437856 2023-01-22 21:00:30.662026: step: 1688/530, loss: 0.007671989034861326 2023-01-22 21:00:31.767015: step: 1692/530, loss: 3.5964432754553854e-05 2023-01-22 21:00:32.855458: step: 1696/530, loss: 2.128567393810954e-05 2023-01-22 21:00:33.982877: step: 1700/530, loss: 0.0025053133722394705 2023-01-22 21:00:35.087641: step: 1704/530, loss: 0.005780582781881094 2023-01-22 21:00:36.181520: step: 1708/530, loss: 0.001596905873157084 2023-01-22 21:00:37.257168: step: 1712/530, loss: 1.1687239748425782e-05 2023-01-22 21:00:38.376420: step: 1716/530, loss: 0.008107785135507584 2023-01-22 21:00:39.445662: step: 1720/530, loss: 0.0016066232929006219 2023-01-22 21:00:40.517678: step: 1724/530, loss: 6.309814125415869e-06 2023-01-22 21:00:41.608178: step: 1728/530, loss: 9.108841186389327e-05 2023-01-22 21:00:42.699930: step: 1732/530, loss: 1.4966180970077403e-05 2023-01-22 21:00:43.778131: step: 1736/530, loss: 0.00019453787535894662 2023-01-22 21:00:44.832359: step: 1740/530, loss: 0.0001246624015038833 2023-01-22 21:00:45.918256: step: 1744/530, loss: 0.005154330749064684 2023-01-22 21:00:47.009309: step: 1748/530, loss: 0.00010170163295697421 2023-01-22 21:00:48.090396: step: 1752/530, loss: 0.0018698968924582005 2023-01-22 21:00:49.156252: step: 1756/530, loss: 6.83599864714779e-05 2023-01-22 21:00:50.251221: step: 1760/530, loss: 0.008800136856734753 2023-01-22 21:00:51.333870: step: 1764/530, loss: 0.0049568661488592625 2023-01-22 21:00:52.419577: step: 1768/530, loss: 0.0018267015693709254 2023-01-22 21:00:53.516904: step: 1772/530, loss: 0.005369527265429497 2023-01-22 21:00:54.594204: step: 1776/530, loss: 0.00037364373565651476 2023-01-22 21:00:55.694713: step: 1780/530, loss: 0.0002443153935018927 2023-01-22 21:00:56.789396: step: 1784/530, loss: 0.0006877300911583006 2023-01-22 21:00:57.886406: step: 1788/530, loss: 0.018640106543898582 2023-01-22 21:00:58.998835: step: 1792/530, loss: 0.002196121495217085 2023-01-22 21:01:00.072872: step: 1796/530, loss: 2.3374448119284352e-06 2023-01-22 21:01:01.167799: step: 1800/530, loss: 0.0038667176850140095 2023-01-22 21:01:02.267110: step: 1804/530, loss: 0.0031091426499187946 2023-01-22 21:01:03.388520: step: 1808/530, loss: 0.0022826758213341236 2023-01-22 21:01:04.468285: step: 1812/530, loss: 0.009245526976883411 2023-01-22 21:01:05.551021: step: 1816/530, loss: 0.00012097950821043923 2023-01-22 21:01:06.638557: step: 1820/530, loss: 5.00375208503101e-05 2023-01-22 21:01:07.715365: step: 1824/530, loss: 0.00012188960681669414 2023-01-22 21:01:08.806859: step: 1828/530, loss: 0.00023899287043605 2023-01-22 21:01:09.908830: step: 1832/530, loss: 0.0010847916128113866 2023-01-22 21:01:10.989249: step: 1836/530, loss: 0.0029559554532170296 2023-01-22 21:01:12.091629: step: 1840/530, loss: 0.00029525961144827306 2023-01-22 21:01:13.213318: step: 1844/530, loss: 0.006062031257897615 2023-01-22 21:01:14.312578: step: 1848/530, loss: 0.0027633002027869225 2023-01-22 21:01:15.413225: step: 1852/530, loss: 0.005294295493513346 2023-01-22 21:01:16.514278: step: 1856/530, loss: 0.0035847793333232403 2023-01-22 21:01:17.620312: step: 1860/530, loss: 0.000911436160095036 2023-01-22 21:01:18.691894: step: 1864/530, loss: 5.170115036889911e-05 2023-01-22 21:01:19.783920: step: 1868/530, loss: 0.0066793388687074184 2023-01-22 21:01:20.852316: step: 1872/530, loss: 0.001877503120340407 2023-01-22 21:01:21.955023: step: 1876/530, loss: 0.002873568329960108 2023-01-22 21:01:23.019753: step: 1880/530, loss: 0.0007109367288649082 2023-01-22 21:01:24.088750: step: 1884/530, loss: 0.0017746200319379568 2023-01-22 21:01:25.168252: step: 1888/530, loss: 0.02019747719168663 2023-01-22 21:01:26.230711: step: 1892/530, loss: 0.004764596465975046 2023-01-22 21:01:27.332075: step: 1896/530, loss: 0.012391520664095879 2023-01-22 21:01:28.415553: step: 1900/530, loss: 0.0039004029240459204 2023-01-22 21:01:29.549469: step: 1904/530, loss: 0.010178638622164726 2023-01-22 21:01:30.611122: step: 1908/530, loss: 0.005706189200282097 2023-01-22 21:01:31.705869: step: 1912/530, loss: 0.006951368413865566 2023-01-22 21:01:32.783396: step: 1916/530, loss: 0.009065288119018078 2023-01-22 21:01:33.866551: step: 1920/530, loss: 2.1797888621222228e-05 2023-01-22 21:01:34.952662: step: 1924/530, loss: 0.005138007458299398 2023-01-22 21:01:36.051531: step: 1928/530, loss: 0.018205001950263977 2023-01-22 21:01:37.131303: step: 1932/530, loss: 0.0029143067076802254 2023-01-22 21:01:38.227418: step: 1936/530, loss: 0.0014819448115304112 2023-01-22 21:01:39.316710: step: 1940/530, loss: 0.00012170481204520911 2023-01-22 21:01:40.419401: step: 1944/530, loss: 0.013513009063899517 2023-01-22 21:01:41.488942: step: 1948/530, loss: 0.0028930676635354757 2023-01-22 21:01:42.553571: step: 1952/530, loss: 0.002232213271781802 2023-01-22 21:01:43.642365: step: 1956/530, loss: 0.004743141587823629 2023-01-22 21:01:44.730425: step: 1960/530, loss: 0.004425340332090855 2023-01-22 21:01:45.824994: step: 1964/530, loss: 0.00034303279244340956 2023-01-22 21:01:46.915813: step: 1968/530, loss: 0.008089178241789341 2023-01-22 21:01:48.025157: step: 1972/530, loss: 0.0010775779373943806 2023-01-22 21:01:49.107557: step: 1976/530, loss: 0.0030615869909524918 2023-01-22 21:01:50.182817: step: 1980/530, loss: 1.655684478407693e-10 2023-01-22 21:01:51.318904: step: 1984/530, loss: 3.54763978975825e-05 2023-01-22 21:01:52.423276: step: 1988/530, loss: 5.670629252563231e-05 2023-01-22 21:01:53.495926: step: 1992/530, loss: 0.006418494042009115 2023-01-22 21:01:54.580958: step: 1996/530, loss: 0.006443052552640438 2023-01-22 21:01:55.653755: step: 2000/530, loss: 0.00046917388681322336 2023-01-22 21:01:56.767011: step: 2004/530, loss: 0.010000565089285374 2023-01-22 21:01:57.876839: step: 2008/530, loss: 0.001778299454599619 2023-01-22 21:01:58.956788: step: 2012/530, loss: 0.0016366541385650635 2023-01-22 21:02:00.031629: step: 2016/530, loss: 0.0017698848387226462 2023-01-22 21:02:01.131418: step: 2020/530, loss: 5.0431299314368516e-05 2023-01-22 21:02:02.195393: step: 2024/530, loss: 1.473018892284017e-05 2023-01-22 21:02:03.291688: step: 2028/530, loss: 0.0054372879676520824 2023-01-22 21:02:04.372384: step: 2032/530, loss: 0.013245935551822186 2023-01-22 21:02:05.457330: step: 2036/530, loss: 0.008621656335890293 2023-01-22 21:02:06.535438: step: 2040/530, loss: 0.0005633449763990939 2023-01-22 21:02:07.618209: step: 2044/530, loss: 0.0005284935468807817 2023-01-22 21:02:08.718739: step: 2048/530, loss: 0.007640881463885307 2023-01-22 21:02:09.800528: step: 2052/530, loss: 0.0004758746363222599 2023-01-22 21:02:10.904476: step: 2056/530, loss: 0.0018036675173789263 2023-01-22 21:02:11.996063: step: 2060/530, loss: 0.001490497961640358 2023-01-22 21:02:13.078659: step: 2064/530, loss: 0.004089886322617531 2023-01-22 21:02:14.152021: step: 2068/530, loss: 0.005039777606725693 2023-01-22 21:02:15.240563: step: 2072/530, loss: 0.0077629066072404385 2023-01-22 21:02:16.309370: step: 2076/530, loss: 0.00040686584543436766 2023-01-22 21:02:17.421030: step: 2080/530, loss: 1.979967964871321e-05 2023-01-22 21:02:18.510144: step: 2084/530, loss: 0.0017287888331338763 2023-01-22 21:02:19.591515: step: 2088/530, loss: 7.450580152834618e-10 2023-01-22 21:02:20.669741: step: 2092/530, loss: 9.442597729503177e-06 2023-01-22 21:02:21.752985: step: 2096/530, loss: 0.0002690191613510251 2023-01-22 21:02:22.820189: step: 2100/530, loss: 0.00023467732535209507 2023-01-22 21:02:23.928690: step: 2104/530, loss: 0.0056996820494532585 2023-01-22 21:02:25.045103: step: 2108/530, loss: 0.003091799793764949 2023-01-22 21:02:26.108866: step: 2112/530, loss: 0.013210326433181763 2023-01-22 21:02:27.204568: step: 2116/530, loss: 0.002925982465967536 2023-01-22 21:02:28.306329: step: 2120/530, loss: 2.0695311775398295e-07 ================================================== Loss: 0.003 -------------------- Dev Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34439964742752677, 'r': 0.35746984277582, 'f1': 0.35081304868316043}, 'combined': 0.2584938253454866, 'stategy': 1, 'epoch': 19} Test Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3329017636857124, 'r': 0.2868026074878887, 'f1': 0.30813755172184426}, 'combined': 0.1913696373851454, 'stategy': 1, 'epoch': 19} Dev Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.35111937125695253, 'r': 0.33846041859303966, 'f1': 0.34467370163967515}, 'combined': 0.2539700959450238, 'stategy': 1, 'epoch': 19} Test Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3227399871223643, 'r': 0.2885825404140626, 'f1': 0.30470699567479614}, 'combined': 0.1892390815243471, 'stategy': 1, 'epoch': 19} Dev Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3437452067669172, 'r': 0.32613397226462737, 'f1': 0.3347080883806399}, 'combined': 0.24662701249099783, 'stategy': 1, 'epoch': 19} Test Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3464304885346737, 'r': 0.2968427088332643, 'f1': 0.31972532062530223}, 'combined': 0.19856625175676668, 'stategy': 1, 'epoch': 19} Sample Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 19} Sample Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3870967741935484, 'r': 0.5217391304347826, 'f1': 0.4444444444444444}, 'combined': 0.2222222222222222, 'stategy': 1, 'epoch': 19} Sample Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 19} ================================================== Current best result: -------------------- Dev for Chinese: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.34038473737630043, 'r': 0.36363682569802114, 'f1': 0.35162680209698555}, 'combined': 0.2590934331240946, 'stategy': 1, 'epoch': 3} Test for Chinese: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.33394714661777014, 'r': 0.29100636614268593, 'f1': 0.31100151815037574}, 'combined': 0.19314831127233864, 'stategy': 1, 'epoch': 3} Chinese: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.3210227272727273, 'r': 0.4035714285714286, 'f1': 0.3575949367088607}, 'combined': 0.23839662447257381, 'stategy': 1, 'epoch': 3} -------------------- Dev for Korean: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3504253708142644, 'r': 0.3417811017049941, 'f1': 0.3460492614765262}, 'combined': 0.25498366635112457, 'stategy': 1, 'epoch': 4} Test for Korean: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.3179244390742019, 'r': 0.28710683766048106, 'f1': 0.3017307826140814}, 'combined': 0.18739069657085058, 'stategy': 1, 'epoch': 4} Korean: {'template': {'p': 0.5, 'r': 0.5, 'f1': 0.5}, 'slot': {'p': 0.3984375, 'r': 0.5543478260869565, 'f1': 0.4636363636363637}, 'combined': 0.23181818181818184, 'stategy': 1, 'epoch': 4} -------------------- Dev for Russian: {'template': {'p': 1.0, 'r': 0.5833333333333334, 'f1': 0.7368421052631579}, 'slot': {'p': 0.3447809032815958, 'r': 0.33562163829878294, 'f1': 0.34013962189126656}, 'combined': 0.25062919507777537, 'stategy': 1, 'epoch': 6} Test for Russian: {'template': {'p': 0.9516129032258065, 'r': 0.4609375, 'f1': 0.6210526315789474}, 'slot': {'p': 0.34636450813867986, 'r': 0.29610233370986844, 'f1': 0.3192673379969098}, 'combined': 0.1982818204401861, 'stategy': 1, 'epoch': 6} Russian: {'template': {'p': 1.0, 'r': 0.5, 'f1': 0.6666666666666666}, 'slot': {'p': 0.5514705882352942, 'r': 0.3232758620689655, 'f1': 0.4076086956521739}, 'combined': 0.2717391304347826, 'stategy': 1, 'epoch': 6}