{ "overall_accuracy": 0.9827222924568058, "class_metrics": { "class_0_same_paragraph": { "precision": 0.995013061030634, "recall": 0.9856504351917196, "f1_score": 0.9903096194753014, "support": 4251 }, "class_1_different_paragraph": { "precision": 0.8859813084112149, "recall": 0.9575757575757575, "f1_score": 0.920388349514563, "support": 495 } }, "confusion_matrix": [ [ 4190, 61 ], [ 21, 474 ] ], "classification_report": { "Same Paragraph (0)": { "precision": 0.995013061030634, "recall": 0.9856504351917196, "f1-score": 0.9903096194753014, "support": 4251.0 }, "Different Paragraph (1)": { "precision": 0.8859813084112149, "recall": 0.9575757575757575, "f1-score": 0.920388349514563, "support": 495.0 }, "accuracy": 0.9827222924568058, "macro avg": { "precision": 0.9404971847209245, "recall": 0.9716130963837386, "f1-score": 0.9553489844949322, "support": 4746.0 }, "weighted avg": { "precision": 0.9836412284249424, "recall": 0.9827222924568058, "f1-score": 0.9830169459332522, "support": 4746.0 } }, "test_samples_count": 4746, "boundary_score_stats": { "mean": 0.14779670536518097, "std": 0.29127171635627747, "min": 0.042458675801754, "max": 0.9999679327011108 }, "evaluation_info": { "evaluation_time": "0:01:19.859698", "device_used": "cuda", "model_type": "DualPathBoundaryClassifier", "max_length": 384, "batch_size": 32, "test_file": "D:\\workstation\\AI标注\\数据清洗+json\\test_dataset.json", "trained_model_path": "D:\\workstation\\chinese-roberta-wwm-ext\\model-train-eval-NN\\model_train" } }