diff --git a/extras/mmdeploy/configs/detection_onnxruntime_static-320x320.py b/extras/mmdeploy/configs/detection_onnxruntime_static-320x320.py index 89764dd..b9a9c4c 100644 --- a/extras/mmdeploy/configs/detection_onnxruntime_static-320x320.py +++ b/extras/mmdeploy/configs/detection_onnxruntime_static-320x320.py @@ -5,5 +5,14 @@ onnx_config = dict( ) codebase_config = dict( - post_processing=dict(score_threshold=0.3, iou_threshold=0.3), + # For later TensorRT inference, the number of output boxes needs to be as stable as possible, + # because a drop in the box count leads to a re-optimization, which takes a lot of time. + # Therefore, filter out low-confidence boxes outside the model and reduce the maximum number + # of output boxes to the smallest usable value. + post_processing=dict( + score_threshold=0.0, + confidence_threshold=0.0, + iou_threshold=0.3, + max_output_boxes_per_class=10, + ), ) diff --git a/extras/mmdeploy/configs/detection_onnxruntime_static-320x320_fp16.py b/extras/mmdeploy/configs/detection_onnxruntime_static-320x320_fp16.py index 62dff76..a5478be 100644 --- a/extras/mmdeploy/configs/detection_onnxruntime_static-320x320_fp16.py +++ b/extras/mmdeploy/configs/detection_onnxruntime_static-320x320_fp16.py @@ -5,5 +5,14 @@ onnx_config = dict( ) codebase_config = dict( - post_processing=dict(score_threshold=0.3, iou_threshold=0.3), + # For later TensorRT inference, the number of output boxes needs to be as stable as possible, + # because a drop in the box count leads to a re-optimization, which takes a lot of time. + # Therefore, reduce the maximum number of output boxes to the smallest usable value and + # filter out low-confidence boxes outside the model.
+ post_processing=dict( + score_threshold=0.0, + confidence_threshold=0.0, + iou_threshold=0.3, + max_output_boxes_per_class=10, + ), ) diff --git a/media/RESULTS.md b/media/RESULTS.md index fbe9ca9..577d94a 100644 --- a/media/RESULTS.md +++ b/media/RESULTS.md @@ -6,9 +6,9 @@ Results of the model in various experiments on different datasets. ```json { - "avg_time_2d": 0.016274028309321, - "avg_time_3d": 0.00032552096803309556, - "avg_fps": 60.24259956047411 + "avg_time_2d": 0.01254632634631658, + "avg_time_3d": 0.00036295955463991325, + "avg_fps": 77.4636186441503 } { "person_nums": { @@ -27,149 +27,149 @@ Results of the model in various experiments on different datasets. }, "mpjpe": { "count": 600, - "mean": 0.066064, - "median": 0.058463, - "std": 0.027791, - "sem": 0.001136, - "min": 0.040706, - "max": 0.189425, + "mean": 0.066275, + "median": 0.058426, + "std": 0.02768, + "sem": 0.001131, + "min": 0.040807, + "max": 0.188876, "recall-0.025": 0.0, - "recall-0.05": 0.085, - "recall-0.1": 0.936667, + "recall-0.05": 0.083333, + "recall-0.1": 0.938333, "recall-0.15": 0.95, "recall-0.25": 1.0, "recall-0.5": 1.0, "num_labels": 600, "ap-0.025": 0.0, - "ap-0.05": 0.012704, - "ap-0.1": 0.897461, - "ap-0.15": 0.915018, + "ap-0.05": 0.011533, + "ap-0.1": 0.899113, + "ap-0.15": 0.915362, "ap-0.25": 1.0, "ap-0.5": 1.0 }, "nose": { "count": 600, - "mean": 0.114664, - "median": 0.10192, - "std": 0.040958, - "sem": 0.001673, - "min": 0.027318, - "max": 0.26417, + "mean": 0.115024, + "median": 0.099737, + "std": 0.041, + "sem": 0.001675, + "min": 0.02644, + "max": 0.261025, "recall-0.025": 0.0, - "recall-0.05": 0.006667, - "recall-0.1": 0.488333, - "recall-0.15": 0.82, - "recall-0.25": 0.993333, + "recall-0.05": 0.008333, + "recall-0.1": 0.501667, + "recall-0.15": 0.808333, + "recall-0.25": 0.998333, "recall-0.5": 1.0, "num_labels": 600 }, "shoulder_left": { "count": 600, - "mean": 0.034211, - "median": 0.026464, - "std": 0.031942, - "sem": 0.001305, - "min": 0.001243, - "max": 
0.178564, - "recall-0.025": 0.47, + "mean": 0.034317, + "median": 0.026768, + "std": 0.031799, + "sem": 0.001299, + "min": 0.001234, + "max": 0.178357, + "recall-0.025": 0.456667, "recall-0.05": 0.863333, "recall-0.1": 0.946667, - "recall-0.15": 0.965, + "recall-0.15": 0.966667, "recall-0.25": 1.0, "recall-0.5": 1.0, "num_labels": 600 }, "shoulder_right": { "count": 600, - "mean": 0.049177, - "median": 0.034548, - "std": 0.042414, - "sem": 0.001733, - "min": 0.004601, - "max": 0.249061, - "recall-0.025": 0.221667, - "recall-0.05": 0.73, - "recall-0.1": 0.908333, - "recall-0.15": 0.941667, + "mean": 0.047981, + "median": 0.034263, + "std": 0.039767, + "sem": 0.001625, + "min": 0.005363, + "max": 0.24597, + "recall-0.025": 0.226667, + "recall-0.05": 0.743333, + "recall-0.1": 0.916667, + "recall-0.15": 0.948333, "recall-0.25": 1.0, "recall-0.5": 1.0, "num_labels": 600 }, "elbow_left": { "count": 600, - "mean": 0.043333, - "median": 0.034664, - "std": 0.034544, - "sem": 0.001411, - "min": 0.002445, - "max": 0.200532, - "recall-0.025": 0.238333, - "recall-0.05": 0.796667, - "recall-0.1": 0.945, - "recall-0.15": 0.953333, + "mean": 0.043526, + "median": 0.034276, + "std": 0.034786, + "sem": 0.001421, + "min": 0.003312, + "max": 0.198715, + "recall-0.025": 0.24, + "recall-0.05": 0.781667, + "recall-0.1": 0.943333, + "recall-0.15": 0.958333, "recall-0.25": 1.0, "recall-0.5": 1.0, "num_labels": 600 }, "elbow_right": { "count": 600, - "mean": 0.043379, - "median": 0.033008, - "std": 0.037384, - "sem": 0.001527, - "min": 0.00441, - "max": 0.300237, - "recall-0.025": 0.241667, - "recall-0.05": 0.828333, - "recall-0.1": 0.93, - "recall-0.15": 0.94, + "mean": 0.04376, + "median": 0.033219, + "std": 0.037126, + "sem": 0.001517, + "min": 0.006159, + "max": 0.314756, + "recall-0.025": 0.245, + "recall-0.05": 0.803333, + "recall-0.1": 0.933333, + "recall-0.15": 0.943333, "recall-0.25": 0.996667, "recall-0.5": 1.0, "num_labels": 600 }, "wrist_left": { "count": 600, - "mean": 
0.042137, - "median": 0.026475, - "std": 0.044455, - "sem": 0.001816, - "min": 0.000734, - "max": 0.289424, - "recall-0.025": 0.476667, - "recall-0.05": 0.738333, - "recall-0.1": 0.905, - "recall-0.15": 0.94, - "recall-0.25": 0.996667, + "mean": 0.044151, + "median": 0.026578, + "std": 0.047109, + "sem": 0.001925, + "min": 0.002328, + "max": 0.288425, + "recall-0.025": 0.478333, + "recall-0.05": 0.736667, + "recall-0.1": 0.883333, + "recall-0.15": 0.918333, + "recall-0.25": 0.998333, "recall-0.5": 1.0, "num_labels": 600 }, "wrist_right": { "count": 600, - "mean": 0.044742, - "median": 0.027623, - "std": 0.050977, - "sem": 0.002083, - "min": 0.001885, - "max": 0.455832, - "recall-0.025": 0.455, - "recall-0.05": 0.753333, - "recall-0.1": 0.893333, - "recall-0.15": 0.911667, - "recall-0.25": 0.996667, + "mean": 0.045218, + "median": 0.026994, + "std": 0.050213, + "sem": 0.002052, + "min": 0.002207, + "max": 0.291549, + "recall-0.025": 0.471667, + "recall-0.05": 0.766667, + "recall-0.1": 0.876667, + "recall-0.15": 0.908333, + "recall-0.25": 0.998333, "recall-0.5": 1.0, "num_labels": 600 }, "hip_left": { "count": 600, - "mean": 0.084994, - "median": 0.079686, - "std": 0.033001, - "sem": 0.001348, - "min": 0.010753, - "max": 0.232419, - "recall-0.025": 0.005, - "recall-0.05": 0.041667, - "recall-0.1": 0.855, + "mean": 0.085085, + "median": 0.079726, + "std": 0.032918, + "sem": 0.001345, + "min": 0.020039, + "max": 0.232252, + "recall-0.025": 0.006667, + "recall-0.05": 0.055, + "recall-0.1": 0.853333, "recall-0.15": 0.95, "recall-0.25": 1.0, "recall-0.5": 1.0, @@ -177,98 +177,98 @@ Results of the model in various experiments on different datasets. 
}, "hip_right": { "count": 600, - "mean": 0.108772, - "median": 0.107197, - "std": 0.025158, - "sem": 0.001028, - "min": 0.051859, - "max": 0.227885, + "mean": 0.108514, + "median": 0.106487, + "std": 0.025557, + "sem": 0.001044, + "min": 0.043182, + "max": 0.228959, "recall-0.025": 0.0, - "recall-0.05": 0.0, - "recall-0.1": 0.351667, - "recall-0.15": 0.946667, + "recall-0.05": 0.003333, + "recall-0.1": 0.358333, + "recall-0.15": 0.948333, "recall-0.25": 1.0, "recall-0.5": 1.0, "num_labels": 600 }, "knee_left": { - "count": 599, - "mean": 0.060126, - "median": 0.044568, - "std": 0.057251, - "sem": 0.002341, - "min": 0.015543, - "max": 0.407951, - "recall-0.025": 0.05, - "recall-0.05": 0.586667, - "recall-0.1": 0.918333, - "recall-0.15": 0.923333, + "count": 600, + "mean": 0.063226, + "median": 0.046357, + "std": 0.059854, + "sem": 0.002446, + "min": 0.016702, + "max": 0.474089, + "recall-0.025": 0.035, + "recall-0.05": 0.563333, + "recall-0.1": 0.881667, + "recall-0.15": 0.925, "recall-0.25": 0.98, - "recall-0.5": 0.998333, + "recall-0.5": 1.0, "num_labels": 600 }, "knee_right": { "count": 600, - "mean": 0.050346, - "median": 0.041731, - "std": 0.03615, - "sem": 0.001477, - "min": 0.01555, - "max": 0.278599, - "recall-0.025": 0.035, - "recall-0.05": 0.756667, - "recall-0.1": 0.946667, - "recall-0.15": 0.946667, + "mean": 0.050723, + "median": 0.041264, + "std": 0.036826, + "sem": 0.001505, + "min": 0.013747, + "max": 0.274, + "recall-0.025": 0.043333, + "recall-0.05": 0.745, + "recall-0.1": 0.945, + "recall-0.15": 0.945, "recall-0.25": 0.996667, "recall-0.5": 1.0, "num_labels": 600 }, "ankle_left": { - "count": 599, - "mean": 0.097233, - "median": 0.085626, - "std": 0.047643, - "sem": 0.001948, - "min": 0.050047, - "max": 0.497687, + "count": 600, + "mean": 0.097084, + "median": 0.085682, + "std": 0.046353, + "sem": 0.001894, + "min": 0.045955, + "max": 0.492226, "recall-0.025": 0.0, - "recall-0.05": 0.0, - "recall-0.1": 0.84, - "recall-0.15": 0.935, + 
"recall-0.05": 0.001667, + "recall-0.1": 0.833333, + "recall-0.15": 0.933333, "recall-0.25": 0.985, - "recall-0.5": 0.998333, + "recall-0.5": 1.0, "num_labels": 600 }, "ankle_right": { "count": 599, - "mean": 0.082942, - "median": 0.068818, - "std": 0.053498, - "sem": 0.002188, - "min": 0.02884, - "max": 0.443019, + "mean": 0.082224, + "median": 0.068812, + "std": 0.047465, + "sem": 0.001941, + "min": 0.029154, + "max": 0.404964, "recall-0.025": 0.0, "recall-0.05": 0.026667, - "recall-0.1": 0.896667, - "recall-0.15": 0.911667, - "recall-0.25": 0.978333, + "recall-0.1": 0.888333, + "recall-0.15": 0.91, + "recall-0.25": 0.985, "recall-0.5": 0.998333, "num_labels": 600 }, "joint_recalls": { "num_labels": 7800, - "recall-0.025": 0.16859, - "recall-0.05": 0.4709, - "recall-0.1": 0.83218, - "recall-0.15": 0.92923, - "recall-0.25": 0.99385, - "recall-0.5": 0.99923 + "recall-0.025": 0.16923, + "recall-0.05": 0.46833, + "recall-0.1": 0.82692, + "recall-0.15": 0.92692, + "recall-0.25": 0.99487, + "recall-0.5": 0.99974 } } { "total_parts": 8400, - "correct_parts": 8091, - "pcp": 0.963214 + "correct_parts": 8097, + "pcp": 0.963929 } ```