Merge branch 'cpp' into 'master'

Convert to cpp for faster runtime See merge request Percipiote/SimplePoseTriangulation!1
2024-10-09 08:30:16 +00:00
parent 7b426d209c fa2af31349
commit 35ac5711bf
32 changed files with 10790 additions and 3393 deletions
--- a/.gitignore
+++ b/.gitignore
@ -1,3 +1,40 @@
 spt_wrap.*
 spt.py
 *.bin
 # Prerequisites
 *.d
 # Compiled Object files
 *.slo
 *.lo
 *.o
 *.obj
 # Precompiled Headers
 *.gch
 *.pch
 # Compiled Dynamic libraries
 *.so
 *.dylib
 *.dll
 # Fortran module files
 *.mod
 *.smod
 # Compiled Static libraries
 *.lai
 *.la
 *.a
 *.lib
 # Executables
 *.exe
 *.out
 *.app
 # Byte-compiled / optimized / DLL files
 __pycache__/
 *.py[cod]
--- a/5
+++ b/5
@ -37,6 +37,11 @@ RUN python3 -c "from utils_2d_pose import load_wb_model; load_wb_model();"
 # Fix an undefined symbol error with ompi
 RUN echo "ldconfig" >> ~/.bashrc
 # Install swig and later dependencies
 RUN apt-get update && apt-get install -y --no-install-recommends build-essential
 RUN apt-get update && apt-get install -y --no-install-recommends swig
 RUN apt-get update && apt-get install -y --no-install-recommends libopencv-dev
 COPY ./skelda/ /skelda/
 RUN pip3 install --no-cache-dir -e /skelda/
--- a/README.md
+++ b/README.md
@ -34,3 +34,11 @@ Triangulation of multiple persons from multiple camera views.
  export CUDA_VISIBLE_DEVICES=0
  python3 /SimplePoseTriangulation/scripts/test_skelda_dataset.py
  ```
 <br>
 ## Debugging
 ```bash
 cd /SimplePoseTriangulation/swig/ && make all && cd ../tests/ && python3 test_interface.py
 ```
--- a/data/e1/README.md
+++ b/data/e1/README.md
@ -0,0 +1,12 @@
 Image source:
 ```bash 
 cp '/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam01/images/00002.jpg' ./c1_00002.jpg
 cp '/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam02/images/00002.jpg' ./c2_00002.jpg
 cp '/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam03/images/00002.jpg' ./c3_00002.jpg
 cp '/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam04/images/00002.jpg' ./c4_00002.jpg
 cp '/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam05/images/00002.jpg' ./c5_00002.jpg
 cp '/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam06/images/00002.jpg' ./c6_00002.jpg
 cp '/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam07/images/00002.jpg' ./c7_00002.jpg
 cp '/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam08/images/00002.jpg' ./c8_00002.jpg
 ```
--- a/data/e1/c1_00002.jpg
+++ b/data/e1/c1_00002.jpg
--- a/data/e1/c2_00002.jpg
+++ b/data/e1/c2_00002.jpg
--- a/data/e1/c3_00002.jpg
+++ b/data/e1/c3_00002.jpg
--- a/data/e1/c4_00002.jpg
+++ b/data/e1/c4_00002.jpg
--- a/data/e1/c5_00002.jpg
+++ b/data/e1/c5_00002.jpg
--- a/data/e1/c6_00002.jpg
+++ b/data/e1/c6_00002.jpg
--- a/data/e1/c7_00002.jpg
+++ b/data/e1/c7_00002.jpg
--- a/data/e1/c8_00002.jpg
+++ b/data/e1/c8_00002.jpg
--- a/data/e1/sample.json
+++ b/data/e1/sample.json
@ -0,0 +1,483 @@
 {
    "id": "006_legoassemble-000002",
    "imgpaths": [
        "/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam01/images/c1_00002.jpg",
        "/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam02/images/c2_00002.jpg",
        "/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam03/images/c3_00002.jpg",
        "/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam04/images/c4_00002.jpg",
        "/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam05/images/c5_00002.jpg",
        "/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam06/images/c6_00002.jpg",
        "/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam07/images/c7_00002.jpg",
        "/datasets/egohumans/02_legoassemble/006_legoassemble/exo/cam08/images/c8_00002.jpg"
    ],
    "dataset_name": "egohumans",
    "room_size": [
        6.0,
        5.0,
        2.0
    ],
    "room_center": [
        1.5,
        1.0,
        -0.5
    ],
    "num_persons": 3,
    "cameras": [
        {
            "type": "fisheye",
            "name": "cam01",
            "width": 3840,
            "height": 2160,
            "K": [
                [
                    1905.440429,
                    0.0,
                    1920.0
                ],
                [
                    0.0,
                    1908.738384,
                    1080.0
                ],
                [
                    0.0,
                    0.0,
                    1.0
                ]
            ],
            "DC": [
                0.022721,
                0.096403,
                -0.122399,
                0.06457
            ],
            "R": [
                [
                    -1.320967,
                    1.091159,
                    -0.053999
                ],
                [
                    0.324639,
                    0.311149,
                    -1.654174
                ],
                [
                    -1.043145,
                    -1.284934,
                    -0.446418
                ]
            ],
            "T": [
                [
                    1.938363
                ],
                [
                    2.912456
                ],
                [
                    -0.05983
                ]
            ]
        },
        {
            "type": "fisheye",
            "name": "cam02",
            "width": 3840,
            "height": 2160,
            "K": [
                [
                    1932.244518,
                    0.0,
                    1920.0
                ],
                [
                    0.0,
                    1936.559524,
                    1080.0
                ],
                [
                    0.0,
                    0.0,
                    1.0
                ]
            ],
            "DC": [
                0.038159,
                0.063352,
                -0.103183,
                0.057205
            ],
            "R": [
                [
                    -0.559664,
                    1.606496,
                    -0.210818
                ],
                [
                    0.354514,
                    -0.096222,
                    -1.674383
                ],
                [
                    -1.58101,
                    -0.590262,
                    -0.300823
                ]
            ],
            "T": [
                [
                    3.363792
                ],
                [
                    2.221809
                ],
                [
                    -0.150734
                ]
            ]
        },
        {
            "type": "fisheye",
            "name": "cam03",
            "width": 3840,
            "height": 2160,
            "K": [
                [
                    1894.357534,
                    0.0,
                    1920.0
                ],
                [
                    0.0,
                    1895.186619,
                    1080.0
                ],
                [
                    0.0,
                    0.0,
                    1.0
                ]
            ],
            "DC": [
                0.050168,
                0.041318,
                -0.141156,
                0.109365
            ],
            "R": [
                [
                    1.33355,
                    1.075326,
                    -0.06178
                ],
                [
                    0.254785,
                    -0.410461,
                    -1.64472
                ],
                [
                    -1.046531,
                    1.270312,
                    -0.479142
                ]
            ],
            "T": [
                [
                    3.350025
                ],
                [
                    -0.796138
                ],
                [
                    -0.123788
                ]
            ]
        },
        {
            "type": "fisheye",
            "name": "cam04",
            "width": 3840,
            "height": 2160,
            "K": [
                [
                    1954.001155,
                    0.0,
                    1920.0
                ],
                [
                    0.0,
                    1961.448327,
                    1080.0
                ],
                [
                    0.0,
                    0.0,
                    1.0
                ]
            ],
            "DC": [
                0.002428,
                0.182701,
                -0.217826,
                0.085325
            ],
            "R": [
                [
                    -1.267021,
                    -1.154138,
                    -0.033506
                ],
                [
                    -0.150745,
                    0.214669,
                    -1.694016
                ],
                [
                    1.144741,
                    -1.249152,
                    -0.260162
                ]
            ],
            "T": [
                [
                    -0.017013
                ],
                [
                    3.310275
                ],
                [
                    -0.109274
                ]
            ]
        },
        {
            "type": "fisheye",
            "name": "cam05",
            "width": 3840,
            "height": 2160,
            "K": [
                [
                    1935.020765,
                    0.0,
                    1920.0
                ],
                [
                    0.0,
                    1932.219587,
                    1080.0
                ],
                [
                    0.0,
                    0.0,
                    1.0
                ]
            ],
            "DC": [
                0.058948,
                -0.009451,
                0.031702,
                -0.02819
            ],
            "R": [
                [
                    1.702269,
                    0.12581,
                    -0.157957
                ],
                [
                    -0.14946,
                    -0.116741,
                    -1.703681
                ],
                [
                    -0.135795,
                    1.705591,
                    -0.104959
                ]
            ],
            "T": [
                [
                    1.404604
                ],
                [
                    -1.586799
                ],
                [
                    -0.106577
                ]
            ]
        },
        {
            "type": "fisheye",
            "name": "cam06",
            "width": 3840,
            "height": 2160,
            "K": [
                [
                    1922.984553,
                    0.0,
                    1920.0
                ],
                [
                    0.0,
                    1913.40327,
                    1080.0
                ],
                [
                    0.0,
                    0.0,
                    1.0
                ]
            ],
            "DC": [
                0.051617,
                -0.019883,
                0.131883,
                -0.148917
            ],
            "R": [
                [
                    0.859208,
                    -1.483123,
                    -0.024598
                ],
                [
                    -0.452399,
                    -0.234941,
                    -1.636654
                ],
                [
                    1.412655,
                    0.826829,
                    -0.509173
                ]
            ],
            "T": [
                [
                    -1.069183
                ],
                [
                    0.162843
                ],
                [
                    -0.081835
                ]
            ]
        },
        {
            "type": "fisheye",
            "name": "cam07",
            "width": 3840,
            "height": 2160,
            "K": [
                [
                    1921.007178,
                    0.0,
                    1920.0
                ],
                [
                    0.0,
                    1922.985943,
                    1080.0
                ],
                [
                    0.0,
                    0.0,
                    1.0
                ]
            ],
            "DC": [
                0.012135,
                0.192931,
                -0.334768,
                0.182519
            ],
            "R": [
                [
                    -0.069061,
                    1.712667,
                    -0.022347
                ],
                [
                    0.123643,
                    -0.017322,
                    -1.709652
                ],
                [
                    -1.708344,
                    -0.07049,
                    -0.122835
                ]
            ],
            "T": [
                [
                    4.379272
                ],
                [
                    1.482245
                ],
                [
                    -0.111096
                ]
            ]
        },
        {
            "type": "fisheye",
            "name": "cam08",
            "width": 3840,
            "height": 2160,
            "K": [
                [
                    1944.872901,
                    0.0,
                    1920.0
                ],
                [
                    0.0,
                    1952.784761,
                    1080.0
                ],
                [
                    0.0,
                    0.0,
                    1.0
                ]
            ],
            "DC": [
                -0.011357,
                0.225262,
                -0.308,
                0.148322
            ],
            "R": [
                [
                    -0.32595,
                    -1.682675,
                    -0.029302
                ],
                [
                    -0.137145,
                    0.056305,
                    -1.707782
                ],
                [
                    1.677333,
                    -0.322385,
                    -0.145329
                ]
            ],
            "T": [
                [
                    -1.092642
                ],
                [
                    1.923018
                ],
                [
                    -0.068911
                ]
            ]
        }
    ]
 }
--- a/media/2d-k.png
+++ b/media/2d-k.png
--- a/media/2d-p.png
+++ b/media/2d-p.png
--- a/media/3d-p.png
+++ b/media/3d-p.png
--- a/media/RESULTS.md
+++ b/media/RESULTS.md
--- a/scripts/test_skelda_dataset.py
+++ b/scripts/test_skelda_dataset.py
@ -1,5 +1,6 @@
 import json
 import os
 import sys
 import time
 import cv2
@ -8,10 +9,12 @@ import numpy as np
 import tqdm
 import test_triangulate
 import triangulate_poses
 import utils_2d_pose
 from skelda import evals, utils_pose
 sys.path.append("/SimplePoseTriangulation/swig/")
 import spt
 # ==================================================================================================
 # dataset_use = "panoptic"
@ -185,111 +188,6 @@ def load_labels(dataset: dict):
 # ==================================================================================================
 def add_extra_joints(poses3D, poses2D, joint_names_3d):
    """Fill an undetected "head" joint with the midpoint of both ear joints.

    Only persons whose 3D head score is exactly 0 are touched. For those, the
    3D head and the head of every 2D view are replaced by the average of
    "ear_left" and "ear_right", provided both ears score above 0.1; the new
    head score is the lower of the two ear scores. The arrays are modified
    in place.

    Args:
        poses3D: Array indexed as [person, joint, (x, y, z, score)].
        poses2D: Sequence of per-view arrays indexed as [person, joint, (x, y, score)].
        joint_names_3d: Joint names, must contain "head", "ear_left", "ear_right".

    Returns:
        The same (poses3D, poses2D) objects that were passed in.
    """
    head_id = joint_names_3d.index("head")
    left_id = joint_names_3d.index("ear_left")
    right_id = joint_names_3d.index("ear_right")
    for person in range(len(poses3D)):
        if poses3D[person, head_id, 3] != 0:
            # Head already has a score, keep it
            continue
        left_3d = poses3D[person, left_id]
        right_3d = poses3D[person, right_id]
        if left_3d[3] > 0.1 and right_3d[3] > 0.1:
            head_3d = (left_3d + right_3d) / 2
            head_3d[3] = min(left_3d[3], right_3d[3])
            poses3D[person, head_id] = head_3d
        # The 2D heads are handled independently of the 3D result above
        for view in poses2D:
            left_2d = view[person, left_id]
            right_2d = view[person, right_id]
            if not (left_2d[2] > 0.1 and right_2d[2] > 0.1):
                continue
            head_2d = (left_2d + right_2d) / 2
            head_2d[2] = min(left_2d[2], right_2d[2])
            view[person, head_id] = head_2d
    return poses3D, poses2D
 # ==================================================================================================
 def add_missing_joints(poses3D, joint_names_3d):
    """Replace missing joints with their nearest adjacent joints

    A joint is treated as missing when its score is exactly 0. It is then
    placed at the mean of its adjacent joints that score above 0.1, or at the
    mean of all valid joints of that person if no adjacent joint is valid, and
    its score is set to 0.1. Joints without an adjacency rule and persons
    without any valid joint are left untouched. The array is modified in place.

    Args:
        poses3D: Array indexed as [person, joint, (x, y, z, score)].
        joint_names_3d: Joint names in the order of the joint axis.

    Returns:
        The same poses3D object that was passed in.
    """
    adjacents = {
        "hip_right": ["hip_middle", "hip_left"],
        "hip_left": ["hip_middle", "hip_right"],
        "knee_right": ["hip_right", "knee_left"],
        "knee_left": ["hip_left", "knee_right"],
        "ankle_right": ["knee_right", "ankle_left"],
        "ankle_left": ["knee_left", "ankle_right"],
        "shoulder_right": ["shoulder_middle", "shoulder_left"],
        "shoulder_left": ["shoulder_middle", "shoulder_right"],
        "elbow_right": ["shoulder_right", "hip_right"],
        "elbow_left": ["shoulder_left", "hip_left"],
        "wrist_right": ["elbow_right"],
        "wrist_left": ["elbow_left"],
        "nose": ["shoulder_middle", "shoulder_right", "shoulder_left"],
        "head": ["shoulder_middle", "shoulder_right", "shoulder_left"],
        "foot_*_left_*": ["ankle_left"],
        "foot_*_right_*": ["ankle_right"],
        "face_*": ["nose"],
        "hand_*_left_*": ["wrist_left"],
        "hand_*_right_*": ["wrist_right"],
    }
    def adjacency_key(name):
        """Map a joint name to its key in `adjacents`, or "" if there is no rule"""
        prefix = name[0:5]
        if prefix == "foot_" and "_left" in name:
            return "foot_*_left_*"
        if prefix == "foot_" and "_right" in name:
            return "foot_*_right_*"
        if prefix == "face_":
            return "face_*"
        if prefix == "hand_" and "_left" in name:
            return "hand_*_left_*"
        if prefix == "hand_" and "_right" in name:
            return "hand_*_right_*"
        if name in adjacents:
            return name
        return ""
    # The rule of a joint depends only on its name, so resolve it once for all persons
    adnames = [adjacency_key(name) for name in joint_names_3d]
    for i in range(len(poses3D)):
        valid_joints = np.where(poses3D[i, :, 3] > 0.1)[0]
        if len(valid_joints) == 0:
            continue
        # Fallback position, taken from the joints that were valid before any filling
        body_center = np.mean(poses3D[i, valid_joints, :3], axis=0)
        for j, adname in enumerate(adnames):
            if adname == "" or poses3D[i, j, 3] != 0:
                continue
            # Joints filled earlier carry a score of 0.1 and therefore do not
            # count as valid neighbours here
            adjacent_joints = [
                poses3D[i, joint_names_3d.index(a), :] for a in adjacents[adname]
            ]
            adjacent_joints = [a[0:3] for a in adjacent_joints if a[3] > 0.1]
            if len(adjacent_joints) > 0:
                poses3D[i, j, :3] = np.mean(adjacent_joints, axis=0)
            else:
                poses3D[i, j, :3] = body_center
            poses3D[i, j, 3] = 0.1
    return poses3D
 # ==================================================================================================
 def main():
    global joint_names_3d, eval_joints
@ -316,20 +214,44 @@ def main():
    # Print a dataset sample for debugging
    print(labels[0])
    minscores = {
        # Choose this depending on the fraction of invalid/missing persons
        # A higher value reduces the number of proposals
        "panoptic": 0.94,
        "human36m": 0.94,
        "mvor": 0.86,
        "campus": 0.96,
        "shelf": 0.96,
        "ikeaasm": 0.89,
        "tsinghua": 0.96,
        "human36m_wb": 0.94,
        "koarob": 0.91,
    }
    minscore = minscores.get(dataset_use, 0.95)
    min_group_sizes = {
        # If the number of cameras is high, and the views are not occluded, use a higher value
        "panoptic": 1,
        "shelf": 2,
        "tsinghua": 2,
    }
    min_group_size = min_group_sizes.get(dataset_use, 1)
    if dataset_use == "panoptic" and len(datasets["panoptic"]["cams"]) == 10:
        min_group_size = 4
    print("\nRunning predictions ...")
    all_poses = []
    all_ids = []
    all_paths = []
    times = []
-    last_poses_3d = np.array([])
+    triangulator = spt.Triangulator(min_score=minscore, min_group_size=min_group_size)
    old_scene = ""
    for label in tqdm.tqdm(labels):
        images_2d = []
-        if old_scene != label.get("scene", ""):
+        if old_scene != label.get("scene", "") or dataset_use == "human36m_wb":
            # Reset last poses if scene changes
            old_scene = label.get("scene", "")
-            last_poses_3d = np.array([])
+            triangulator.reset()
        try:
            start = time.time()
@ -355,62 +277,34 @@ def main():
                    cam["K"][0][2] = cam["K"][0][2] * (1000 / ishape[1])
                    images_2d[i] = cv2.resize(img, (1000, 1000))
        roomparams = {
            "room_size": label["room_size"],
            "room_center": label["room_center"],
        }
        start = time.time()
        poses_2d = utils_2d_pose.get_2d_pose(kpt_model, images_2d)
        poses_2d = test_triangulate.update_keypoints(poses_2d, joint_names_2d)
        time_2d = time.time() - start
        print("2D time:", time_2d)
        minscores = {
            # Choose this depending on the fraction of invalid/missing persons
            # A higher value reduces the number of proposals
            "panoptic": 0.94,
            "human36m": 0.94,
            "mvor": 0.86,
            "campus": 0.96,
            "shelf": 0.96,
            "ikeaasm": 0.89,
            "tsinghua": 0.96,
            "human36m_wb": 0.94,
        }
        minscore = minscores.get(dataset_use, 0.95)
        start = time.time()
        if sum(np.sum(p) for p in poses_2d) == 0:
-            poses3D = np.zeros([1, len(joint_names_3d), 4])
+            poses3D = np.zeros([1, len(joint_names_3d), 4]).tolist()
            poses2D = np.zeros([len(images_2d), 1, len(joint_names_3d), 3])
        else:
-            poses3D = triangulate_poses.get_3d_pose(
+            spt_cameras = spt.convert_cameras(label["cameras"])
-                poses_2d, label["cameras"], roomparams, joint_names_2d, last_poses_3d, minscore
+            roomparams = [label["room_size"], label["room_center"]]
            poses3D = triangulator.triangulate_poses(
                poses_2d, spt_cameras, roomparams, joint_names_2d
            )
            poses2D = []
            for cam in label["cameras"]:
                poses_2d, _ = utils_pose.project_poses(poses3D, cam)
                poses2D.append(poses_2d)
            poses3D, poses2D = add_extra_joints(poses3D, poses2D, joint_names_3d)
            poses3D, poses2D = test_triangulate.filter_poses(
                poses3D,
                poses2D,
                roomparams,
                joint_names_3d,
                drop_few_limbs=(dataset_use != "mvor"),
            )
            poses3D = add_missing_joints(poses3D, joint_names_3d)
        last_poses_3d = poses3D
        time_3d = time.time() - start
        print("3D time:", time_3d)
-        all_poses.append(poses3D)
+        all_poses.append(np.array(poses3D))
        all_ids.append(label["id"])
        all_paths.append(label["imgpaths"])
        times.append((time_2d, time_3d))
    # Print per-step triangulation timings
    print("")
    triangulator.print_stats()
    warmup_iters = 10
    if len(times) > warmup_iters:
        times = times[warmup_iters:]
--- a/scripts/test_triangulate.py
+++ b/scripts/test_triangulate.py
@ -1,6 +1,8 @@
 import copy
 import json
 import os
 import sys
 import time
 from typing import List
 import cv2
@ -8,10 +10,12 @@ import matplotlib
 import numpy as np
 import draw_utils
 import triangulate_poses
 import utils_2d_pose
 from skelda import utils_pose
 sys.path.append("/SimplePoseTriangulation/swig/")
 import spt
 # ==================================================================================================
 filepath = os.path.dirname(os.path.realpath(__file__)) + "/"
@ -224,124 +228,6 @@ def load_image(path: str):
 # ==================================================================================================
 def filter_poses(poses3D, poses2D, roomparams, joint_names, drop_few_limbs=True):
    """Mark implausible person detections by lowering their scores.

    Rejected poses are not removed: they keep their coordinates, but every
    score (last column) is set to 0.001 in the 3D result and in each 2D view.
    A pose is rejected if it has fewer than 5 valid joints (score > 0.1), an
    implausible spatial extent, lies outside the room, has too few main limbs
    (optional) or an implausible average limb length. The limb checks use the
    module-level `main_limbs` pairs of joint names.

    Args:
        poses3D: Poses indexed as [person][joint] with (x, y, z, score) rows.
        poses2D: Per-view poses, indexed as poses2D[view][person].
        roomparams: Dict with the keys "room_size" and "room_center".
        joint_names: Joint names in pose order.
        drop_few_limbs: Also reject poses with fewer than 3 detected main limbs.

    Returns:
        Tuple (poses3D, poses2D) as numpy arrays. If no pose remains, arrays
        of zeros holding a single person are returned instead.
    """
    drop = set()
    for i, pose in enumerate(poses3D):
        pose = np.array(pose)
        valid_joints = [j for j in pose if j[-1] > 0.1]
        # Drop persons with too few joints
        if np.sum(pose[..., -1] > 0.1) < 5:
            drop.add(i)
            continue
        # Measure the extent on the coordinates only; including the score column
        # would let the spread of confidences decide whether a person is "too small"
        positions = np.array(valid_joints)[:, :3]
        mins = np.min(positions, axis=0)
        maxs = np.max(positions, axis=0)
        diff = maxs - mins
        # Drop too large or too small persons
        if any(((d > 2.3) for d in diff)):
            drop.add(i)
            continue
        if all(((d < 0.3) for d in diff)):
            drop.add(i)
            continue
        if (
            (diff[0] < 0.2 and diff[1] < 0.2)
            or (diff[1] < 0.2 and diff[2] < 0.2)
            or (diff[2] < 0.2 and diff[0] < 0.2)
        ):
            drop.add(i)
            continue
        # Drop persons outside room
        mean = np.mean(positions, axis=0)
        rsize = [r / 2 for r in roomparams["room_size"]]
        rcent = roomparams["room_center"]
        if any(
            (
                # Center of mass outside room
                mean[j] > rsize[j] + rcent[j] or mean[j] < -rsize[j] + rcent[j]
                for j in range(3)
            )
        ) or any(
            (
                # One limb more than 10cm outside room
                maxs[j] > rsize[j] + rcent[j] + 0.1
                or mins[j] < -rsize[j] + rcent[j] - 0.1
                for j in range(3)
            )
        ):
            drop.add(i)
            continue
        if drop_few_limbs:
            # Drop persons with less than 3 limbs
            found_limbs = 0
            for limb in main_limbs:
                start_idx = joint_names.index(limb[0])
                end_idx = joint_names.index(limb[1])
                if pose[start_idx, -1] > 0.1 and pose[end_idx, -1] > 0.1:
                    found_limbs += 1
            if found_limbs < 3:
                drop.add(i)
                continue
        # Drop persons with too small or high average limb length
        total_length = 0
        total_limbs = 0
        for limb in main_limbs:
            start_idx = joint_names.index(limb[0])
            end_idx = joint_names.index(limb[1])
            if pose[start_idx, -1] < 0.1 or pose[end_idx, -1] < 0.1:
                continue
            limb_length = np.linalg.norm(pose[end_idx, :3] - pose[start_idx, :3])
            total_length += limb_length
            total_limbs += 1
        if total_limbs == 0:
            drop.add(i)
            continue
        average_length = total_length / total_limbs
        if average_length < 0.1:
            drop.add(i)
            continue
        if total_limbs > 4 and average_length > 0.5:
            drop.add(i)
            continue
    new_poses3D = []
    new_poses2D = [[] for _ in range(len(poses2D))]
    for i in range(len(poses3D)):
        if len(poses3D[i]) != len(joint_names):
            # Sometimes some joints of a poor detection are missing
            continue
        if i not in drop:
            new_poses3D.append(poses3D[i])
            for j in range(len(poses2D)):
                new_poses2D[j].append(poses2D[j][i])
        else:
            # Keep the rejected pose, but with a score that marks it as invalid
            new_pose = np.array(poses3D[i])
            new_pose[..., -1] = 0.001
            new_poses3D.append(new_pose)
            for j in range(len(poses2D)):
                new_pose = np.array(poses2D[j][i])
                new_pose[..., -1] = 0.001
                new_poses2D[j].append(new_pose)
    new_poses3D = np.array(new_poses3D)
    new_poses2D = np.array(new_poses2D)
    if new_poses3D.size == 0:
        new_poses3D = np.zeros([1, len(joint_names), 4])
        new_poses2D = np.zeros([len(poses2D), 1, len(joint_names), 3])
    return new_poses3D, new_poses2D
 # ==================================================================================================
 def update_keypoints(poses_2d: list, joint_names: List[str]) -> list:
    new_views = []
    for view in poses_2d:
@ -409,10 +295,11 @@ def main():
        if not os.path.isdir(dirpath):
            continue
-        if (dirname[0] not in ["p", "h"]) or len(dirname) != 2:
+        if (dirname[0] not in ["p", "h", "e"]) or len(dirname) != 2:
            continue
        # Load sample infos
        print("\n" + dirpath)
        with open(os.path.join(dirpath, "sample.json"), "r", encoding="utf-8") as file:
            sample = json.load(file)
        sample = update_sample(sample, dirpath)
@ -431,8 +318,11 @@ def main():
            images_2d.append(img)
        # Get 2D poses
        stime = time.time()
        poses_2d = utils_2d_pose.get_2d_pose(kpt_model, images_2d)
        poses_2d = update_keypoints(poses_2d, joint_names_2d)
        print("2D time:", time.time() - stime)
        # print([np.array(p).round(6).tolist() for p in poses_2d])
        fig1 = draw_utils.show_poses2d(
            poses_2d, np.array(images_2d), joint_names_2d, "2D detections"
@ -449,23 +339,27 @@ def main():
            poses3D = np.zeros([1, len(joint_names_3d), 4])
            poses2D = np.zeros([len(images_2d), 1, len(joint_names_3d), 3])
        else:
-            poses3D = triangulate_poses.get_3d_pose(
+            cameras = spt.convert_cameras(camparams)
-                poses_2d, camparams, roomparams, joint_names_2d
+            roomp = [roomparams["room_size"], roomparams["room_center"]]
            triangulator = spt.Triangulator(min_score=0.95)
            stime = time.time()
            poses_3d = triangulator.triangulate_poses(
                poses_2d, cameras, roomp, joint_names_2d
            )
            poses3D = np.array(poses_3d)
            if len(poses3D) == 0:
                poses3D = np.zeros([1, len(joint_names_3d), 4])
            print("3D time:", time.time() - stime)
            poses2D = []
            for cam in camparams:
                poses_2d, _ = utils_pose.project_poses(poses3D, cam)
                poses2D.append(poses_2d)
            poses3D, poses2D = filter_poses(
                poses3D,
                poses2D,
                roomparams,
                joint_names_3d,
            )
        print("\n" + dirpath)
        print(poses3D)
        # print(poses2D)
        # print(poses3D.round(3).tolist())
        fig2 = draw_utils.utils_view.show_poses3d(
            poses3D, joint_names_3d, roomparams, camparams
--- a/scripts/triangulate_poses.py
+++ b/scripts/triangulate_poses.py
@ -1,456 +0,0 @@
 import copy
 import math
 import cv2
 import numpy as np
 from skelda import utils_pose
 # ==================================================================================================
 # Joint names that get_3d_pose passes as `use_joints` when matching against previous poses
 # and when scoring person pairs; every name is looked up in the 2D joint name list.
 core_joints = [
    "shoulder_left",
    "shoulder_right",
    "hip_left",
    "hip_right",
    "elbow_left",
    "elbow_right",
    "knee_left",
    "knee_right",
    "wrist_left",
    "wrist_right",
    "ankle_left",
    "ankle_right",
 ]
 # ==================================================================================================
 def undistort_points(points: np.ndarray, caminfo: dict):
    """Removes lens distortion from 2D pixel coordinates

    The passed `caminfo` dictionary is updated in place: "K" is replaced by the optimal new
    camera matrix and "DC" by five zeros. The undistorted points keep the shape of `points`
    and are returned together with the updated dictionary.
    """
    intrinsics = np.asarray(caminfo["K"], dtype=np.float32)
    dist_coeffs = np.asarray(caminfo["DC"][0:5], dtype=np.float32)
    # Compute the camera matrix that belongs to the undistorted image
    image_size = (caminfo["width"], caminfo["height"])
    new_intrinsics, _ = cv2.getOptimalNewCameraMatrix(
        intrinsics, dist_coeffs, image_size, 1, image_size
    )
    caminfo["K"] = new_intrinsics
    caminfo["DC"] = np.array([0.0, 0.0, 0.0, 0.0, 0.0])
    # OpenCV expects the points as [N, 1, 2], the original layout is restored afterwards
    original_shape = points.shape
    undistorted = cv2.undistortPoints(
        np.reshape(points, (-1, 1, 2)), intrinsics, dist_coeffs, P=new_intrinsics
    )
    return undistorted.reshape(original_shape), caminfo
 # ==================================================================================================
 def get_camera_P(cam):
    """Calculate the opencv-style projection matrix P = K @ [R | R @ (-T)]"""
    rotation, offset, intrinsics = (np.asarray(cam[key]) for key in ("R", "T", "K"))
    # The last column of the extrinsic matrix is the negated offset rotated by R
    extrinsics = np.hstack([rotation, rotation @ (offset * -1)])
    return intrinsics @ extrinsics
 # ==================================================================================================
 def calc_pose_score(pose1, pose2, dist1, cam1, joint_names, use_joints):
    """Scores how well two 2D poses of the same view agree

    Only the joints listed in `use_joints` are compared. If fewer than three of them have a
    score above 0.1 in both poses the result is 0.0, otherwise it is the mean of the
    per-joint scores returned by score_projection.
    """
    # Restrict everything to the selected joints
    selected = [joint_names.index(name) for name in use_joints]
    pose1, pose2, dist1 = pose1[selected], pose2[selected], dist1[selected]
    visible = (pose1[:, 2] > 0.1) & (pose2[:, 2] > 0.1)
    if np.sum(visible) < 3:
        return 0.0
    image_scale = (cam1["width"] + cam1["height"]) / 2
    return np.mean(score_projection(pose1, pose2, dist1, visible, image_scale))
 # ==================================================================================================
 def calc_pair_score(pair, poses_2d, camparams, roomparams, joint_names_2d, use_joints):
    """Triangulates the selected joints of a person pair and returns the 3D pose with its score

    `pair[0]` holds (view1, view2, person1, person2), which index into `camparams` and
    `poses_2d`.
    """
    ids = pair[0]
    cam1 = camparams[ids[0]]
    cam2 = camparams[ids[1]]
    pose1 = poses_2d[ids[0]][ids[2]]
    pose2 = poses_2d[ids[1]][ids[3]]
    # Only the requested joints take part in the triangulation
    selected = [joint_names_2d.index(name) for name in use_joints]
    return triangulate_and_score(pose1[selected], pose2[selected], cam1, cam2, roomparams)
 # ==================================================================================================
 def score_projection(pose1, repro1, dists1, mask, iscale):
    """Converts the reprojection error of the masked joints into per-joint scores

    The pixel error between `pose1` and `repro1` is clipped to a quarter of `iscale`,
    divided by `iscale`, weighted by the square root of the mean camera distance over 3.5
    and finally mapped to a score of 1 / (1 + 10 * error).
    """
    low_confidence = 0.1
    pixel_error = np.linalg.norm(pose1[mask, 0:2] - repro1[mask, 0:2], axis=1)
    # Reprojections with a low score count as invisible and receive the maximum penalty
    hidden = (repro1[:, 2] < low_confidence)[mask]
    pixel_error[hidden] = iscale
    # Normalize by image size, then weight by the distance to the camera
    relative_error = pixel_error.clip(0, iscale / 4) / iscale
    relative_error = relative_error * np.sqrt(np.mean(dists1[mask]) / 3.5)
    return 1.0 / (1.0 + relative_error * 10)
 # ==================================================================================================
 def triangulate_and_score(pose1, pose2, cam1, cam2, roomparams):
    """Triangulates a pair of persons and scores them based on the reprojection error

    Args:
        pose1: 2D pose in the first view, one row of (x, y, score) per joint.
        pose2: 2D pose in the second view, same joint order as `pose1`.
        cam1: Camera dictionary of the first view, needs "P", "width" and "height".
        cam2: Camera dictionary of the second view, needs "P", "width" and "height".
        roomparams: Dictionary with "room_size" and "room_center".

    Returns:
        Tuple (pose3d, score). `pose3d` has one row of (x, y, z, score) per joint, joints
        that are not visible in both views stay zero. With fewer than three commonly
        visible joints the pose is all zeros and the score 0.0, for poses outside of the
        room all joint scores and the score are 0.001.
    """
    # Mask out invisible joints
    min_score = 0.1
    mask1a = pose1[:, 2] >= min_score
    mask2a = pose2[:, 2] >= min_score
    mask = mask1a & mask2a
    # If too few joints are visible return a low score
    if np.sum(mask) < 3:
        pose3d = np.zeros([len(pose1), 4])
        score = 0.0
        return pose3d, score
    # Triangulate points
    points1 = pose1[mask, 0:2].T
    points2 = pose2[mask, 0:2].T
    points3d = cv2.triangulatePoints(cam1["P"], cam2["P"], points1, points2)
    points3d = (points3d / points3d[3, :])[0:3, :].T
    pose3d = np.zeros([len(pose1), 4])
    pose3d[mask] = np.concatenate([points3d, np.ones([points3d.shape[0], 1])], axis=-1)
    # If the triangulated points are outside the room drop it
    mean = np.mean(pose3d[mask][:, 0:3], axis=0)
    mins = np.min(pose3d[mask][:, 0:3], axis=0)
    maxs = np.max(pose3d[mask][:, 0:3], axis=0)
    rsize = np.array(roomparams["room_size"]) / 2
    rcent = np.array(roomparams["room_center"])
    wdist = 0.1
    center_outside = np.any((mean > rsize + rcent) | (mean < -rsize + rcent))
    limb_outside = np.any(
        (maxs > rsize + rcent + wdist) | (mins < -rsize + rcent - wdist)
    )
    if center_outside or limb_outside:
        pose3d[:, 3] = 0.001
        score = 0.001
        return pose3d, score
    # Calculate reprojection error
    poses_3d = np.expand_dims(pose3d, axis=0)
    repro1, dists1 = utils_pose.project_poses(poses_3d, cam1, calc_dists=True)
    repro2, dists2 = utils_pose.project_poses(poses_3d, cam2, calc_dists=True)
    repro1, dists1 = repro1[0], dists1[0]
    repro2, dists2 = repro2[0], dists2[0]
    # Calculate scores for each view, normalizing each error by the size of its own image
    # (previously the second view was normalized with the image size of the first camera)
    iscale1 = (cam1["width"] + cam1["height"]) / 2
    iscale2 = (cam2["width"] + cam2["height"]) / 2
    score1 = score_projection(pose1, repro1, dists1, mask, iscale1)
    score2 = score_projection(pose2, repro2, dists2, mask, iscale2)
    # Combine scores
    scores = (score1 + score2) / 2
    # Drop lowest scores, but always keep at least one of them: `scores` only covers the
    # commonly visible joints, so 20% of all joints can be more than its length, which
    # would result in the mean of an empty array (NaN)
    drop_k = min(math.floor(len(pose1) * 0.2), len(scores) - 1)
    score = np.mean(np.sort(scores, axis=-1)[drop_k:])
    # Add score to 3D pose
    full_scores = np.zeros([poses_3d.shape[1], 1])
    full_scores[mask] = np.expand_dims(scores, axis=-1)
    pose3d[:, 3] = full_scores[:, 0]
    return pose3d, score
 # ==================================================================================================
 def calc_grouping(all_pairs, min_score: float):
    """Clusters triangulated pairs that describe the same person

    Every entry of `all_pairs` is replaced in place by a copy that has the pose center
    appended as element 3. Returns a list of groups, each one a list of
    [mean center, mean pose, list of member pairs].
    """
    max_center_dist = 0.6
    max_joint_avg_dist = 0.3
    # Append the center of the confident joints to every pair
    for idx, entry in enumerate(all_pairs):
        candidate = entry[2][0]
        confident = candidate[:, 3] > min_score
        all_pairs[idx] = entry + [np.mean(candidate[confident, 0:3], axis=0)]
    groups = []
    for entry in all_pairs:
        entry_center = entry[3]
        entry_pose = entry[2][0]
        # Search the closest group among those with a nearby center
        closest = -1
        closest_dist = math.inf
        for gid, (group_center, group_pose, _) in enumerate(groups):
            if not np.linalg.norm(group_center - entry_center) < max_center_dist:
                continue
            # Average distance over the joints that are confident in both poses
            shared = (group_pose[:, 3] > min_score) & (entry_pose[:, 3] > min_score)
            joint_dists = np.linalg.norm(
                group_pose[shared, 0:3] - entry_pose[shared, 0:3], axis=1
            )
            avg_dist = np.mean(joint_dists)
            if avg_dist < max_joint_avg_dist and avg_dist < closest_dist:
                closest_dist = avg_dist
                closest = gid
        if closest < 0:
            # No group exists yet or none matched, so the pair starts a new one
            groups.append([entry_center, entry_pose, [entry]])
            continue
        # Join the matching group and update its running means
        group = groups[closest]
        members = len(group[2])
        updated_center = (group[0] * members + entry_center) / (members + 1)
        updated_pose = (group[1] * members + entry_pose) / (members + 1)
        group[2].append(entry)
        group[0] = updated_center
        group[1] = updated_pose
    return groups
 # ==================================================================================================
 def merge_group(poses_3d: np.ndarray, min_score: float):
    """Fuses all pose proposals of one group into a single pose

    `poses_3d` is indexed as [proposal, joint, (x, y, z, score)]. The result has one row of
    (x, y, z, score) per joint, joints without any usable proposal are all zeros.
    """
    def masked_mean(selection):
        """Average over the proposals, counting only the selected entries"""
        totals = np.sum(poses_3d * selection, axis=0)
        counts = np.sum(selection, axis=0)
        return np.divide(totals, counts, where=(counts > 0), out=np.zeros_like(totals))
    joint_scores = poses_3d[:, :, 3:4]
    # A first estimate is built from the high scoring triangulations only
    reference = masked_mean(joint_scores > min_score)
    # Joints that are missing in the estimate are placed at the center of the found joints
    found = reference[:, 3] > 0.0
    found_sum = np.sum(reference[found, 0:3], axis=0)
    found_count = np.sum(found)
    reference[~found, 0:3] = np.divide(
        found_sum, found_count, where=(found_count > 0), out=np.zeros_like(found_sum)
    )
    # For the final pose the score threshold is slightly relaxed
    offset = 0.1
    keep = joint_scores > (min_score - offset)
    # Proposals far away from the first estimate are treated as outliers
    max_dist = 1.2
    distances = np.linalg.norm(
        poses_3d[:, :, :3] - reference[np.newaxis, :, :3], axis=2
    )
    keep = keep & np.expand_dims(distances <= max_dist, axis=-1)
    # Per joint, only the best-k remaining proposals closest to the estimate are used
    keep_best = 3
    ranking = np.argsort(distances, axis=0)
    closest = np.zeros_like(keep, dtype=bool)
    for joint in range(poses_3d.shape[1]):
        order = ranking[:, joint]
        usable = order[keep[order, joint, 0]]
        closest[usable[:keep_best], joint, 0] = True
    return masked_mean(keep & closest)
 # ==================================================================================================
 def get_3d_pose(
    poses_2d,
    camparams,
    roomparams,
    joint_names_2d,
    last_poses_3d=np.array([]),
    min_score=0.95,
 ):
    """Triangulates 3D poses from 2D poses of multiple views

    Args:
        poses_2d: List with one entry per view, each indexed as
            [person, joint, (x, y, score)]. The list is modified in place: its entries are
            replaced by the undistorted and masked arrays.
        camparams: List of camera dictionaries with "K", "R", "T", "DC", "width" and
            "height". A deep copy is used internally, the input is left untouched.
        roomparams: Dictionary with "room_size" and "room_center".
        joint_names_2d: Names of the joints in `poses_2d`, must contain all `core_joints`.
        last_poses_3d: Optional 3D poses of the previous frame. If not empty, persons that
            match one of them are only paired with persons matching the same old pose.
        min_score: Pairs need a score above this value to be kept; it is also passed on
            to the grouping and merging steps.

    Returns:
        Array with one merged pose per group, indexed as [person, joint, (x, y, z, score)].
        If no group was found an array of zeros with shape [1, len(joint_names_2d), 4].
    """
    # Convert poses and camparams to numpy arrays
    camparams = copy.deepcopy(camparams)
    for i in range(len(camparams)):
        poses_2d[i] = np.asarray(poses_2d[i])
        camparams[i]["K"] = np.array(camparams[i]["K"])
        camparams[i]["R"] = np.array(camparams[i]["R"])
        camparams[i]["T"] = np.array(camparams[i]["T"])
        camparams[i]["DC"] = np.array(camparams[i]["DC"])
    # Undistort 2D points
    for i in range(len(camparams)):
        poses = poses_2d[i]
        cam = camparams[i]
        # This also replaces K and DC of the (copied) camera with the undistorted parameters
        poses[:, :, 0:2], cam = undistort_points(poses[:, :, 0:2], cam)
        # Mask out points that are far outside the image (points slightly outside are still valid)
        offset = (cam["width"] + cam["height"]) / 40
        mask = (
            (poses[:, :, 0] >= 0 - offset)
            & (poses[:, :, 0] < cam["width"] + offset)
            & (poses[:, :, 1] >= 0 - offset)
            & (poses[:, :, 1] < cam["height"] + offset)
        )
        # Masked joints are zeroed completely, including their score
        poses = poses * np.expand_dims(mask, axis=-1)
        poses_2d[i] = poses
        # Calc projection matrix with updated camera parameters
        cam["P"] = get_camera_P(cam)
        camparams[i] = cam
    # Project last 3D poses to 2D
    last_poses_2d = []
    last_poses_3d = np.asarray(last_poses_3d)
    if last_poses_3d.size > 0:
        for i in range(len(camparams)):
            poses2d, dists = utils_pose.project_poses(last_poses_3d, camparams[i])
            last_poses_2d.append((poses2d, dists))
    # Check matches to old poses
    # scored_pasts[view][old_pose] lists the persons of that view that match the old pose
    threshold = min_score - 0.2
    scored_pasts = {}
    if last_poses_3d.size > 0:
        for i in range(len(camparams)):
            scored_pasts[i] = {}
            poses = poses_2d[i]
            last_poses, dists = last_poses_2d[i]
            for j in range(len(last_poses)):
                scored_pasts[i][j] = []
                for k in range(len(poses)):
                    score = calc_pose_score(
                        poses[k],
                        last_poses[j],
                        dists[j],
                        camparams[i],
                        joint_names_2d,
                        core_joints,
                    )
                    if score > threshold:
                        scored_pasts[i][j].append(k)
    # Create pairs of persons
    # Checks if the person was already matched to the last frame and if so only creates pairs with those
    # Else it creates all possible pairs
    # Each pair is a list [(view1, view2, person1, person2), (pid1, pid2)], where the pids
    # are the person indices counted over all views
    num_persons = [len(p) for p in poses_2d]
    all_pairs = []
    for i in range(len(camparams)):
        poses = poses_2d[i]
        for j in range(i + 1, len(poses_2d)):
            poses2 = poses_2d[j]
            for k in range(len(poses)):
                for l in range(len(poses2)):
                    pid1 = sum(num_persons[:i]) + k
                    pid2 = sum(num_persons[:j]) + l
                    match = False
                    if last_poses_3d.size > 0:
                        # NOTE(review): if both persons match more than one old pose, the
                        # pair seems to be appended once per old pose - confirm if intended
                        for m in range(len(last_poses_3d)):
                            if k in scored_pasts[i][m] and l in scored_pasts[j][m]:
                                match = True
                                all_pairs.append([(i, j, k, l), (pid1, pid2)])
                            elif k in scored_pasts[i][m] or l in scored_pasts[j][m]:
                                # Only one of them matches this old pose, so the pair is skipped
                                match = True
                    if not match:
                        all_pairs.append([(i, j, k, l), (pid1, pid2)])
    # Calculate pair scores
    # The (pose_3d, score) tuple of the core joints becomes element 2 of each pair
    for i in range(len(all_pairs)):
        pair = all_pairs[i]
        pose_3d, score = calc_pair_score(
            pair, poses_2d, camparams, roomparams, joint_names_2d, core_joints
        )
        all_pairs[i].append((pose_3d, score))
        # import draw_utils
        # poses3D = np.array([pose_3d])
        # _ = draw_utils.utils_view.show_poses3d(
        #     poses3D, core_joints, {}, camparams
        # )
        # draw_utils.utils_view.show_plots()
    # Drop pairs with low scores
    all_pairs = [p for p in all_pairs if p[2][1] > min_score]
    # Group pairs that share a person
    # calc_grouping replaces the entries of all_pairs by copies with the center as element 3,
    # the groups reference those same pair lists
    groups = calc_grouping(all_pairs, min_score)
    # Calculate full 3D poses
    # This time all joints are triangulated, the result is appended as element 4 of each pair
    poses_3d = []
    for pair in all_pairs:
        cam1 = camparams[pair[0][0]]
        cam2 = camparams[pair[0][1]]
        pose1 = poses_2d[pair[0][0]][pair[0][2]]
        pose2 = poses_2d[pair[0][1]][pair[0][3]]
        pose_3d, _ = triangulate_and_score(pose1, pose2, cam1, cam2, roomparams)
        pair.append(pose_3d)
    # Merge groups
    poses_3d = []
    for group in groups:
        poses = np.array([p[4] for p in group[2]])
        pose_3d = merge_group(poses, min_score)
        poses_3d.append(pose_3d)
    # Fall back to a single all-zero pose if nothing was found
    if len(poses_3d) > 0:
        poses3D = np.array(poses_3d)
    else:
        poses3D = np.zeros([1, len(joint_names_2d), 4])
    return poses3D
--- a/spt/camera.cpp
+++ b/spt/camera.cpp
@ -0,0 +1,75 @@
 #include <iomanip>
 #include <sstream>
 #include "camera.hpp"
 // =================================================================================================
 // =================================================================================================
 // Formats a fixed-size M x N float matrix as nested lists, for example "[[1, 2], [3, 4]]".
 // The values are written to a fresh stream, so they use its default number formatting.
 template <size_t M, size_t N>
 static const std::string print_matrix(const std::array<std::array<float, N>, M> &matrix)
 {
    std::ostringstream text;
    text << "[";
    for (size_t row = 0; row < M; ++row)
    {
        // Separators are written in front of every element except the first one
        text << (row == 0 ? "" : ", ") << "[";
        for (size_t col = 0; col < N; ++col)
        {
            text << (col == 0 ? "" : ", ") << matrix[row][col];
        }
        text << "]";
    }
    text << "]";
    return text.str();
 }
 // =================================================================================================
 // =================================================================================================
 // Returns the camera as a python-dict-like string with all of its fields.
 // String fields are wrapped in single quotes, the camera type was missing them before.
 // NOTE(review): print_matrix writes to its own stream, so the fixed notation with six
 // decimals set up here only applies to the DC values, not to K, R, T and P.
 std::string Camera::to_string() const
 {
    std::ostringstream out;
    out << std::fixed << std::setprecision(6);
    out << "{";
    out << "'name': '" << name << "', ";
    out << "'K': " << print_matrix(K) << ", ";
    out << "'DC': [";
    for (size_t i = 0; i < DC.size(); ++i)
    {
        if (i > 0)
        {
            out << ", ";
        }
        out << DC[i];
    }
    out << "], ";
    out << "'R': " << print_matrix(R) << ", ";
    out << "'T': " << print_matrix(T) << ", ";
    out << "'P': " << print_matrix(P) << ", ";
    out << "'width': " << width << ", ";
    out << "'height': " << height << ", ";
    out << "'type': '" << type << "'";
    out << "}";
    return out.str();
 }
 // =================================================================================================
 // Streams the same text that Camera::to_string() returns.
 std::ostream &operator<<(std::ostream &out, const Camera &cam)
 {
    return out << cam.to_string();
 }
--- a/spt/camera.hpp
+++ b/spt/camera.hpp
@ -0,0 +1,24 @@
 #pragma once
 #include <array>
 #include <iostream>
 #include <string>
 #include <vector>
 // =================================================================================================
 // Parameters of a single camera, filled from the python side by convert_cameras().
 // All numeric members are zero-initialized, so that a default constructed camera
 // never contains indeterminate values.
 struct Camera
 {
    std::string name;
    // 3x3 camera matrix
    std::array<std::array<float, 3>, 3> K = {};
    // Distortion coefficients
    std::vector<float> DC;
    // 3x3 rotation matrix
    std::array<std::array<float, 3>, 3> R = {};
    // 3x1 translation
    std::array<std::array<float, 1>, 3> T = {};
    // NOTE(review): declared as 4 rows with 3 values each, while the other matrices are
    // declared as rows x columns and a projection matrix usually is 3x4 - confirm the layout
    std::array<std::array<float, 3>, 4> P = {};
    // Image size in pixels
    int width = 0;
    int height = 0;
    std::string type;
    friend std::ostream &operator<<(std::ostream &out, Camera const &camera);
    std::string to_string() const;
 };
--- a/spt/interface.cpp
+++ b/spt/interface.cpp
@ -0,0 +1,35 @@
 #include "triangulator.hpp"
 #include "interface.hpp"
 // =================================================================================================
 // =================================================================================================
 // Creates the internal implementation that all public methods forward to.
 // NOTE(review): no matching delete is visible for this allocation - confirm the ownership.
 Triangulator::Triangulator(float min_score, size_t min_group_size)
    : triangulator(new TriangulatorInternal(min_score, min_group_size))
 {
 }
 // =================================================================================================
 std::vector<std::vector<std::array<float, 4>>> Triangulator::triangulate_poses(
    const std::vector<std::vector<std::vector<std::array<float, 3>>>> &poses_2d,
    const std::vector<Camera> &cameras,
    const std::array<std::array<float, 3>, 2> &roomparams,
    const std::vector<std::string> &joint_names)
 {
    return this->triangulator->triangulate_poses(poses_2d, cameras, roomparams, joint_names);
 }
 // =================================================================================================
 void Triangulator::reset()
 {
    this->triangulator->reset();
 }
 // =================================================================================================
 void Triangulator::print_stats()
 {
    this->triangulator->print_stats();
 }
--- a/spt/interface.hpp
+++ b/spt/interface.hpp
@ -0,0 +1,54 @@
 #pragma once
 #include <string>
 #include <vector>
 #include "camera.hpp"
 // =================================================================================================
 // Forward declaration of the class, so that SWIG does not try to parse all of its dependencies.
 class TriangulatorInternal;
 // =================================================================================================
 // Public interface that is wrapped by SWIG. It only holds a pointer to the internal
 // implementation, which is created in the constructor.
 // NOTE(review): no destructor or copy handling is declared here, so the internal object
 // is presumably never released and copies would share the same pointer - confirm.
 class Triangulator
 {
 public:
    /**
     * Triangulator to predict poses from multiple views.
     *
     *
     * @param min_score Minimum score to consider a triangulated joint as valid.
     * @param min_group_size Minimum number of camera pairs that need to see a person.
     */
    Triangulator(
        float min_score = 0.95,
        size_t min_group_size = 1);
    /**
     * Calculate a triangulation.
     *
     *
     * @param poses_2d List of shape [views, persons, joints, 3], containing the 2D poses.
     * @param cameras List of cameras.
     * @param roomparams Room parameters (room size, room center).
     * @param joint_names List of 2D joint names.
     *
     * @return List of shape [persons, joints, 4], containing the 3D poses.
     */
    std::vector<std::vector<std::array<float, 4>>> triangulate_poses(
        const std::vector<std::vector<std::vector<std::array<float, 3>>>> &poses_2d,
        const std::vector<Camera> &cameras,
        const std::array<std::array<float, 3>, 2> &roomparams,
        const std::vector<std::string> &joint_names);
    /** Reset the triangulator. */
    void reset();
    /** Print triangulation statistics. */
    void print_stats();
 private:
    // Internal implementation, allocated in the constructor
    TriangulatorInternal *triangulator;
 };
--- a/spt/triangulator.cpp
+++ b/spt/triangulator.cpp
--- a/spt/triangulator.hpp
+++ b/spt/triangulator.hpp
@ -0,0 +1,133 @@
 #pragma once
 #include <array>
 #include <iostream>
 #include <string>
 #include <vector>
 #include <opencv2/opencv.hpp>
 #include "camera.hpp"
 // =================================================================================================
 // Camera representation for internal use, built from the public Camera struct.
 // It keeps a copy of the camera next to OpenCV matrices for its parameters.
 class CameraInternal
 {
 public:
    // NOTE(review): not marked explicit, so a Camera converts implicitly - confirm if intended
    CameraInternal(const Camera &cam);
    // The public camera description
    Camera cam;
    // NOTE(review): presumably the same-named fields of `cam` as cv::Mat - confirm in triangulator.cpp
    cv::Mat K;
    cv::Mat DC;
    cv::Mat R;
    cv::Mat T;
    cv::Mat P;
    // NOTE(review): presumably recalculates P from the other matrices - confirm in triangulator.cpp
    void update_projection_matrix();
 };
 // =================================================================================================
 // Implementation behind the public Triangulator interface. The public methods have the
 // same signatures as their counterparts in interface.hpp, which forward to them.
 class TriangulatorInternal
 {
 public:
    TriangulatorInternal(float min_score, size_t min_group_size);
    // See Triangulator::triangulate_poses for the meaning of the parameters
    std::vector<std::vector<std::array<float, 4>>> triangulate_poses(
        const std::vector<std::vector<std::vector<std::array<float, 3>>>> &poses_2d,
        const std::vector<Camera> &cameras,
        const std::array<std::array<float, 3>, 2> &roomparams,
        const std::vector<std::string> &joint_names);
    void reset();
    void print_stats();
 private:
    float min_score;
    // NOTE(review): stored as float, while the constructor receives it as size_t - confirm
    float min_group_size;
    // Names of the joints that are treated as the core of a pose
    const std::vector<std::string> core_joints = {
        "shoulder_left",
        "shoulder_right",
        "hip_left",
        "hip_right",
        "elbow_left",
        "elbow_right",
        "knee_left",
        "knee_right",
        "wrist_left",
        "wrist_right",
        "ankle_left",
        "ankle_right",
    };
    // Pairs of core joints that form a limb
    const std::vector<std::pair<std::string, std::string>> core_limbs = {
        {"knee_left", "ankle_left"},
        {"hip_left", "knee_left"},
        {"hip_right", "knee_right"},
        {"knee_right", "ankle_right"},
        {"elbow_left", "wrist_left"},
        {"elbow_right", "wrist_right"},
        {"shoulder_left", "elbow_left"},
        {"shoulder_right", "elbow_right"},
    };
    // NOTE(review): presumably the result of the previous call, cleared by reset() - confirm
    std::vector<cv::Mat> last_poses_3d;
    // Helper steps of the triangulation, their definitions are in triangulator.cpp
    void undistort_poses(std::vector<cv::Mat> &poses, CameraInternal &icam);
    std::tuple<std::vector<cv::Mat>, std::vector<cv::Mat>> project_poses(
        const std::vector<cv::Mat> &bodies3D, const CameraInternal &icam, bool calc_dists);
    float calc_pose_score(
        const cv::Mat &pose1,
        const cv::Mat &pose2,
        const cv::Mat &dist1,
        const CameraInternal &icam);
    cv::Mat score_projection(
        const cv::Mat &pose1,
        const cv::Mat &repro1,
        const cv::Mat &dists1,
        const cv::Mat &mask,
        float iscale);
    std::pair<cv::Mat, float> triangulate_and_score(
        const cv::Mat &pose1,
        const cv::Mat &pose2,
        const CameraInternal &cam1,
        const CameraInternal &cam2,
        const std::array<std::array<float, 3>, 2> &roomparams,
        const std::vector<std::array<size_t, 2>> &core_limbs_idx);
    std::vector<std::tuple<cv::Point3f, cv::Mat, std::vector<int>>> calc_grouping(
        const std::vector<std::pair<std::tuple<int, int, int, int>, std::pair<int, int>>> &all_pairs,
        const std::vector<std::pair<cv::Mat, float>> &all_scored_poses,
        float min_score);
    cv::Mat merge_group(const std::vector<cv::Mat> &poses_3d, float min_score);
    void add_extra_joints(std::vector<cv::Mat> &poses, const std::vector<std::string> &joint_names);
    void filter_poses(
        std::vector<cv::Mat> &poses,
        const std::array<std::array<float, 3>, 2> &roomparams,
        const std::vector<size_t> &core_joint_idx,
        const std::vector<std::array<size_t, 2>> &core_limbs_idx);
    void add_missing_joints(
        std::vector<cv::Mat> &poses, const std::vector<std::string> &joint_names);
    // Statistics
    // NOTE(review): presumably the call count and the time spent per step, as reported by
    // print_stats() - confirm in triangulator.cpp
    float num_calls = 0;
    float total_time = 0;
    float init_time = 0;
    float undistort_time = 0;
    float project_time = 0;
    float match_time = 0;
    float pairs_time = 0;
    float pair_scoring_time = 0;
    float grouping_time = 0;
    float full_time = 0;
    float merge_time = 0;
    float post_time = 0;
    float convert_time = 0;
 };
--- a/swig/Makefile
+++ b/swig/Makefile
@ -0,0 +1,13 @@
 # Standard compile options for the C++ executable
 FLAGS = -fPIC -O3 -march=native -Wall -Werror -flto -fopenmp -fopenmp-simd
 # The Python interface through SWIG
 PYTHONI = -I/usr/include/python3.8/
 PYTHONL = -Xlinker -export-dynamic
 # The target does not create a file named "all", so it always has to be rebuilt
 .PHONY: all
 # Default super-target
 # Every recipe line runs in its own shell, starting in this directory again. The first
 # line therefore must not end with another "cd", which would hide a failed compilation
 # and let the following steps continue with outdated object files.
 all:
 	cd ../spt/ && g++ $(FLAGS) -std=c++2a -I/usr/include/opencv4 -c *.cpp
 	swig -c++ -python -keyword -o spt_wrap.cxx spt.i
 	g++ $(FLAGS) $(PYTHONI) -c spt_wrap.cxx -o spt_wrap.o
 	g++ $(FLAGS) $(PYTHONL) -shared ../spt/*.o spt_wrap.o -lopencv_core -lopencv_imgproc -lopencv_calib3d -o _spt.so
--- a/swig/spt.i
+++ b/swig/spt.i
@ -0,0 +1,70 @@
 %module spt
 %{
    // Includes the header in the wrapper code
    #include "../spt/camera.hpp"
    #include "../spt/interface.hpp"
 %}
 // Some modules need extra imports beside the main .hpp file
 %include "std_array.i"
 %include "std_string.i"
 %include "std_vector.i"
 // Instantiate the templates used in the wrapped headers
 // If the template is too nested (>2), parts of it need to be declared as well
 // The names follow the pattern rows x columns, with the inner type being one row
 namespace std {
    %template(FloatMatrix_3x3) array<array<float, 3>, 3>;
    %template(VectorFloat) vector<float>;
    %template(FloatMatrix_3x1) array<array<float, 1>, 3>;
    // NOTE(review): this matches the declaration of Camera::P, but other than its name
    // suggests it has 4 rows with 3 values each - confirm
    %template(FloatMatrix_3x4) array<array<float, 3>, 4>;
    %template(Matrix_Jx4) vector<array<float, 4>>;
    %template(Matrix_NxJx4) vector<vector<array<float, 4>>>;
    %template(Matrix_Jx3) vector<array<float, 3>>;
    %template(Matrix_VxNxJx3) vector<vector<vector<array<float, 3>>>>;
    %template(VectorCamera) vector<Camera>;
    %template(FloatMatrix_2x3) array<array<float, 3>, 2>;
    %template(VectorString) vector<std::string>;
 }
 // Convert vector to native (python) list
 // NOTE(review): Camera::P is not listed here - confirm if that is intended
 %naturalvar Camera::K;
 %naturalvar Camera::DC;
 %naturalvar Camera::R;
 %naturalvar Camera::T;
 // Improve printing of result objects
 %extend Camera {
    std::string __str__() const {
         return $self->to_string();
    }
 }
 // Ignore: Warning 503: Can't wrap 'operator <<' unless renamed to a valid identifier.
 %warnfilter(503) Camera;
 // Ignore: Warning 511: Can't use keyword arguments with overloaded functions.
 // The warning is caused by enabling keyword arguments, which doesn't work for vectors.
 #pragma SWIG nowarn=511
 // Parse the header file to generate wrappers
 %include "../spt/camera.hpp"
 %include "../spt/interface.hpp"
 // Add additional Python code to the module
 %pythoncode %{
 def convert_cameras(cameras):
    """Create a list of C++ cameras from a list of camera dictionaries.

    Each dictionary needs the keys "name", "K", "DC", "R", "T", "width" and "height".
    The key "type" is optional and defaults to "pinhole".
    """
    def to_native(params):
        """Copy the values of a single dictionary into a new Camera object."""
        native = Camera()
        native.name = params["name"]
        native.K = params["K"]
        native.DC = params["DC"]
        native.R = params["R"]
        native.T = params["T"]
        native.width = params["width"]
        native.height = params["height"]
        native.type = params.get("type", "pinhole")
        return native
    return [to_native(params) for params in cameras]
 %}
--- a/tests/poses_e1.json
+++ b/tests/poses_e1.json
--- a/tests/poses_h1.json
+++ b/tests/poses_h1.json
@ -0,0 +1,544 @@
 {
    "2D": [
        [
            [
                [
                    445.214,
                    373.348,
                    0.805
                ],
                [
                    446.448,
                    367.181,
                    0.834
                ],
                [
                    446.859,
                    370.881,
                    0.447
                ],
                [
                    456.726,
                    365.947,
                    0.974
                ],
                [
                    484.272,
                    374.17,
                    0.745
                ],
                [
                    445.625,
                    385.271,
                    0.611
                ],
                [
                    505.24,
                    409.528,
                    0.761
                ],
                [
                    393.411,
                    385.682,
                    0.486
                ],
                [
                    484.683,
                    447.352,
                    0.477
                ],
                [
                    369.976,
                    385.271,
                    0.672
                ],
                [
                    452.203,
                    456.808,
                    0.292
                ],
                [
                    442.336,
                    503.677,
                    0.504
                ],
                [
                    478.927,
                    502.444,
                    0.505
                ],
                [
                    414.79,
                    508.2,
                    0.462
                ],
                [
                    428.769,
                    476.131,
                    0.332
                ],
                [
                    423.835,
                    576.037,
                    0.689
                ],
                [
                    379.433,
                    497.099,
                    0.485
                ],
                [
                    460.632,
                    503.061,
                    0.504
                ],
                [
                    475.433,
                    397.399,
                    0.611
                ],
                [
                    470.499,
                    370.059,
                    0.745
                ]
            ]
        ],
        [
            [
                [
                    502.664,
                    372.786,
                    0.81
                ],
                [
                    503.643,
                    363.001,
                    0.894
                ],
                [
                    492.39,
                    368.383,
                    0.862
                ],
                [
                    508.535,
                    351.26,
                    0.85
                ],
                [
                    479.181,
                    367.405,
                    0.837
                ],
                [
                    536.422,
                    367.894,
                    0.721
                ],
                [
                    476.245,
                    392.356,
                    0.785
                ],
                [
                    584.367,
                    370.829,
                    0.867
                ],
                [
                    464.993,
                    441.279,
                    0.717
                ],
                [
                    560.883,
                    385.017,
                    0.72
                ],
                [
                    470.864,
                    392.356,
                    0.687
                ],
                [
                    542.292,
                    469.166,
                    0.674
                ],
                [
                    503.153,
                    467.698,
                    0.639
                ],
                [
                    502.664,
                    506.837,
                    0.765
                ],
                [
                    458.633,
                    454.489,
                    0.798
                ],
                [
                    471.842,
                    589.518,
                    0.813
                ],
                [
                    530.551,
                    499.988,
                    0.71
                ],
                [
                    522.723,
                    468.432,
                    0.639
                ],
                [
                    506.333,
                    380.125,
                    0.721
                ],
                [
                    493.858,
                    359.332,
                    0.837
                ]
            ]
        ],
        [
            [
                [
                    635.959,
                    325.896,
                    0.26
                ],
                [
                    603.03,
                    315.205,
                    0.37
                ],
                [
                    647.506,
                    325.896,
                    0.366
                ],
                [
                    611.155,
                    316.488,
                    0.826
                ],
                [
                    641.519,
                    327.607,
                    0.878
                ],
                [
                    577.37,
                    334.877,
                    0.652
                ],
                [
                    652.638,
                    364.385,
                    0.766
                ],
                [
                    532.466,
                    334.877,
                    0.77
                ],
                [
                    650.5,
                    405.44,
                    0.57
                ],
                [
                    569.672,
                    337.015,
                    0.406
                ],
                [
                    631.255,
                    375.504,
                    0.375
                ],
                [
                    573.521,
                    461.463,
                    0.659
                ],
                [
                    617.57,
                    458.897,
                    0.573
                ],
                [
                    614.576,
                    471.727,
                    0.287
                ],
                [
                    656.487,
                    410.145,
                    0.653
                ],
                [
                    643.657,
                    520.908,
                    0.599
                ],
                [
                    631.255,
                    512.782,
                    0.262
                ],
                [
                    595.546,
                    460.18,
                    0.573
                ],
                [
                    615.004,
                    349.631,
                    0.652
                ],
                [
                    626.337,
                    322.047,
                    0.826
                ]
            ]
        ],
        [
            [
                [
                    512.076,
                    343.77,
                    0.704
                ],
                [
                    518.561,
                    335.34,
                    0.855
                ],
                [
                    502.349,
                    336.637,
                    0.799
                ],
                [
                    523.1,
                    323.667,
                    0.76
                ],
                [
                    480.3,
                    324.964,
                    0.887
                ],
                [
                    534.773,
                    328.855,
                    0.743
                ],
                [
                    446.579,
                    361.928,
                    0.849
                ],
                [
                    592.488,
                    330.152,
                    0.802
                ],
                [
                    479.652,
                    423.534,
                    0.795
                ],
                [
                    621.022,
                    343.77,
                    0.904
                ],
                [
                    491.324,
                    362.576,
                    0.811
                ],
                [
                    523.1,
                    450.77,
                    0.671
                ],
                [
                    472.518,
                    461.146,
                    0.7
                ],
                [
                    549.688,
                    510.431,
                    0.776
                ],
                [
                    491.324,
                    448.825,
                    0.757
                ],
                [
                    528.937,
                    624.565,
                    0.855
                ],
                [
                    587.949,
                    496.813,
                    0.741
                ],
                [
                    497.809,
                    455.958,
                    0.671
                ],
                [
                    490.676,
                    345.391,
                    0.743
                ],
                [
                    501.7,
                    324.316,
                    0.76
                ]
            ]
        ]
    ],
    "3D": [
        [
            [
                -0.04,
                -0.124,
                1.088,
                0.943
            ],
            [
                -0.0,
                -0.069,
                1.127,
                0.92
            ],
            [
                -0.082,
                -0.15,
                1.106,
                0.964
            ],
            [
                -0.005,
                -0.051,
                1.159,
                0.952
            ],
            [
                -0.148,
                -0.059,
                1.111,
                0.983
            ],
            [
                0.115,
                0.064,
                1.093,
                0.981
            ],
            [
                -0.234,
                0.076,
                0.968,
                0.98
            ],
            [
                0.354,
                0.051,
                1.09,
                0.988
            ],
            [
                -0.189,
                -0.105,
                0.754,
                0.964
            ],
            [
                0.315,
                -0.244,
                1.063,
                0.969
            ],
            [
                -0.151,
                -0.009,
                0.955,
                0.925
            ],
            [
                0.121,
                0.2,
                0.563,
                0.952
            ],
            [
                -0.081,
                0.16,
                0.547,
                0.967
            ],
            [
                0.071,
                -0.242,
                0.451,
                0.955
            ],
            [
                -0.172,
                -0.237,
                0.703,
                0.993
            ],
            [
                -0.047,
                -0.396,
                0.093,
                0.985
            ],
            [
                0.224,
                -0.293,
                0.521,
                0.972
            ],
            [
                0.026,
                0.185,
                0.55,
                0.95
            ],
            [
                -0.062,
                0.085,
                1.026,
                0.991
            ],
            [
                -0.077,
                -0.051,
                1.134,
                0.971
            ]
        ]
    ]
 }
--- a/tests/poses_p1.json
+++ b/tests/poses_p1.json
--- a/tests/test_interface.py
+++ b/tests/test_interface.py
@ -0,0 +1,132 @@
 import json
 import sys
 import time
 import numpy as np
 sys.path.append("../swig/")
 import spt
 # ==================================================================================================
 def main():
    """Exercise the spt bindings end to end on the h1, p1 and e1 samples.
    Prints a hand-filled ``Camera``, then for every triangulation run the
    elapsed wall time and the resulting 3D poses, and finally the statistics
    collected by the triangulator.
    """
    skeleton_joints = [
        "nose",
        "eye_left",
        "eye_right",
        "ear_left",
        "ear_right",
        "shoulder_left",
        "shoulder_right",
        "elbow_left",
        "elbow_right",
        "wrist_left",
        "wrist_right",
        "hip_left",
        "hip_right",
        "knee_left",
        "knee_right",
        "ankle_left",
        "ankle_right",
        "hip_middle",
        "shoulder_middle",
        "head",
    ]
    def read_scene(camera_file, pose_file):
        """Load one sample; return its 2D poses and the converted cameras."""
        with open(camera_file, "r") as handle:
            camera_json = json.load(handle)
        with open(pose_file, "r") as handle:
            pose_json = json.load(handle)
        raw_cameras = camera_json["cameras"]
        detections = pose_json["2D"]
        return detections, spt.convert_cameras(raw_cameras)
    def triangulate_and_report(solver, detections, scene_cameras, room):
        """Run one triangulation and print its duration and 3D result."""
        started = time.time()
        result = solver.triangulate_poses(
            detections, scene_cameras, room, skeleton_joints
        )
        print("3D time:", time.time() - started)
        print(np.array(result))
        print("")
    print("")
    # Test camera structure
    demo_cam = spt.Camera()
    demo_cam.name = "Camera 1"
    demo_cam.K = [[1, 0, 0], [0, 1, 0], [0, 0, 1]]
    demo_cam.DC = [0, 0, 0, 0, 0]
    demo_cam.R = [[1, 0, 0], [0, 1, 0], [0, 0, 1]]
    demo_cam.T = [[1], [2], [3]]
    demo_cam.width = 640
    demo_cam.height = 480
    print(demo_cam)
    print("")
    # Sample h1: the triangulator is created only after the data was loaded
    room = [[4.8, 6.0, 2.0], [0, 0, 1.0]]
    detections, scene_cameras = read_scene(
        "/SimplePoseTriangulation/data/h1/sample.json",
        "/SimplePoseTriangulation/tests/poses_h1.json",
    )
    solver = spt.Triangulator(min_score=0.95)
    triangulate_and_report(solver, detections, scene_cameras, room)
    # Sample p1: reset the triangulator before switching to a new scene
    room = [[5.6, 6.4, 2.4], [0, -0.5, 1.2]]
    detections, scene_cameras = read_scene(
        "/SimplePoseTriangulation/data/p1/sample.json",
        "/SimplePoseTriangulation/tests/poses_p1.json",
    )
    solver.reset()
    triangulate_and_report(solver, detections, scene_cameras, room)
    # Run again (without reset) to test last pose cache
    triangulate_and_report(solver, detections, scene_cameras, room)
    # Sample e1
    room = [[6.0, 5.0, 2.0], [1.5, 1.0, -0.5]]
    detections, scene_cameras = read_scene(
        "/SimplePoseTriangulation/data/e1/sample.json",
        "/SimplePoseTriangulation/tests/poses_e1.json",
    )
    solver.reset()
    triangulate_and_report(solver, detections, scene_cameras, room)
    solver.print_stats()
    print("")
 # ==================================================================================================
 # Run the smoke test only when this file is executed as a script, not on import.
 if __name__ == "__main__":
    main()
+{
+    "2D": [
+        [
+            [
+                [
+.214,
+.348,
+.805
+                ],
+                [
+.448,
+.181,
+.834
+                ],
+                [
+.859,
+.881,
+.447
+                ],
+                [
+.726,
+.947,
+.974
+                ],
+                [
+.272,
+.17,
+.745
+                ],
+                [
+.625,
+.271,
+.611
+                ],
+                [
+.24,
+.528,
+.761
+                ],
+                [
+.411,
+.682,
+.486
+                ],
+                [
+.683,
+.352,
+.477
+                ],
+                [
+.976,
+.271,
+.672
+                ],
+                [
+.203,
+.808,
+.292
+                ],
+                [
+.336,
+.677,
+.504
+                ],
+                [
+.927,
+.444,
+.505
+                ],
+                [
+.79,
+.2,
+.462
+                ],
+                [
+.769,
+.131,
+.332
+                ],
+                [
+.835,
+.037,
+.689
+                ],
+                [
+.433,
+.099,
+.485
+                ],
+                [
+.632,
+.061,
+.504
+                ],
+                [
+.433,
+.399,
+.611
+                ],
+                [
+.499,
+.059,
+.745
+                ]
+            ]
+        ],
+        [
+            [
+                [
+.664,
+.786,
+.81
+                ],
+                [
+.643,
+.001,
+.894
+                ],
+                [
+.39,
+.383,
+.862
+                ],
+                [
+.535,
+.26,
+.85
+                ],
+                [
+.181,
+.405,
+.837
+                ],
+                [
+.422,
+.894,
+.721
+                ],
+                [
+.245,
+.356,
+.785
+                ],
+                [
+.367,
+.829,
+.867
+                ],
+                [
+.993,
+.279,
+.717
+                ],
+                [
+.883,
+.017,
+.72
+                ],
+                [
+.864,
+.356,
+.687
+                ],
+                [
+.292,
+.166,
+.674
+                ],
+                [
+.153,
+.698,
+.639
+                ],
+                [
+.664,
+.837,
+.765
+                ],
+                [
+.633,
+.489,
+.798
+                ],
+                [
+.842,
+.518,
+.813
+                ],
+                [
+.551,
+.988,
+.71
+                ],
+                [
+.723,
+.432,
+.639
+                ],
+                [
+.333,
+.125,
+.721
+                ],
+                [
+.858,
+.332,
+.837
+                ]
+            ]
+        ],
+        [
+            [
+                [
+.959,
+.896,
+.26
+                ],
+                [
+.03,
+.205,
+.37
+                ],
+                [
+.506,
+.896,
+.366
+                ],
+                [
+.155,
+.488,
+.826
+                ],
+                [
+.519,
+.607,
+.878
+                ],
+                [
+.37,
+.877,
+.652
+                ],
+                [
+.638,
+.385,
+.766
+                ],
+                [
+.466,
+.877,
+.77
+                ],
+                [
+.5,
+.44,
+.57
+                ],
+                [
+.672,
+.015,
+.406
+                ],
+                [
+.255,
+.504,
+.375
+                ],
+                [
+.521,
+.463,
+.659
+                ],
+                [
+.57,
+.897,
+.573
+                ],
+                [
+.576,
+.727,
+.287
+                ],
+                [
+.487,
+.145,
+.653
+                ],
+                [
+.657,
+.908,
+.599
+                ],
+                [
+.255,
+.782,
+.262
+                ],
+                [
+.546,
+.18,
+.573
+                ],
+                [
+.004,
+.631,
+.652
+                ],
+                [
+.337,
+.047,
+.826
+                ]
+            ]
+        ],
+        [
+            [
+                [
+.076,
+.77,
+.704
+                ],
+                [
+.561,
+.34,
+.855
+                ],
+                [
+.349,
+.637,
+.799
+                ],
+                [
+.1,
+.667,
+.76
+                ],
+                [
+.3,
+.964,
+.887
+                ],
+                [
+.773,
+.855,
+.743
+                ],
+                [
+.579,
+.928,
+.849
+                ],
+                [
+.488,
+.152,
+.802
+                ],
+                [
+.652,
+.534,
+.795
+                ],
+                [
+.022,
+.77,
+.904
+                ],
+                [
+.324,
+.576,
+.811
+                ],
+                [
+.1,
+.77,
+.671
+                ],
+                [
+.518,
+.146,
+.7
+                ],
+                [
+.688,
+.431,
+.776
+                ],
+                [
+.324,
+.825,
+.757
+                ],
+                [
+.937,
+.565,
+.855
+                ],
+                [
+.949,
+.813,
+.741
+                ],
+                [
+.809,
+.958,
+.671
+                ],
+                [
+.676,
+.391,
+.743
+                ],
+                [
+.7,
+.316,
+.76
+                ]
+            ]
+        ]
+    ],
+    "3D": [
+        [
+            [
+                -0.04,
+                -0.124,
+.088,
+.943
+            ],
+            [
+                -0.0,
+                -0.069,
+.127,
+.92
+            ],
+            [
+                -0.082,
+                -0.15,
+.106,
+.964
+            ],
+            [
+                -0.005,
+                -0.051,
+.159,
+.952
+            ],
+            [
+                -0.148,
+                -0.059,
+.111,
+.983
+            ],
+            [
+.115,
+.064,
+.093,
+.981
+            ],
+            [
+                -0.234,
+.076,
+.968,
+.98
+            ],
+            [
+.354,
+.051,
+.09,
+.988
+            ],
+            [
+                -0.189,
+                -0.105,
+.754,
+.964
+            ],
+            [
+.315,
+                -0.244,
+.063,
+.969
+            ],
+            [
+                -0.151,
+                -0.009,
+.955,
+.925
+            ],
+            [
+.121,
+.2,
+.563,
+.952
+            ],
+            [
+                -0.081,
+.16,
+.547,
+.967
+            ],
+            [
+.071,
+                -0.242,
+.451,
+.955
+            ],
+            [
+                -0.172,
+                -0.237,
+.703,
+.993
+            ],
+            [
+                -0.047,
+                -0.396,
+.093,
+.985
+            ],
+            [
+.224,
+                -0.293,
+.521,
+.972
+            ],
+            [
+.026,
+.185,
+.55,
+.95
+            ],
+            [
+                -0.062,
+.085,
+.026,
+.991
+            ],
+            [
+                -0.077,
+                -0.051,
+.134,
+.971
+            ]
+        ]
+    ]
+}