"""Utilities for exoskeleton-based robot state estimation."""
import cv2
import numpy as np
import mujoco
import mink
from scipy.spatial.transform import Rotation as R
from typing import Dict, Tuple, Optional
from cv2 import aruco
import matplotlib.pyplot as plt

# Shared ArUco dictionary (6x6 bits, 250 markers) used by every detection helper below.
ARUCO_DICT = aruco.getPredefinedDictionary(aruco.DICT_6X6_250)

def do_est_aruco_pose(frame, aruco_dict, board, board_length, cameraMatrix=None, distCoeffs=None, pose_vis=None, corners_est=None, corners_vis=None):
    """Estimate the 6-DoF pose of an ArUco board in a BGR image.

    Args:
        frame: BGR input image.
        aruco_dict: cv2.aruco dictionary used for marker detection.
        board: cv2.aruco board object describing the marker layout.
        board_length: board side length; the translation is shifted by half of
            it along the board X and Y axes so it points at the board center.
        cameraMatrix: 3x3 intrinsics; when None, the focal length is
            self-calibrated from the detected markers.
        distCoeffs: distortion coefficients; zeros when None.
        pose_vis: unused (the axes overlay is always drawn onto corners_vis);
            kept for interface compatibility.
        corners_est: optional (corners, ids, rejected) tuple to reuse a
            previous detection instead of re-detecting.
        corners_vis: optional image to draw the marker/axis overlays onto.

    Returns:
        -1 when no markers are found, otherwise a dict with the estimated pose
        ("est_aruco_pose", camera frame), visualization overlays, intrinsics,
        (rvec, tvec), the raw detections, and object/image correspondences.
    """
    from cv2 import aruco
    gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY).astype(np.uint8)
    if corners_est is None:
        corners, ids, rejected = cv2.aruco.detectMarkers(gray, aruco_dict, parameters=aruco.DetectorParameters())
    else:
        corners, ids, rejected = corners_est
    if ids is None:
        return -1

    corners_vis = cv2.aruco.drawDetectedMarkers(cv2.cvtColor(gray, cv2.COLOR_GRAY2BGR) if corners_vis is None else corners_vis, corners, ids)
    W, H = frame.shape[:2][::-1]
    f0 = max(W, H) // 2  # initial focal-length guess for self-calibration
    if distCoeffs is None:
        distCoeffs = np.zeros((8, 1), dtype=np.float64)
    if cameraMatrix is None:
        camera_matrix_init = np.array([[f0, 0, W / 2.0], [0, f0, H / 2.0], [0, 0, 1.0]], dtype=np.float64)
        # Calibrate only the focal length; distortion, aspect ratio, and
        # principal point stay fixed at their initial values.
        flags = (cv2.CALIB_ZERO_TANGENT_DIST | cv2.CALIB_FIX_K1 | cv2.CALIB_FIX_K2 | cv2.CALIB_FIX_K3 |
                 cv2.CALIB_FIX_K4 | cv2.CALIB_FIX_K5 | cv2.CALIB_FIX_K6 | cv2.CALIB_FIX_ASPECT_RATIO |
                 cv2.CALIB_FIX_PRINCIPAL_POINT)
        # BUGFIX: pass distCoeffs here. The previous code passed
        # dist_coeffs_init, which was only bound when distCoeffs was None, so
        # supplying distCoeffs without cameraMatrix raised a NameError.
        ret, cameraMatrix, distCoeffs, rvecs, tvecs = aruco.calibrateCameraAruco(
            corners, ids, np.array([len(ids)]), board, gray.shape[::-1], camera_matrix_init, distCoeffs, flags=flags)

    # Use solvePnPGeneric to remove pose ambiguity (planar targets admit two solutions)
    obj_pts, img_pts = cv2.aruco.getBoardObjectAndImagePoints(board, corners, ids)
    if obj_pts is None or obj_pts.size == 0:
        return -1
    obj_pts = obj_pts.reshape(-1, 3).astype(np.float32)
    img_pts = img_pts.reshape(-1, 2).astype(np.float32)

    # Request all valid PnP solutions
    ok, rvecs, tvecs, _ = cv2.solvePnPGeneric(obj_pts, img_pts, cameraMatrix, distCoeffs, flags=cv2.SOLVEPNP_IPPE)

    # Choose the pose whose board normal points toward the camera
    best_idx = 0
    for i, (rv, tv) in enumerate(zip(rvecs, tvecs)):
        R_mat, _ = cv2.Rodrigues(rv)
        normal = R_mat @ np.array([0., 0., 1.])  # board +Z in camera coords
        board_in_front = tv[2] > 0  # Z must be positive (board in front of the camera)
        faces_camera = normal[2] < 0  # normal points toward the camera
        if board_in_front and faces_camera:
            best_idx = i
            break
    rvec, tvec = rvecs[best_idx][:, 0], tvecs[best_idx][:, 0]

    # Object points expressed in the camera frame (used downstream as a confidence signal)
    obj_pts_cam = (cv2.Rodrigues(rvec)[0] @ obj_pts.T + tvec.reshape(3, 1)).T
    img_reproj, _ = cv2.projectPoints(obj_pts, rvec, tvec, cameraMatrix, distCoeffs)
    img_reproj = img_reproj.reshape(-1, 2)

    # Shift the translation from the board origin/corner to the board center
    R_mat = cv2.Rodrigues(rvec)[0]
    center_offset_board = np.array([board_length / 2, board_length / 2, 0], dtype=np.float64)
    tvec = tvec + R_mat.dot(center_offset_board)

    # Draw axes with a fixed small size (0.03 m = 30 mm). NOTE(review): zero
    # distortion is assumed when drawing even if distCoeffs is non-zero — confirm intended.
    pose_vis = cv2.drawFrameAxes(corners_vis, cameraMatrix, np.zeros((1, 5)), rvec, tvec, 0.03)

    est_aruco_pose = np.eye(4)
    est_aruco_pose[:3, 3] = tvec
    est_aruco_pose[:3, :3] = R_mat
    # Negate columns 1 and 2 (Y/Z basis) — presumably OpenCV -> renderer camera
    # convention flip; confirm against the consumer of est_aruco_pose.
    est_aruco_pose[:, 1:-1] *= -1

    return {
        "est_aruco_pose": est_aruco_pose,
        "pose_vis": pose_vis,
        "corners_vis": corners_vis,
        "corners": (ids.flatten(), corners),
        "cameraMatrix": cameraMatrix,
        "rtvec": (rvec, tvec),
        "distCoeffs": distCoeffs,
        "corners_est": (corners, ids, rejected),
        "obj_img_pts": (obj_pts_cam, img_pts),
    }


def get_link_poses_from_robot( robot_config, model: mujoco.MjModel, data: mujoco.MjData):
    """Extract 4x4 world poses of all configured links from the robot's current state.

    Args:
        robot_config: config whose `links` map link names to per-link settings
            carrying the MuJoCo body name in `pybullet_name`.
        model / data: MuJoCo model and data (reads `xpos` / `xquat`).

    Returns:
        Dict of link name -> 4x4 homogeneous pose. Links whose body is missing
        or whose quaternion is uninitialized (near-zero norm) are skipped.
    """
    link_poses = {}
    for link_name, cfg in robot_config.links.items():
        # Get the robot body (not the exoskeleton mocap body)
        body_id = mujoco.mj_name2id(model, mujoco.mjtObj.mjOBJ_BODY, cfg.pybullet_name)
        # BUGFIX: mj_name2id returns -1 for unknown names; previously this
        # silently indexed xquat[-1] (the last body) instead of skipping.
        if body_id < 0: continue

        # Skip bodies whose quaternion is still zero (state not yet computed)
        quat_wxyz = data.xquat[body_id]
        if np.linalg.norm(quat_wxyz) < 0.01: continue

        pose = np.eye(4)
        pose[:3, :3] = R.from_quat(quat_wxyz[[1, 2, 3, 0]]).as_matrix()  # wxyz -> xyzw
        pose[:3, 3] = data.xpos[body_id]
        link_poses[link_name] = pose

    return link_poses


def get_body_pose_in_world(
    model: mujoco.MjModel, data: mujoco.MjData, body_name: str
) -> np.ndarray:
    """4x4 homogeneous world pose of the named body origin (MuJoCo `xpos` / `xquat`)."""
    body_id = mujoco.mj_name2id(model, mujoco.mjtObj.mjOBJ_BODY, body_name)
    if body_id < 0:
        raise ValueError(f"Body not found: {body_name!r}")
    wxyz = data.xquat[body_id]
    # A near-zero quaternion means the body state was never computed.
    if np.linalg.norm(wxyz) < 0.01:
        raise ValueError(f"Invalid quaternion for body {body_name!r}")
    # Assemble the transform: rotation from the wxyz quaternion (reordered to
    # scipy's xyzw convention) alongside the body translation.
    rotation = R.from_quat(wxyz[[1, 2, 3, 0]]).as_matrix()
    translation = data.xpos[body_id]
    return np.block([[rotation, translation[:, None]], [np.zeros((1, 3)), np.ones((1, 1))]])


def position_exoskeleton_meshes( robot_config, model: mujoco.MjModel, data: mujoco.MjData, link_poses: Dict[str, np.ndarray] = None):
    """Position the virtual exoskeleton mocap bodies for every configured link.

    For each link, three mocap bodies are written: "<link>_link_mesh" and
    "<link>_exo_mesh" at the link pose, plus "<link>_exo_plane" offset by the
    link's ArUco mounting transform. Detected poses from `link_poses` take
    precedence over the robot's current MuJoCo state. Calls mj_forward at the
    end so derived quantities are refreshed.

    Args:
        robot_config: config whose `links` map names to per-link settings.
        model / data: MuJoCo model and data (mocap fields written in place).
        link_poses: optional dict of link name -> 4x4 world pose.
    """
    for link_name, cfg in robot_config.links.items():

        # Get link pose
        if link_poses is not None and link_name in link_poses:
            # Use detected pose (already in world coordinates from detection)
            link_pose = link_poses[link_name]
            link_pos = link_pose[:3, 3]

            # Skip degenerate rotations (a proper rotation has determinant 1)
            rot_mat = link_pose[:3, :3]
            if not np.allclose(np.linalg.det(rot_mat), 1.0, atol=0.01): continue

            link_rot = R.from_matrix(rot_mat)
            link_quat_wxyz = link_rot.as_quat()[[3, 0, 1, 2]]  # xyzw to wxyz
        else:
            # Use robot's current state
            body_id = model.body(cfg.pybullet_name).id
            link_pos = data.xpos[body_id]
            link_quat_wxyz = data.xquat[body_id]
            # BUGFIX: catch only ValueError (what scipy raises for zero-norm /
            # malformed quaternions) instead of a bare except that hid every error.
            try: link_rot = R.from_quat(link_quat_wxyz[[1, 2, 3, 0]])  # wxyz to xyzw
            except ValueError: continue

        # Set link mesh position and orientation
        link_mocap_id = model.body_mocapid[mujoco.mj_name2id(model, mujoco.mjtObj.mjOBJ_BODY, f"{link_name}_link_mesh")]
        data.mocap_pos[link_mocap_id] = link_pos
        data.mocap_quat[link_mocap_id] = link_quat_wxyz

        # Set exo mesh (same as link)
        exo_mesh_mocap_id = model.body_mocapid[mujoco.mj_name2id(model, mujoco.mjtObj.mjOBJ_BODY, f"{link_name}_exo_mesh")]
        data.mocap_pos[exo_mesh_mocap_id] = link_pos
        data.mocap_quat[exo_mesh_mocap_id] = link_quat_wxyz

        # Set aruco plane with the configured offset applied in the link frame
        # (aruco_offset_pos presumably in mm, hence /1000 — confirm against config)
        plane_body_id = mujoco.mj_name2id(model, mujoco.mjtObj.mjOBJ_BODY, f"{link_name}_exo_plane")
        data.mocap_pos[model.body_mocapid[plane_body_id]] = link_pos + link_rot.apply(cfg.aruco_offset_pos / 1000)
        data.mocap_quat[model.body_mocapid[plane_body_id]] = (link_rot * R.from_euler('xyz', cfg.aruco_offset_rot)).as_quat()[[3, 0, 1, 2]]
    mujoco.mj_forward(model, data)

# Detect link poses from ArUco markers in image.
def detect_link_poses( rgb: np.ndarray, robot_config, visualize: bool = False, cam_K: np.ndarray = None):
    """Detect the pose of each configured link from its ArUco board.

    NOTE(review): this relies on "larger_base" being the FIRST detected entry
    of robot_config.links — `cam_pose` is only assigned in the larger_base
    branch, and both the `else` branch and the final return read it, so any
    other ordering (or larger_base going undetected) raises NameError.
    Confirm configs always list larger_base first.

    Args:
        rgb: input image, uint8 RGB (floats in [0, 1] are converted).
        robot_config: provides `links` (per-link settings) and
            `aruco_board_objects` (per-link cv2.aruco boards).
        visualize: when True, show the annotated image via matplotlib.
        cam_K: optional camera intrinsics; when None, they are self-calibrated
            from the larger_base board and reused for the remaining links.

    Returns:
        (link_poses, cam_pose, cam_K, corners_cache, vis_img, obj_img_pts),
        where link_poses maps link name -> 4x4 pose in the larger_base frame
        (larger_base itself is identity) and cam_pose is the camera-frame pose
        of larger_base.
    """

    # Convert to uint8 if needed
    if rgb.dtype == np.float32 or rgb.dtype == np.float64: rgb = (rgb * 255).astype(np.uint8)
    
    # Detect all markers once; every per-link call below reuses this cache
    gray = cv2.cvtColor(rgb, cv2.COLOR_RGB2GRAY)
    corners_cache = cv2.aruco.detectMarkers(gray, ARUCO_DICT, parameters=cv2.aruco.DetectorParameters())
    vis_img = rgb.copy()
    
    # Draw all detected markers
    corners, ids, rejected = corners_cache
    cv2.aruco.drawDetectedMarkers(vis_img, corners, ids)

    # Detect poses for all links (FIRST PASS: all in camera frame)
    link_poses = {}
    obj_img_pts = {}
    for link_name in robot_config.links.keys():
        cfg = robot_config.links[link_name]
        
        result = do_est_aruco_pose( rgb, ARUCO_DICT, robot_config.aruco_board_objects[link_name], cfg.board_length, cameraMatrix=cam_K, corners_est=corners_cache, corners_vis=vis_img)
        if result == -1: continue
        vis_img = result['pose_vis']
        
        # Link pose in camera frame: board pose composed with the inverse of the
        # link->aruco mounting transform (offset_pos presumably mm, hence /1000 — confirm)
        link_to_aruco = np.block([ [R.from_euler('xyz', cfg.aruco_offset_rot).as_matrix(), cfg.aruco_offset_pos[:, None] / 1000], [np.zeros((1, 3)), 1] ])
        link_poses[link_name] = result['est_aruco_pose'] @ np.linalg.inv(link_to_aruco)
        obj_img_pts[link_name] = result['obj_img_pts']
        # larger_base defines the world frame: record its camera-frame pose as
        # cam_pose, pin its own pose to identity, and adopt the (possibly
        # self-calibrated) intrinsics for all subsequent links
        if link_name == "larger_base": cam_K,cam_pose,link_poses["larger_base"] = result['cameraMatrix'],link_poses[link_name],np.eye(4)
        else: link_poses[link_name] = np.linalg.inv(cam_pose) @ link_poses[link_name]
    
    if visualize: plt.imshow(cv2.cvtColor(vis_img, cv2.COLOR_BGR2RGB));plt.show()
    return link_poses, cam_pose, cam_K, corners_cache,vis_img,obj_img_pts


def detect_and_set_link_poses(rgb: np.ndarray, model: mujoco.MjModel, data: mujoco.MjData, robot_config, visualize: bool = False, cam_K: np.ndarray = None):
    """Detect link poses from ArUco markers in image and set virtual exoskeleton meshes to match.

    Returns the full detection tuple from detect_link_poses:
    (link_poses, camera_pose_world, cam_K, corners_cache, corners_vis, obj_img_pts).
    """
    detection = detect_link_poses(rgb, robot_config, visualize=visualize, cam_K=cam_K)
    # First element of the tuple is the link-pose dict used to place the meshes.
    position_exoskeleton_meshes(robot_config, model, data, detection[0])
    return detection


def detect_and_position_puck(rgb: np.ndarray, model: mujoco.MjModel, data: mujoco.MjData, puck_config, cam_K: np.ndarray, cam_pose: np.ndarray, corners_cache, visualize: bool = False) -> Optional[np.ndarray]:
    """Detect puck pose from ArUco and position it in the scene.
    
    Args:
        rgb: input image (floats in [0, 1] are converted to uint8).
        model / data: MuJoCo model and data; mocap bodies updated in place.
        puck_config: PuckConfig object with ArUco board and offset info
        cam_K: camera intrinsic matrix.
        cam_pose: camera-frame pose of the base; its inverse maps camera-frame
            poses into the base frame.
        corners_cache: pre-detected (corners, ids, rejected) ArUco tuple.
        visualize: when True, show the pose visualization via matplotlib.
    
    Returns:
        Tuple (puck pose as 4x4 matrix relative to base, (object, image) point
        correspondences), or None if not detected.
    """
    
    # Convert to uint8 if needed
    if rgb.dtype == np.float32 or rgb.dtype == np.float64: rgb = (rgb * 255).astype(np.uint8)
    
    # Detect puck ArUco
    vis_img = rgb.copy()
    result = do_est_aruco_pose(rgb, ARUCO_DICT, puck_config.aruco_board, puck_config.board_length, cameraMatrix=cam_K, corners_est=corners_cache, corners_vis=vis_img)
    if result == -1: return None

    if visualize: plt.imshow(cv2.cvtColor(result['pose_vis'], cv2.COLOR_BGR2RGB));plt.show()
    
    # Compute puck pose - transform from camera frame to robot base frame.
    # NOTE(review): aruco_offset_pos is used as-is here, while the link path
    # divides by 1000 (mm -> m) — confirm the puck offset is already in meters.
    puck_to_aruco = np.block([ [R.from_euler('xyz', puck_config.aruco_offset_rot).as_matrix(), puck_config.aruco_offset_pos[:, None]], [np.zeros((1, 3)), 1] ])
    puck_pose_camera = result['est_aruco_pose'] @ np.linalg.inv(puck_to_aruco)
    # Transform to base frame (same as other links)
    puck_pose = np.linalg.inv(cam_pose) @ puck_pose_camera
    
    # Position puck in scene
    puck_body_id = model.body("grabbable_puck").id
    data.mocap_pos[model.body_mocapid[puck_body_id]] = puck_pose[:3, 3]
    data.mocap_quat[model.body_mocapid[puck_body_id]] = R.from_matrix(puck_pose[:3, :3]).as_quat()[[3, 0, 1, 2]]
    
    # Position ArUco plane relative to puck
    aruco_body_id = mujoco.mj_name2id(model, mujoco.mjtObj.mjOBJ_BODY, "grabbable_aruco_plane")
    aruco_pose = puck_pose @ puck_to_aruco
    data.mocap_pos[model.body_mocapid[aruco_body_id]] = aruco_pose[:3, 3]
    data.mocap_quat[model.body_mocapid[aruco_body_id]] = R.from_matrix(aruco_pose[:3, :3]).as_quat()[[3, 0, 1, 2]]
    
    return puck_pose,result['obj_img_pts']

def detect_and_position_alignment_board(rgb: np.ndarray, model: mujoco.MjModel, data: mujoco.MjData, alignment_board_config, cam_K: np.ndarray, cam_pose: np.ndarray, corners_cache, visualize: bool = False) -> Optional[np.ndarray]:
    """Detect alignment board pose from ArUco and position it in the scene.
    
    Args:
        rgb: input image (floats in [0, 1] are converted to uint8).
        alignment_board_config: AlignmentBoardConfig object with ArUco board and offset info
        cam_K: Camera intrinsic matrix
        cam_pose: Camera pose in world frame (4x4 matrix)
        corners_cache: Pre-detected ArUco corners from image
        visualize: when True, show the pose visualization via matplotlib.
    
    Returns:
        Tuple (board pose as 4x4 matrix relative to base, (object, image) point
        correspondences), or None if not detected.
    """
    
    # Convert to uint8 if needed
    if rgb.dtype == np.float32 or rgb.dtype == np.float64: rgb = (rgb * 255).astype(np.uint8)
    
    # Detect alignment board ArUco
    vis_img = rgb.copy()
    result = do_est_aruco_pose(rgb, ARUCO_DICT, alignment_board_config.aruco_board, alignment_board_config.board_length, cameraMatrix=cam_K, corners_est=corners_cache, corners_vis=vis_img)
    if result == -1: return None

    if visualize: plt.imshow(cv2.cvtColor(result['pose_vis'], cv2.COLOR_BGR2RGB));plt.show()
    
    # Compute board pose - transform from camera frame to robot base frame.
    # NOTE(review): aruco_offset_pos is used as-is here (no /1000 as in the
    # link path) — confirm the offset is already in meters.
    board_to_aruco = np.block([ [R.from_euler('xyz', alignment_board_config.aruco_offset_rot).as_matrix(), alignment_board_config.aruco_offset_pos[:, None]], [np.zeros((1, 3)), 1] ])
    board_pose_camera = result['est_aruco_pose'] @ np.linalg.inv(board_to_aruco)
    # Transform to base frame (same as other links)
    board_pose = np.linalg.inv(cam_pose) @ board_pose_camera
    
    # Position board in scene - the board body itself contains the ArUco plane
    board_body_id = model.body("alignment_board").id
    data.mocap_pos[model.body_mocapid[board_body_id]] = board_pose[:3, 3]
    data.mocap_quat[model.body_mocapid[board_body_id]] = R.from_matrix(board_pose[:3, :3]).as_quat()[[3, 0, 1, 2]]
    
    return board_pose, result['obj_img_pts']

def position_puck_aruco_from_mocap(model: mujoco.MjModel, data: mujoco.MjData, puck_config) -> np.ndarray:
    """Position the puck's ArUco marker from the puck's current mocap pose.

    Args:
        model: MuJoCo model
        data: MuJoCo data
        puck_config: PuckConfig object with ArUco offset info

    Returns:
        ArUco pose (4x4 matrix) in world frame
    """
    # Read the puck's current mocap pose (position + wxyz quaternion).
    puck_mocap_idx = model.body_mocapid[model.body("grabbable_puck").id]
    puck_position = data.mocap_pos[puck_mocap_idx]
    puck_wxyz = data.mocap_quat[puck_mocap_idx]

    puck_transform = np.eye(4)
    puck_transform[:3, :3] = R.from_quat(puck_wxyz[[1, 2, 3, 0]]).as_matrix()  # wxyz -> xyzw
    puck_transform[:3, 3] = puck_position

    # Fixed puck -> ArUco mounting transform from the config.
    mount_transform = np.eye(4)
    mount_transform[:3, :3] = R.from_euler('xyz', puck_config.aruco_offset_rot).as_matrix()
    mount_transform[:3, 3] = puck_config.aruco_offset_pos

    aruco_pose = puck_transform @ mount_transform

    # Write the resulting pose to the ArUco plane's mocap body.
    plane_mocap_idx = model.body_mocapid[model.body("grabbable_aruco_plane").id]
    data.mocap_pos[plane_mocap_idx] = aruco_pose[:3, 3]
    data.mocap_quat[plane_mocap_idx] = R.from_matrix(aruco_pose[:3, :3]).as_quat()[[3, 0, 1, 2]]

    return aruco_pose

def track_aruco_with_ik(model: mujoco.MjModel, data: mujoco.MjData, puck_config, configuration, dt: float, visualize_target: bool = True) -> np.ndarray:
    """Use IK to track the puck's ArUco marker with a fixed end-effector offset.

    Refreshes the ArUco pose from the puck mocap body, solves one IK step with
    mink, and writes the integrated configuration back into data.qpos.

    Args:
        model / data: MuJoCo model and data (qpos overwritten in place).
        puck_config: PuckConfig with the puck -> ArUco offset.
        configuration: mink.Configuration integrated in place.
        dt: integration timestep for the IK velocity.
        visualize_target: when True, move the green "target" mocap sphere to
            the computed end-effector target pose.

    Returns:
        float: norm of the solved IK velocity, used as a convergence proxy
        (smaller means the end effector is closer to tracking the target).
    """

    # Hand-calibrated ArUco -> end-effector grasp offset: base rotation flipped
    # 180 deg about Y to grasp from the front, position nudged up/back by a few
    # millimeters relative to the measured values. TODO: move to config.
    aruco_to_ee_offset = np.block([[ R.from_euler('xyz', [-3.14159265, 1.57000633, -1.60001057]).as_matrix() @ R.from_euler('xyz', [0, np.pi, 0]).as_matrix(), -np.array([-0.01096988+.02, -0.00597524+.01, -0.01664 + 0.00])[:, None] ], [np.zeros((1, 3)), 1]]) # hardcoded offset from aruco to grasp (front side, moved up)

    # Update ArUco pose from puck mocap (reads interactive position when dragged)
    aruco_pose = position_puck_aruco_from_mocap(model, data, puck_config)
    target_ee_pose = aruco_pose @ aruco_to_ee_offset
    
    # Visualize the target using the green "target" mocap sphere
    if visualize_target:
        target_body_id = mujoco.mj_name2id(model, mujoco.mjtObj.mjOBJ_BODY, "target")
        data.mocap_pos[model.body_mocapid[target_body_id]] = target_ee_pose[:3, 3]
        data.mocap_quat[model.body_mocapid[target_body_id]] = R.from_matrix(target_ee_pose[:3, :3]).as_quat()[[3, 0, 1, 2]]
    
    # IK: track the target pose (position weighted 10x orientation) while a
    # weak posture task regularizes toward the current joint state
    ee_task = mink.FrameTask(frame_name="end_effector", frame_type="site", position_cost=1, orientation_cost=.1)
    ee_task.set_target(mink.SE3(wxyz_xyz=np.concatenate([R.from_matrix(target_ee_pose[:3, :3]).as_quat()[[3,0,1,2]], target_ee_pose[:3, 3]])))
    
    posture_task = mink.PostureTask(model, cost=1e-3)
    posture_task.set_target(data.qpos)
    
    vel = mink.solve_ik(configuration, [ee_task, posture_task], dt, "daqp", limits=[mink.ConfigurationLimit(model)])
    configuration.integrate_inplace(vel, dt)
    data.qpos[:] = configuration.q
    mujoco.mj_forward(model, data)

    # Norm of the joint velocity as a measure of IK convergence
    return np.linalg.norm(vel)



def combine_xmls(base_xml: str, *additions: str) -> str:
    """Splice each XML fragment into *base_xml* just before its closing </mujoco> tag."""
    merged = base_xml
    for fragment in additions:
        # Each fragment lands on its own line ahead of the closing tag.
        merged = merged.replace('</mujoco>', f'{fragment}\n</mujoco>')
    return merged


def render_from_camera_pose(model: mujoco.MjModel, data: mujoco.MjData, cam_pose: np.ndarray, cam_K: np.ndarray, height: int, width: int,segmentation: bool = False):
    """Render the scene from the estimated camera pose.

    Args:
        model / data: MuJoCo model and data; data.cam_xpos / cam_xmat and
            model.cam_fovy of the 'estimated_camera' are overwritten in place.
        cam_pose: 4x4 camera pose; its inverse supplies the camera world
            position, so cam_pose presumably maps world -> camera — confirm
            against the producer (detect_link_poses).
        cam_K: camera intrinsics; only fy (cam_K[1, 1]) is used, for the FOV.
        height, width: output image size in pixels.
        segmentation: when True, render segmentation IDs instead of RGB.

    Returns:
        Rendered image (numpy array)
    """
    # NOTE(review): a new Renderer is constructed per call and never closed —
    # consider caching/closing it if this is called per frame.
    from mujoco.renderer import Renderer
    renderer = Renderer(model, height=height, width=width)
    cam_id = model.cam('estimated_camera').id

    if segmentation: renderer.enable_segmentation_rendering()
    
    # Set camera position and orientation; the diag(1, -1, -1) factor flips the
    # OpenCV-style camera axes into MuJoCo's camera convention.
    data.cam_xpos[cam_id] = np.linalg.inv(cam_pose)[:3, 3]
    data.cam_xmat[cam_id] = (np.array([[1, 0, 0], [0, -1, 0], [0, 0, -1]]) @ cam_pose[:3, :3]).T.reshape(-1)
    
    # Vertical FOV (degrees) derived from the focal length fy
    model.cam_fovy[cam_id] = np.degrees(2 * np.arctan(height / (2 * cam_K[1, 1])))
    
    renderer.update_scene(data, camera=cam_id)
    return renderer.render()


def estimate_robot_state(
    model: mujoco.MjModel,
    data: mujoco.MjData,
    robot_config,
    link_poses,
    ik_iterations: int = 15,
    position_cost: float = 1.0,
    orientation_cost: float = 0.03,
    enforce_limits: bool = True,
    return_error: bool = False,
):
    """Estimate robot joint configuration from link poses (e.g. fixed_gripper, moveable_gripper).

    Uses IK to fit the detected link poses. When enforce_limits=False, joint limits are
    not applied so the solution can match the detected poses even if they are not reachable
    by the real robot (useful for visualization or training targets).

    Args:
        model / data: MuJoCo model and data; data.qpos is overwritten with the solution.
        robot_config: config whose `links` carry the MuJoCo body name (`pybullet_name`).
        link_poses: dict of link name -> 4x4 world target pose.
        ik_iterations: number of solve/integrate steps.
        position_cost / orientation_cost: mink.FrameTask weights.
        enforce_limits: apply mink.ConfigurationLimit when True.
        return_error: also return the IK error dict when True.

    Returns:
        configuration: mink.Configuration with solved joint state
        ik_error (only when return_error=True): dict with "position_mm" (mean position
        error in mm) and "orientation_deg" (mean angular error in deg)
    """
    configuration = mink.Configuration(model)
    configuration.update(data.qpos)

    # Direct link-name -> body-name lookup (assumes body names are unique, as
    # the previous reverse-map implementation implicitly did); replaces an
    # O(n) list-comprehension search per link.
    link_to_body = {link_name: cfg.pybullet_name for link_name, cfg in robot_config.links.items()}

    tasks = []
    link_info = []  # (link_name, pyb_name, target_pose) for error computation
    for link_name in link_poses:
        pyb_name = link_to_body.get(link_name)
        if pyb_name is None:
            continue  # pose for a link the config does not know about
        task = mink.FrameTask(
            frame_name=pyb_name,
            frame_type="body",
            position_cost=position_cost,
            orientation_cost=orientation_cost,
        )
        pose = np.asarray(link_poses[link_name])
        quat_wxyz = R.from_matrix(pose[:3, :3]).as_quat()[[3, 0, 1, 2]]  # xyzw -> wxyz
        xyz = pose[:3, 3]
        task.set_target(mink.SE3(wxyz_xyz=np.concatenate([quat_wxyz, xyz])))
        tasks.append(task)
        link_info.append((link_name, pyb_name, pose))

    limits = [mink.ConfigurationLimit(model=model)] if enforce_limits else []
    for _ in range(ik_iterations):
        vel = mink.solve_ik(configuration, tasks, 0.005, "daqp", limits=limits)
        configuration.integrate_inplace(vel, 0.005)

    # Compute IK error: forward kinematics with the solution, then compare to targets
    data.qpos[:] = configuration.q
    mujoco.mj_forward(model, data)
    pos_errors_mm = []
    orient_errors_deg = []
    for link_name, pyb_name, target_pose in link_info:
        body_id = model.body(pyb_name).id
        current_pos = data.xpos[body_id]
        current_rot = R.from_quat(data.xquat[body_id][[1, 2, 3, 0]])  # wxyz -> xyzw
        target_rot = R.from_matrix(target_pose[:3, :3])
        pos_errors_mm.append(1000.0 * np.linalg.norm(current_pos - target_pose[:3, 3]))
        # Angular distance between target and achieved orientation
        orient_errors_deg.append(np.degrees((target_rot * current_rot.inv()).magnitude()))
    ik_error = {
        "position_mm": float(np.mean(pos_errors_mm)) if pos_errors_mm else 0.0,
        "orientation_deg": float(np.mean(orient_errors_deg)) if orient_errors_deg else 0.0,
    }
    if return_error:
        return configuration, ik_error
    return configuration

