Spaces:

Daankular
/

Image2Model

Running on Zero

App Files Files Community

Image2Model / Retarget /animate.py

Daankular

Port MeshForge features to ZeroGPU Space: FireRed, PSHuman, Motion Search

8f1bcd9 2 days ago

raw

history blame contribute delete

27.8 kB

	"""
	animate.py
	──────────────────────────────────────────────────────────────────────────────
	Bake SMPL motion (from HumanML3D [T, 263] features) onto a UniRig-rigged GLB.

	Retargeting method: world-direction matching
	────────────────────────────────────────────
	Commercial retargeters (Mixamo, Rokoko, MotionBuilder) avoid rest-pose
	convention mismatches by matching WORLD BONE DIRECTIONS, not local rotations.

	Algorithm (per frame, per bone):
	1. Run t2m FK with HumanML3D 6D rotations → world bone direction d_t2m
	2. Flip X axis: t2m +X = character's LEFT; SMPL/UniRig +X = character's RIGHT
	So d_desired = (-d_t2m_x, d_t2m_y, d_t2m_z) in SMPL/UniRig world frame
	3. d_rest = normalize(ur_pos[bone] - ur_pos[parent]) from GLB inverse bind matrices
	4. R_world = R_between(d_rest, d_desired) -- minimal rotation in world space
	5. local_rot = inv(R_world[parent]) @ R_world[bone]
	6. pose_rot_delta = inv(rest_r) @ local_rot -- composing with glTF rest rotation

	This avoids all rest-pose convention issues:
	- t2m canonical arms point DOWN: handled automatically
	- t2m canonical hips/shoulders have inverted X: handled by the X-flip
	- UniRig non-identity rest rotations: handled by inv(rest_r) composition

	Key bugs fixed vs previous version:
	- IBM column-major: glTF IBMs are column-major; was using inv(ibm)[:3,3] (zeros).
	Fixed to inv(ibm.T)[:3,3] which gives correct world-space bone positions.
	- Normalisation: was mixing ur/smpl Y ranges, causing wrong height alignment.
	Fixed with independent per-skeleton Y normalisation.
	- Rotation convention: was applying t2m rotations directly without X-flip.
	Fixed by world-direction matching with coordinate-frame conversion.
	"""
	from __future__ import annotations
	import os
	import re
	import numpy as np
	from typing import Union

	from .smpl import SMPLMotion, hml3d_to_smpl_motion


	# ──────────────────────────────────────────────────────────────────────────────
	# T2M (HumanML3D) skeleton constants
	# Source: HumanML3D/common/paramUtil.py
	# ──────────────────────────────────────────────────────────────────────────────

	# Canonical unit offset (parent -> joint direction) for each of the 22 t2m
	# joints, one row per joint in joint-index order.
	T2M_RAW_OFFSETS = np.array(
	    [
	        (0, 0, 0),    #  0 Hips (root)
	        (1, 0, 0),    #  1 LeftUpLeg      +X = character LEFT in t2m convention
	        (-1, 0, 0),   #  2 RightUpLeg
	        (0, 1, 0),    #  3 Spine
	        (0, -1, 0),   #  4 LeftLeg
	        (0, -1, 0),   #  5 RightLeg
	        (0, 1, 0),    #  6 Spine1
	        (0, -1, 0),   #  7 LeftFoot
	        (0, -1, 0),   #  8 RightFoot
	        (0, 1, 0),    #  9 Spine2
	        (0, 0, 1),    # 10 LeftToeBase
	        (0, 0, 1),    # 11 RightToeBase
	        (0, 1, 0),    # 12 Neck
	        (1, 0, 0),    # 13 LeftShoulder   +X = character LEFT
	        (-1, 0, 0),   # 14 RightShoulder
	        (0, 0, 1),    # 15 Head
	        (0, -1, 0),   # 16 LeftArm        arms hang DOWN in t2m canonical
	        (0, -1, 0),   # 17 RightArm
	        (0, -1, 0),   # 18 LeftForeArm
	        (0, -1, 0),   # 19 RightForeArm
	        (0, -1, 0),   # 20 LeftHand
	        (0, -1, 0),   # 21 RightHand
	    ],
	    dtype=np.float64,
	)

	# Kinematic chains of the t2m skeleton. Each list is a sequence of joint
	# indices in which every entry is the parent of the entry that follows it.
	T2M_KINEMATIC_CHAIN = [
	    [0, 2, 5, 8, 11],       # Hips -> RightUpLeg -> RightLeg -> RightFoot -> RightToe
	    [0, 1, 4, 7, 10],       # Hips -> LeftUpLeg -> LeftLeg -> LeftFoot -> LeftToe
	    [0, 3, 6, 9, 12, 15],   # Hips -> Spine -> Spine1 -> Spine2 -> Neck -> Head
	    [9, 14, 17, 19, 21],    # Spine2 -> RightShoulder -> RightArm -> RightForeArm -> RightHand
	    [9, 13, 16, 18, 20],    # Spine2 -> LeftShoulder -> LeftArm -> LeftForeArm -> LeftHand
	]

	# Parent joint index for each of the 22 t2m joints (-1 = no parent, i.e. the root).
	# Derived from the chains above so the two tables cannot drift apart.
	T2M_PARENTS = [-1] * 22
	for _chain in T2M_KINEMATIC_CHAIN:
	    for _k in range(1, len(_chain)):
	        T2M_PARENTS[_chain[_k]] = _chain[_k - 1]

	# ──────────────────────────────────────────────────────────────────────────────
	# SMPL joint names / T-pose (for bone mapping reference)
	# ──────────────────────────────────────────────────────────────────────────────

	# Human-readable joint names; list position == SMPL / t2m joint index.
	SMPL_NAMES = [
	    "Hips",           #  0
	    "LeftUpLeg",      #  1
	    "RightUpLeg",     #  2
	    "Spine",          #  3
	    "LeftLeg",        #  4
	    "RightLeg",       #  5
	    "Spine1",         #  6
	    "LeftFoot",       #  7
	    "RightFoot",      #  8
	    "Spine2",         #  9
	    "LeftToeBase",    # 10
	    "RightToeBase",   # 11
	    "Neck",           # 12
	    "LeftShoulder",   # 13
	    "RightShoulder",  # 14
	    "Head",           # 15
	    "LeftArm",        # 16
	    "RightArm",       # 17
	    "LeftForeArm",    # 18
	    "RightForeArm",   # 19
	    "LeftHand",       # 20
	    "RightHand",      # 21
	]

	# Approximate T-pose joint world positions in metres (Y-up, facing +Z)
	# +X = character's RIGHT (standard SMPL/UniRig convention)
	# Reference T-pose joint positions, one (x, y, z) row per SMPL joint index.
	SMPL_TPOSE = np.array(
	    [
	        (0.000, 0.920, 0.000),     #  0 Hips
	        (-0.095, 0.920, 0.000),    #  1 LeftUpLeg (character's left = -X)
	        (0.095, 0.920, 0.000),     #  2 RightUpLeg
	        (0.000, 0.980, 0.000),     #  3 Spine
	        (-0.095, 0.495, 0.000),    #  4 LeftLeg
	        (0.095, 0.495, 0.000),     #  5 RightLeg
	        (0.000, 1.050, 0.000),     #  6 Spine1
	        (-0.095, 0.075, 0.000),    #  7 LeftFoot
	        (0.095, 0.075, 0.000),     #  8 RightFoot
	        (0.000, 1.120, 0.000),     #  9 Spine2
	        (-0.095, 0.000, -0.020),   # 10 LeftToeBase
	        (0.095, 0.000, -0.020),    # 11 RightToeBase
	        (0.000, 1.370, 0.000),     # 12 Neck
	        (-0.130, 1.290, 0.000),    # 13 LeftShoulder
	        (0.130, 1.290, 0.000),     # 14 RightShoulder
	        (0.000, 1.500, 0.000),     # 15 Head
	        (-0.330, 1.290, 0.000),    # 16 LeftArm
	        (0.330, 1.290, 0.000),     # 17 RightArm
	        (-0.630, 1.290, 0.000),    # 18 LeftForeArm
	        (0.630, 1.290, 0.000),     # 19 RightForeArm
	        (-0.910, 1.290, 0.000),    # 20 LeftHand
	        (0.910, 1.290, 0.000),     # 21 RightHand
	    ],
	    dtype=np.float32,
	)

	# Name hint table: lowercase substrings -> SMPL joint index
	_NAME_HINTS: list[tuple[list[str], int]] = [
	(["hips","pelvis","root"], 0),
	(["leftupleg","l_upleg","leftthigh","lefthip","thigh_l"], 1),
	(["rightupleg","r_upleg","rightthigh","righthip","thigh_r"], 2),
	(["spine","spine0","spine_01"], 3),
	(["leftleg","leftknee","lowerleg_l","knee_l"], 4),
	(["rightleg","rightknee","lowerleg_r","knee_r"], 5),
	(["spine1","spine_02"], 6),
	(["leftfoot","l_foot","foot_l"], 7),
	(["rightfoot","r_foot","foot_r"], 8),
	(["spine2","spine_03","chest"], 9),
	(["lefttoebase","lefttoe","l_toe","toe_l"], 10),
	(["righttoebase","righttoe","r_toe","toe_r"], 11),
	(["neck"], 12),
	(["leftshoulder","leftcollar","clavicle_l"], 13),
	(["rightshoulder","rightcollar","clavicle_r"], 14),
	(["head"], 15),
	(["leftarm","upperarm_l","l_arm"], 16),
	(["rightarm","upperarm_r","r_arm"], 17),
	(["leftforearm","lowerarm_l","l_forearm"], 18),
	(["rightforearm","lowerarm_r","r_forearm"], 19),
	(["lefthand","hand_l","l_hand"], 20),
	(["righthand","hand_r","r_hand"], 21),
	]


	# ──────────────────────────────────────────────────────────────────────────────
	# Quaternion helpers (scalar-first WXYZ convention throughout)
	# ──────────────────────────────────────────────────────────────────────────────

	_ID_QUAT = np.array([1., 0., 0., 0.], dtype=np.float32)
	_ID_MAT3 = np.eye(3, dtype=np.float64)

	def _qmul(a: np.ndarray, b: np.ndarray) -> np.ndarray:
	aw, ax, ay, az = a
	bw, bx, by, bz = b
	return np.array([
	awbw - axbx - ayby - azbz,
	awbx + axbw + aybz - azby,
	awby - axbz + aybw + azbx,
	awbz + axby - aybx + azbw,
	], dtype=np.float32)

	def _qnorm(q: np.ndarray) -> np.ndarray:
	n = np.linalg.norm(q)
	return (q / n) if n > 1e-12 else _ID_QUAT.copy()

	def _qinv(q: np.ndarray) -> np.ndarray:
	"""Conjugate = inverse for unit quaternion."""
	return q * np.array([1., -1., -1., -1.], dtype=np.float32)

	def _quat_to_mat(q: np.ndarray) -> np.ndarray:
	"""WXYZ quaternion -> 3x3 rotation matrix (float64)."""
	w, x, y, z = q.astype(np.float64)
	return np.array([
	[1-2(yy+zz), 2(xy-wz), 2(xz+w*y)],
	[ 2(xy+wz), 1-2(xx+zz), 2(yz-w*x)],
	[ 2(xz-wy), 2(yz+wx), 1-2(xx+y*y)],
	], dtype=np.float64)

	def _mat_to_quat(m: np.ndarray) -> np.ndarray:
	"""3x3 rotation matrix -> WXYZ quaternion (float32, positive-W)."""
	from scipy.spatial.transform import Rotation
	xyzw = Rotation.from_matrix(m.astype(np.float64)).as_quat()
	wxyz = np.array([xyzw[3], xyzw[0], xyzw[1], xyzw[2]], dtype=np.float32)
	if wxyz[0] < 0:
	wxyz = -wxyz
	return wxyz

	def _r_between(u: np.ndarray, v: np.ndarray) -> np.ndarray:
	"""
	Minimal rotation matrix (3x3) that maps unit vector u to unit vector v.
	Uses the Rodrigues formula; handles parallel/antiparallel cases.
	"""
	u = u / (np.linalg.norm(u) + 1e-12)
	v = v / (np.linalg.norm(v) + 1e-12)
	c = float(np.dot(u, v))
	if c >= 1.0 - 1e-7:
	return _ID_MAT3.copy()
	if c <= -1.0 + 1e-7:
	# 180 degree rotation: pick any perpendicular axis
	perp = np.array([1., 0., 0.]) if abs(u[0]) < 0.9 else np.array([0., 1., 0.])
	ax = np.cross(u, perp)
	ax /= np.linalg.norm(ax)
	return 2.0 * np.outer(ax, ax) - _ID_MAT3
	ax = np.cross(u, v) # sin(theta) * rotation axis
	s = np.linalg.norm(ax)
	K = np.array([[ 0, -ax[2], ax[1]],
	[ ax[2], 0, -ax[0]],
	[-ax[1], ax[0], 0]], dtype=np.float64)
	return _ID_MAT3 + K + K @ K * ((1.0 - c) / (s * s + 1e-12))


	# ──────────────────────────────────────────────────────────────────────────────
	# GLB skin reader
	# ──────────────────────────────────────────────────────────────────────────────

	def _read_glb_skin(rigged_glb: str):
	    """
	    Load the first skin of a glTF/GLB file and describe its joints.

	    Return (gltf, skin, ibm[n,4,4], node_trs{name->(t,r_wxyz,s)},
	    bone_names[], bone_parent_map{name->parent_name_or_None}).

	    ibm is stored as-read from the binary blob (column-major from glTF spec).
	    Callers must use inv(ibm[i].T)[:3,3] to get correct world positions.

	    Joints without a node name are called "bone_<i>", where i is the joint's
	    position in skin.joints. A bone's parent is the nearest ancestor node that
	    is itself a joint of the skin (non-joint nodes in between are skipped).

	    Raises ValueError when the file has no skin or the skin carries no
	    inverse bind matrices.
	    """
	    import base64
	    from pathlib import Path

	    import pygltflib

	    gltf = pygltflib.GLTF2().load(rigged_glb)
	    if not gltf.skins:
	        raise ValueError(f"No skin found in {rigged_glb}")
	    skin = gltf.skins[0]
	    if skin.inverseBindMatrices is None:
	        # Without this check the accessor lookup below fails with an opaque
	        # TypeError; the bone positions are derived from these matrices.
	        raise ValueError(f"Skin in {rigged_glb} has no inverse bind matrices")

	    def _raw_bytes(buf):
	        # GLB-embedded chunk, base64 data URI, or external file next to the GLB.
	        if buf.uri is None:
	            return bytes(gltf.binary_blob())
	        if buf.uri.startswith("data:"):
	            return base64.b64decode(buf.uri.split(",", 1)[1])
	        return (Path(rigged_glb).parent / buf.uri).read_bytes()

	    acc = gltf.accessors[skin.inverseBindMatrices]
	    bv = gltf.bufferViews[acc.bufferView]
	    raw = _raw_bytes(gltf.buffers[bv.buffer])
	    start = (bv.byteOffset or 0) + (acc.byteOffset or 0)
	    n = acc.count
	    # 64 bytes per matrix = 16 float32 values.
	    ibm = np.frombuffer(raw[start: start + n * 64], dtype=np.float32).reshape(n, 4, 4)

	    # Build node parent map (node_index -> parent_node_index)
	    node_parent: dict[int, int] = {}
	    for ni, node in enumerate(gltf.nodes):
	        for child_idx in (node.children or []):
	            node_parent[child_idx] = ni

	    # node_index -> position in skin.joints (first occurrence), so the parent
	    # search below does not rescan skin.joints for every bone.
	    joint_slot: dict[int, int] = {}
	    for i, j_idx in enumerate(skin.joints):
	        joint_slot.setdefault(j_idx, i)

	    bone_names = []
	    node_trs: dict[str, tuple] = {}
	    bone_parent_map: dict[str, str | None] = {}

	    for i, j_idx in enumerate(skin.joints):
	        node = gltf.nodes[j_idx]
	        name = node.name or f"bone_{i}"
	        bone_names.append(name)

	        t = np.array(node.translation or [0., 0., 0.], dtype=np.float32)
	        r_xyzw = np.array(node.rotation or [0., 0., 0., 1.], dtype=np.float32)
	        s = np.array(node.scale or [1., 1., 1.], dtype=np.float32)
	        # glTF stores rotations as XYZW; this module uses WXYZ throughout.
	        r_wxyz = np.array([r_xyzw[3], r_xyzw[0], r_xyzw[1], r_xyzw[2]], dtype=np.float32)
	        node_trs[name] = (t, r_wxyz, s)

	        # Find parent bone (walk up node hierarchy to nearest joint)
	        parent_node = node_parent.get(j_idx)
	        parent_name: str | None = None
	        while parent_node is not None:
	            if parent_node in joint_slot:
	                pnode = gltf.nodes[parent_node]
	                parent_name = pnode.name or f"bone_{joint_slot[parent_node]}"
	                break
	            parent_node = node_parent.get(parent_node)
	        bone_parent_map[name] = parent_name

	    print(f"[GLB] {len(bone_names)} bones from skin '{skin.name or 'Armature'}'")
	    return gltf, skin, ibm, node_trs, bone_names, bone_parent_map


	# ──────────────────────────────────────────────────────────────────────────────
	# Bone mapping
	# ──────────────────────────────────────────────────────────────────────────────

	def _strip_name(name: str) -> str:
	name = re.sub(r'^(mixamorig:\|j_bip_[lcr]_\|cc_base_\|bip01_\|rig:\|chr:)',
	"", name, flags=re.IGNORECASE)
	return re.sub(r'[_\-\s.]', "", name).lower()


	def build_bone_map(
	    rigged_glb: str,
	    verbose: bool = True,
	) -> tuple[dict, dict, float, dict, dict]:
	    """
	    Map UniRig bone names -> SMPL joint index by spatial proximity + name hints.

	    Every (bone, joint) pair gets a score of 0.6 * proximity + 0.4 * name hint;
	    pairs are then assigned greedily from the best score down, each bone and
	    each joint being used at most once, until the score drops below 0.35.

	    Parameters
	    ----------
	    rigged_glb : path to a GLB/glTF file containing a skin
	    verbose    : print the resulting mapping and the unmapped bones

	    Returns
	    -------
	    bone_to_smpl    : {bone_name: smpl_joint_index}
	    node_trs        : {bone_name: (t[3], r_wxyz[4], s[3])}
	    height_scale    : float (UniRig height / SMPL reference height)
	    bone_parent_map : {bone_name: parent_bone_name_or_None}
	    ur_pos_by_name  : {bone_name: world_pos[3]}

	    Raises
	    ------
	    ValueError if the skin has no joints or fewer inverse bind matrices than
	    joints (in addition to whatever _read_glb_skin raises).
	    """
	    _gltf, _skin, ibm, node_trs, bone_names, bone_parent_map = _read_glb_skin(rigged_glb)
	    n_bones = len(bone_names)
	    if n_bones == 0:
	        raise ValueError(f"Skin in {rigged_glb} has no joints")
	    if len(ibm) < n_bones:
	        raise ValueError(
	            f"Skin in {rigged_glb} has {n_bones} joints but only "
	            f"{len(ibm)} inverse bind matrices"
	        )

	    # glTF IBMs are stored column-major. numpy reads them row-major, so the
	    # stored data is the TRANSPOSE of the actual matrix.
	    # Correct world position = inv(actual_IBM)[:3,3] = inv(ibm[i].T)[:3,3]
	    # (all bones are inverted in one batched call).
	    ur_pos = np.linalg.inv(
	        np.transpose(ibm[:n_bones], (0, 2, 1))
	    )[:, :3, 3].astype(np.float32)

	    ur_pos_by_name = {name: ur_pos[i] for i, name in enumerate(bone_names)}

	    # Scale SMPL T-pose to match character height
	    ur_h = ur_pos[:, 1].max() - ur_pos[:, 1].min()
	    sm_h = SMPL_TPOSE[:, 1].max() - SMPL_TPOSE[:, 1].min()
	    h_sc = (ur_h / sm_h) if sm_h > 1e-6 else 1.0
	    sm_pos = SMPL_TPOSE * h_sc

	    # Normalise ur and smpl Y ranges independently (floor=0, top=1 for each)
	    # so that differing floor offsets do not misalign the two skeletons.
	    def _norm_independent(pos, own_range_min, own_range_max, x_range, z_range):
	        p = pos.copy().astype(np.float64)
	        y_range = (own_range_max - own_range_min) or 1.0
	        p[:, 0] /= (x_range or 1.0)
	        p[:, 1] = (p[:, 1] - own_range_min) / y_range
	        p[:, 2] /= (z_range or 1.0)
	        return p

	    # Common X/Z scale (use both skeletons' width for reference)
	    x_range = max(
	        abs(ur_pos[:, 0].max() - ur_pos[:, 0].min()),
	        abs(sm_pos[:, 0].max() - sm_pos[:, 0].min()),
	    ) or 1.0
	    z_range = max(
	        abs(ur_pos[:, 2].max() - ur_pos[:, 2].min()),
	        abs(sm_pos[:, 2].max() - sm_pos[:, 2].min()),
	    ) or 1.0

	    ur_n = _norm_independent(ur_pos, ur_pos[:, 1].min(), ur_pos[:, 1].max(), x_range, z_range)
	    sm_n = _norm_independent(sm_pos, sm_pos[:, 1].min(), sm_pos[:, 1].max(), x_range, z_range)

	    # Proximity score: 1 for coincident points, 0 for the farthest pair.
	    dist = np.linalg.norm(ur_n[:, None] - sm_n[None], axis=-1)  # [M, 22]
	    d_sc = 1.0 - np.clip(dist / (dist.max() + 1e-9), 0, 1)

	    # Name hint score
	    # NOTE(review): _strip_name removes underscores, so hint keywords that
	    # contain "_" (e.g. "thigh_l", "l_arm") can never match here. Confirm
	    # whether they should be normalised too before changing the matching.
	    n_sc = np.zeros((n_bones, 22), dtype=np.float32)
	    for mi, bname in enumerate(bone_names):
	        stripped = _strip_name(bname)
	        for kws, ji in _NAME_HINTS:
	            if any(kw in stripped for kw in kws):
	                n_sc[mi, ji] = 1.0

	    combined = 0.6 * d_sc + 0.4 * n_sc  # [M, 22]

	    # Greedy assignment, best score first. sorted() is stable, so ties keep
	    # (bone index, joint index) order.
	    THRESHOLD = 0.35
	    pairs = sorted(
	        ((mi, ji, combined[mi, ji])
	         for mi in range(n_bones)
	         for ji in range(22)),
	        key=lambda x: -x[2],
	    )
	    bone_to_smpl: dict[str, int] = {}
	    taken: set[int] = set()
	    for mi, ji, score in pairs:
	        if score < THRESHOLD:
	            break  # every remaining pair scores lower still
	        bname = bone_names[mi]
	        if bname in bone_to_smpl or ji in taken:
	            continue
	        bone_to_smpl[bname] = ji
	        taken.add(ji)

	    if verbose:
	        n_mapped = len(bone_to_smpl)
	        print(f"\n[MAP] {n_mapped}/{len(bone_names)} bones mapped to SMPL joints:")
	        for bname, ji in sorted(bone_to_smpl.items(), key=lambda x: x[1]):
	            print(f" {bname:<40} -> {SMPL_NAMES[ji]}")
	        unmapped = [n for n in bone_names if n not in bone_to_smpl]
	        if unmapped:
	            preview = ", ".join(unmapped[:8])
	            print(f"[MAP] {len(unmapped)} unmapped (identity): {preview}"
	                  + (" ..." if len(unmapped) > 8 else ""))
	        print()

	    return bone_to_smpl, node_trs, h_sc, bone_parent_map, ur_pos_by_name


	# ──────────────────────────────────────────────────────────────────────────────
	# T2M forward kinematics (world rotation matrices)
	# ──────────────────────────────────────────────────────────────────────────────

	def _compute_t2m_world_rots(
	    root_rot_wxyz: np.ndarray,    # [4] WXYZ
	    local_rots_wxyz: np.ndarray,  # [21, 4] WXYZ (joints 1-21)
	) -> np.ndarray:
	    """
	    Compute accumulated world rotation matrices for all 22 t2m joints at one frame.
	    Matches skeleton.py's forward_kinematics_cont6d_np: each chain RESETS to R_root.

	    Note that this also applies to the two arm chains: although they start at
	    joint 9 in T2M_KINEMATIC_CHAIN, their accumulation starts from the root
	    rotation, not from joint 9's accumulated rotation.

	    Returns [22, 3, 3] world rotation matrices (float64).
	    """
	    R_root = _quat_to_mat(root_rot_wxyz)
	    world_rots = np.zeros((22, 3, 3), dtype=np.float64)
	    world_rots[0] = R_root

	    for chain in T2M_KINEMATIC_CHAIN:
	        R = R_root.copy()  # always start from R_root (matches skeleton.py)
	        for j in chain[1:]:
	            # local_rots_wxyz has no row for the root, hence the j - 1 offset.
	            R = R @ _quat_to_mat(local_rots_wxyz[j - 1])
	            world_rots[j] = R

	    return world_rots


	# ──────────────────────────────────────────────────────────────────────────────
	# Keyframe builder — world-direction matching
	# ──────────────────────────────────────────────────────────────────────────────

	def build_keyframes(
	    motion: SMPLMotion,
	    bone_to_smpl: dict[str, int],
	    node_trs: dict[str, tuple],
	    height_scale: float,
	    bone_parent_map: dict[str, str | None],
	    ur_pos_by_name: dict[str, np.ndarray],
	) -> list[dict]:
	    """
	    Convert SMPLMotion -> List[Dict[bone_name -> (loc, rot_delta, scale)]]
	    using world-direction matching retargeting.

	    One dict is produced per frame and contains only the bones listed in
	    bone_to_smpl. The bone mapped to SMPL joint 0 receives the scaled root
	    translation and the root rotation; every other bone receives a zero
	    location and the rotation that turns its rest direction (taken from
	    ur_pos_by_name) onto the X-flipped t2m bone direction, expressed relative
	    to its nearest animated ancestor. Scale is always (1, 1, 1).
	    """
	    T = motion.num_frames
	    zeros3 = np.zeros(3, dtype=np.float32)
	    ones3 = np.ones(3, dtype=np.float32)

	    # Topological order: root joints (si==0) first, then by SMPL joint index
	    # (parents always have lower SMPL indices in the kinematic chain)
	    sorted_bones = sorted(bone_to_smpl.keys(), key=lambda b: bone_to_smpl[b])

	    def _animated_ancestor(bname: str) -> str | None:
	        # Nearest ancestor that is itself keyframed. Bones that are not in
	        # bone_to_smpl get no keyframes, so in the scene graph they simply pass
	        # their own parent's rotation down; the rotation a mapped bone has to be
	        # expressed against is therefore that of its nearest mapped ancestor.
	        visited = {bname}
	        parent = bone_parent_map.get(bname)
	        while parent and parent not in bone_to_smpl:
	            if parent in visited:  # malformed (cyclic) parent map
	                return None
	            visited.add(parent)
	            parent = bone_parent_map.get(parent)
	        return parent or None

	    # Everything below depends only on the rig, not on the frame, so it is
	    # computed once instead of once per frame.
	    # Entries: (bone, smpl index, inv(rest rotation), rest translation,
	    #           rest direction, animated ancestor)
	    rig = []
	    for bname in sorted_bones:
	        si = bone_to_smpl[bname]
	        rest_t, rest_r, _rest_s = node_trs[bname]
	        inv_rest = _quat_to_mat(rest_r).T  # transpose == inverse for a rotation

	        if si == 0:
	            rest_t64 = rest_t.astype(np.float32).astype(np.float64)
	            rig.append((bname, si, inv_rest, rest_t64, None, None))
	            continue

	        # UniRig rest bone direction (from inverse bind matrices, world space)
	        parent_b = bone_parent_map.get(bname)
	        if parent_b and parent_b in ur_pos_by_name:
	            d_rest = (ur_pos_by_name[bname] - ur_pos_by_name[parent_b]).astype(np.float64)
	        else:
	            d_rest = ur_pos_by_name[bname].astype(np.float64)
	        d_rest_norm = d_rest / (np.linalg.norm(d_rest) + 1e-12)
	        rig.append((bname, si, inv_rest, None, d_rest_norm, _animated_ancestor(bname)))

	    keyframes: list[dict] = []

	    for ti in range(T):
	        frame: dict = {}

	        # T2M world rotation matrices for this frame
	        world_rots_t2m = _compute_t2m_world_rots(
	            motion.root_rot[ti].astype(np.float64),
	            motion.local_rot[ti].astype(np.float64),
	        )

	        # Track UniRig world rotations per bone (needed for child local rotations)
	        world_rot_ur: dict[str, np.ndarray] = {}

	        for bname, si, inv_rest, rest_t64, d_rest_norm, ancestor in rig:
	            # ── Root bone (si == 0): drive world translation + facing rotation ──
	            if si == 0:
	                world_pos = motion.root_pos[ti].astype(np.float64) * height_scale
	                pose_loc = (world_pos - rest_t64).astype(np.float32)

	                R_world_root = _quat_to_mat(motion.root_rot[ti])
	                world_rot_ur[bname] = R_world_root

	                # pose_rot_delta = inv(rest_r) @ target_world_rot
	                pose_rot = _mat_to_quat(inv_rest @ R_world_root)
	                frame[bname] = (pose_loc, pose_rot, ones3)
	                continue

	            # ── Non-root bone: world-direction matching ──────────────────────

	            # T2M world bone direction (in t2m coordinate frame)
	            raw_dir_t2m = world_rots_t2m[si] @ T2M_RAW_OFFSETS[si]  # [3]

	            # COORDINATE FRAME CONVERSION: t2m +X = character LEFT; SMPL +X = character RIGHT
	            # Flip X to convert t2m world directions -> SMPL/UniRig world directions
	            d_desired = np.array([-raw_dir_t2m[0], raw_dir_t2m[1], raw_dir_t2m[2]])
	            d_desired_norm = d_desired / (np.linalg.norm(d_desired) + 1e-12)

	            # Minimal world-space rotation: rest direction -> desired direction
	            R_world_desired = _r_between(d_rest_norm, d_desired_norm)  # [3, 3]
	            world_rot_ur[bname] = R_world_desired

	            # Local rotation = inv(ancestor_world) @ R_world_desired. Identity is
	            # used when there is no animated ancestor or it has not been
	            # processed yet in this frame.
	            R_parent = world_rot_ur.get(ancestor, _ID_MAT3)
	            local_rot_mat = R_parent.T @ R_world_desired

	            # pose_rot_delta = inv(rest_r) @ local_rot
	            # (glTF applies: final = rest_r @ pose_rot_delta = local_rot)
	            pose_rot = _mat_to_quat(inv_rest @ local_rot_mat)

	            frame[bname] = (zeros3, pose_rot, ones3)

	        keyframes.append(frame)

	    return keyframes


	# ──────────────────────────────────────────────────────────────────────────────
	# Public API
	# ──────────────────────────────────────────────────────────────────────────────

	def animate_glb(
	    motion: Union[np.ndarray, list, SMPLMotion],
	    rigged_glb: str,
	    output_glb: str,
	    fps: float = 20.0,
	    start_frame: int = 0,
	    num_frames: int = -1,
	) -> str:
	    """
	    Bake a HumanML3D motion clip onto a UniRig-rigged GLB.

	    Parameters
	    ----------
	    motion      : [T, 263] ndarray, list, or pre-parsed SMPLMotion
	    rigged_glb  : path to UniRig merge output (.glb with a skin)
	    output_glb  : destination path for animated GLB (its directory is
	                  created if missing)
	    fps         : frame rate embedded in the animation track
	    start_frame / num_frames : optional clip range; a num_frames of 0 or
	                  less means "through the last frame"

	    Returns
	    -------
	    output_glb, exactly as it was passed in (it is not made absolute).

	    Raises
	    ------
	    ValueError   if raw motion features are not 2-D or have fewer than 193 columns
	    RuntimeError if no bone of the GLB could be mapped to an SMPL joint
	    """
	    from .io.gltf_io import write_gltf_animation

	    # 1. Parse motion
	    if isinstance(motion, SMPLMotion):
	        smpl = motion
	    else:
	        data = np.asarray(motion, dtype=np.float32)
	        if data.ndim != 2 or data.shape[1] < 193:
	            raise ValueError(f"Expected [T, 263] HumanML3D features, got {data.shape}")
	        smpl = hml3d_to_smpl_motion(data, fps=fps)

	    # 2. Slice
	    end = (start_frame + num_frames) if num_frames > 0 else smpl.num_frames
	    smpl = smpl.slice(start_frame, end)
	    print(f"[animate] {smpl.num_frames} frames @ {fps:.0f} fps -> {output_glb}")

	    # 3. Build bone map (also yields the parent map and bone world positions)
	    bone_to_smpl, node_trs, h_sc, bone_parent_map, ur_pos_by_name = \
	        build_bone_map(rigged_glb, verbose=True)
	    if not bone_to_smpl:
	        raise RuntimeError(
	            "build_bone_map returned 0 matches. "
	            "Ensure the GLB has a valid skin with readable inverse bind matrices."
	        )

	    # 4. Build keyframes using world-direction matching
	    keyframes = build_keyframes(smpl, bone_to_smpl, node_trs, h_sc,
	                                bone_parent_map, ur_pos_by_name)

	    # 5. Write GLB
	    out_dir = os.path.dirname(os.path.abspath(output_glb))
	    if out_dir:
	        os.makedirs(out_dir, exist_ok=True)

	    write_gltf_animation(
	        source_filepath=rigged_glb,
	        dest_armature=None,
	        keyframes=keyframes,
	        output_filepath=output_glb,
	        fps=float(fps),
	    )

	    return output_glb


	# Backwards-compatibility alias
	def animate_glb_from_hml3d(
	    motion, rigged_glb, output_glb, fps=20, start_frame=0, num_frames=-1
	):
	    """Older name for animate_glb; forwards every argument unchanged and returns its result."""
	    return animate_glb(
	        motion, rigged_glb, output_glb,
	        fps=fps, start_frame=start_frame, num_frames=num_frames,
	    )