Add a utility module for performing inverse kinematics on MuJoCo models

alimuldal · alimuldal · commit a56b45194819 · 2018-10-10T20:25:39.000+01:00
PiperOrigin-RevId: 207116592
diff --git a/dm_control/mujoco/testing/assets/arm.xml b/dm_control/mujoco/testing/assets/arm.xml
@@ -0,0 +1,92 @@
+<mujoco model='jaco'>
+  <compiler coordinate='local' angle='radian' eulerseq='yxz'/>
+
+  <contact>
+    <exclude body1='b_base' body2='b_1'/>
+    <exclude body1='b_finger_1' body2='b_finger_2'/>
+    <exclude body1='b_finger_1' body2='b_finger_3'/>
+    <exclude body1='b_finger_2' body2='b_finger_3'/>
+  </contact>
+
+  <default>
+    <geom contype='1' conaffinity='1' condim='3' friction='.1 .1' solimp='.95 .98 .0005' solref='0.02 1.1' density='1'/>
+    <joint type='hinge' armature='0' damping='0'
+      solimpfriction='.95 .95 0' solreffriction='.02 1' solimplimit='0 .99 .01' solreflimit='.02 1'/>
+    <default class='finger'>
+      <joint frictionloss='0.1' armature='.1' axis='0 0 1' limited='true' range='-0.15 1.2' damping='.1'/>
+      <velocity kv='0.5' ctrlrange='-1 1' gear='1' forcerange='-1.5 1.5'/>
+      <geom type='capsule' size="0.0108231 0.0145116" pos="0.0190913 -0.0112192 1.10387e-06" quat="0.475811 -0.475815 0.523071 -0.523068"/>
+    </default>
+    <default class='fingertip'>
+      <geom type='box' pos='0.065 -0.022 0' size='0.02 .005 .011' rgba='1 0 0 1'
+            quat='1 0 0 -0.235' condim='4' />
+      <site type='ellipsoid' pos='0.065 -0.022 0' size='0.02 .005 .011'
+            quat='1 0 0 -0.235'/>
+    </default>
+  </default>
+
+  <worldbody>
+    <geom name='ground' type='plane' pos='0 0 0.06' size='1 1 1' rgba='0.78 0.93 0.92 1.0' margin='0.1' gap='0.1' />
+    <body name='b_base' pos='0 0 0.005'>
+      <inertial pos='-0.000132925 -0.000516418 0.0820911' quat='0.6951 -0.00714556 0.00738537 0.71884' mass='0.00718278' diaginertia='0.00157301 0.00157269 0.00058831' />
+      <geom name='base' rgba='0 0.4470 0.7410 1' type='capsule' size="0.0350512 0.0555543" pos="-0.000132925 -0.000516418 0.0820911" quat="0.6951 -0.00714564 0.00738544 0.71884" />
+      <body name='b_1' pos='0 0 0.1535' quat='0 0 1 0'>
+        <inertial pos='-3.49946e-005 0.010651 -0.0670012' quat='0.704277 0.0627825 -0.0628 0.70435' mass='0.00644357' diaginertia='0.00172311 0.00163259 0.00042883' />
+        <joint name='joint_1' axis='0 0 -1' />
+        <geom name='link_1' rgba='0.8500 0.3250 0.0980 1' type='capsule' size="0.031417 0.0668352" pos="-3.49946e-05 0.010651 -0.0670012" quat="0.704277 0.0627825 -0.0628 0.70435" />
+        <body name='b_2' pos='0 0 -0.1185' quat='0 0 1 1'>
+          <inertial pos='0.205004 7.5835e-005 -0.0202812' quat='2.24027e-006 0.707108 5.30493e-006 0.707106' mass='0.011691' diaginertia='0.0253426 0.0250512 0.000536357' />
+          <joint name='joint_2' axis='0 0 1' range='-3.4906585 0.34906585' limited='true' />
+          <geom name='link_2' rgba='0.9290 0.6940 0.1250 1' type='capsule' size="0.0251592 0.240341" pos="0.205004 7.5835e-05 -0.0202812" quat="2.23957e-06 0.707108 5.30416e-06 0.707106" />
+          <body name='b_3' pos='0.41 0 0' quat='0 0.707107 0.707107 0'>
+            <inertial pos='0.0843942 7.48909e-006 -0.0177123' quat='-4.64469e-005 0.692702 -4.11798e-005 0.721224' mass='0.00673417' diaginertia='0.00420255 0.00409328 0.000303584' />
+            <joint name='joint_3' axis='0 0 -1' range='-4.01425728 0.872664626' limited='true' />
+            <geom name='link_3' rgba='0.4940 0.1840 0.5560 1' type='capsule' size="0.0255647 0.120643" pos="0.0843942 7.48907e-06 -0.0177123" quat="-4.64475e-05 0.692702 -4.11814e-05 0.721224" />
+            <body name='b_4' pos='0.207 0 -0.01125' quat='0 0.707107 0 -0.707107'>
+              <inertial pos='0.0101659 -4.64261e-005 -0.0369867' quat='0.965925 1.91737e-005 -0.258823 -1.40769e-005' mass='0.00221423' diaginertia='0.0001816 0.000174586 9.79319e-005' />
+              <joint name='joint_4' axis='0 0 -1' />
+              <geom name='link_4' rgba='0.4660 0.6740 0.1880 1' type='capsule' size="0.0257405 0.0289568" pos="0.0101659 -4.64261e-05 -0.0369867" quat="0.965925 1.43712e-05 -0.258823 3.85082e-06" />
+              <body name='b_5' pos='0.037 0 -0.06408' quat='0.866025 0 -0.5 0'>
+                <inertial pos='0.0101659 -4.64261e-005 -0.0369867' quat='0.965925 1.91737e-005 -0.258823 -1.40769e-005' mass='0.00221423' diaginertia='0.0001816 0.000174586 9.79319e-005' />
+                <joint name='joint_5' axis='0 0 -1' />
+                <geom name='link_5' rgba='0.3010 0.7450 0.9330 1' type='capsule' size="0.0257405 0.0289568" pos="0.0101659 -4.64261e-05 -0.0369867" quat="0.965925 1.43712e-05 -0.258823 3.85082e-06" />
+                <body name='b_hand' pos='0.037 0 -0.06408' quat='0.612372 -0.353553 -0.353553 0.612372'>
+                  <site type='sphere' size='.01' name='gripsite' pos='0 0 -.16' rgba='.5 .5 .5 .3' />
+                  <site type='sphere' size='.01' name='pinchsite' pos='0 0.015 -0.195' rgba='.5 .5 .5 .3' />
+                  <inertial pos='0.00628384 -2.92087e-005 -0.0608681' quat='0.708562 -0.0338601 -0.0358744 0.703923' mass='0.00547172' diaginertia='0.000759818 0.000676099 0.0004995' />
+                  <joint name='joint_6' axis='0 0 -1' range='-6.28319 6.28319'  limited='false'/>
+                  <geom name='link_6' rgba='0.6350 0.0780 0.1840 1' type='capsule' size="0.0368731 0.0322296" pos="0.00628384 -2.92087e-05 -0.0608681" quat="0.708562 -0.0338601 -0.0358744 0.703923"/>
+                  <!-- optional collision geom to be used if issues arise with the mesh
+                    <geom type='ellipsoid' rgba='0.6350 0.0780 0.1840 1' size='.035 .025 .01' pos='.005 0 -.117' group='1'/> -->
+                  <body name='b_finger_1' childclass='finger' pos='-0.029 .003 -0.1145' quat='-0.414818 -0.329751 -0.663854 0.52772'>
+                    <inertial pos='0.0485761 -0.000715511 0' quat='0.507589 0.507348 0.492543 0.492294' mass='0.000379077' diaginertia='4.00708e-005 4.00527e-005 2.156e-006' />
+                    <joint name='joint_finger_1'/>
+                    <geom name='finger_knuckle_1' rgba='0 0.4470 0.7410 1'/>
+                    <geom class='fingertip' name='finger_tip_1' rgba='0 0.4470 0.7410 1'/>
+                    <site class='fingertip' name='fingertip1'/>
+                  </body>
+                  <body name='b_finger_2' childclass='finger' pos='0.0295 0.0216 -0.115' quat='0.561254 -0.620653 0.321748 0.443014'>
+                    <inertial pos='0.0485761 -0.000715511 0' quat='0.507589 0.507348 0.492543 0.492294' mass='0.000379077' diaginertia='4.00708e-005 4.00527e-005 2.156e-006' />
+                    <joint name='joint_finger_2'/>
+                    <geom name='finger_knuckle_2' rgba='0.9290 0.6940 0.1250 1'/>
+                    <geom class='fingertip' name='finger_tip_2' rgba='0.9290 0.6940 0.1250 1'/>
+                    <site class='fingertip' name='fingertip2'/>
+                  </body>
+                  <body name='b_finger_3' childclass='finger' pos='0.0295 -0.0216 -0.1145' quat='0.625248 -0.567602 0.434845 0.312735'>
+                    <inertial pos='0.0485761 -0.000715511 0' quat='0.507589 0.507348 0.492543 0.492294' mass='0.000379077' diaginertia='4.00708e-005 4.00527e-005 2.156e-006' />
+                    <joint name='joint_finger_3'/>
+                    <geom name='finger_knuckle_3' rgba='0.8500 0.3250 0.0980 1'/>
+                    <geom class='fingertip' name='finger_tip_3' rgba='0.8500 0.3250 0.0980 1'/>
+                    <site class='fingertip' name='fingertip3'/>
+                  </body>
+                </body>
+              </body>
+            </body>
+          </body>
+        </body>
+      </body>
+    </body>
+  </worldbody>
+
+</mujoco>
+
diff --git a/dm_control/mujoco/testing/assets/model_with_ball_joints.xml b/dm_control/mujoco/testing/assets/model_with_ball_joints.xml
@@ -0,0 +1,21 @@
+<mujoco>
+  <default>
+    <geom type='capsule' size='0.01'/>
+    <site type='sphere' size='0.03'/>
+    <joint type='ball' damping='0.005'/>
+  </default>
+  <worldbody>
+    <body>
+      <geom fromto='0 0 0 0 0 0.1'/>
+      <body pos='0 0 0.1'>
+        <geom fromto='0 0 0 0 0.1 0.1'/>
+        <joint name='joint_1'/>
+        <body pos='0 0.1 0.1'>
+          <geom fromto='0 0 0 0 0.1 0.0'/>
+          <joint name='joint_2'/>
+          <site name='gripsite' pos='0 0.1 0'/>
+        </body>
+      </body>
+    </body>
+  </worldbody>
+</mujoco>
diff --git a/dm_control/utils/inverse_kinematics.py b/dm_control/utils/inverse_kinematics.py
@@ -0,0 +1,263 @@
+# Copyright 2017-2018 The dm_control Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ============================================================================
+
+"""Functions for computing inverse kinematics on MuJoCo models."""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import collections
+
+from absl import logging
+from dm_control.mujoco.wrapper.mjbindings import mjlib
+import numpy as np
+from six.moves import range
+
+
+_INVALID_JOINT_NAMES_TYPE = (
+    '`joint_names` must be either None, a list, a tuple, or a numpy array; '
+    'got {}.')  # `{}` is filled with `type(joint_names)` by the caller.
+_REQUIRE_TARGET_POS_OR_QUAT = (
+    'At least one of `target_pos` or `target_quat` must be specified.')
+# Return type of `qpos_from_site_pose`; fields are described in its docstring.
+IKResult = collections.namedtuple(
+    'IKResult', ['qpos', 'err_norm', 'steps', 'success'])
+
+
+def qpos_from_site_pose(physics,
+                        site_name,
+                        target_pos=None,
+                        target_quat=None,
+                        joint_names=None,
+                        tol=1e-14,
+                        rot_weight=1.0,
+                        regularization_threshold=0.1,
+                        regularization_strength=3e-2,
+                        max_update_norm=2.0,
+                        progress_thresh=20.0,
+                        max_steps=100,
+                        inplace=False):
+  """Find joint positions that satisfy a target site position and/or rotation.
+
+  Args:
+    physics: A `mujoco.Physics` instance.
+    site_name: A string specifying the name of the target site.
+    target_pos: A (3,) numpy array specifying the desired Cartesian position of
+      the site, or None if the position should be unconstrained (default).
+      One or both of `target_pos` or `target_quat` must be specified.
+    target_quat: A (4,) numpy array specifying the desired orientation of the
+      site as a quaternion, or None if the orientation should be unconstrained
+      (default). One or both of `target_pos` or `target_quat` must be specified.
+    joint_names: (optional) A list, tuple or numpy array specifying the names of
+      one or more joints that can be manipulated in order to achieve the target
+      site pose. If None (default), all joints may be manipulated.
+    tol: (optional) Precision goal for `qpos` (the maximum value of `err_norm`
+      in the stopping criterion).
+    rot_weight: (optional) Determines the weight given to rotational error
+      relative to translational error.
+    regularization_threshold: (optional) L2 regularization will be used when
+      inverting the Jacobian whilst `err_norm` is greater than this value.
+    regularization_strength: (optional) Coefficient of the quadratic penalty
+      on joint movements.
+    max_update_norm: (optional) The maximum L2 norm of the update applied to
+      the joint positions on each iteration. The update vector will be scaled
+      such that its magnitude never exceeds this value.
+    progress_thresh: (optional) If `err_norm` divided by the magnitude of the
+      joint position update is greater than this value then the optimization
+      will terminate prematurely. This is a useful heuristic to avoid getting
+      stuck in local minima.
+    max_steps: (optional) The maximum number of iterations to perform (>= 1).
+    inplace: (optional) If True, `physics.data` will be modified in place.
+      Default value is False, i.e. a copy of `physics.data` will be made.
+
+  Returns:
+    An `IKResult` namedtuple with the following fields:
+      qpos: An (nq,) numpy array of joint positions.
+      err_norm: A float, the weighted sum of L2 norms for the residual
+        translational and rotational errors.
+      steps: An int, the zero-based index of the last iteration that was run.
+      success: Boolean, True if we converged on a solution within `max_steps`,
+        False otherwise.
+
+  Raises:
+    ValueError: If both `target_pos` and `target_quat` are None, or if
+      `joint_names` has an invalid type.
+  """
+
+  dtype = physics.data.qpos.dtype
+
+  if target_pos is not None and target_quat is not None:
+    jac = np.empty((6, physics.model.nv), dtype=dtype)
+    err = np.empty(6, dtype=dtype)
+    jac_pos, jac_rot = jac[:3], jac[3:]
+    err_pos, err_rot = err[:3], err[3:]
+  else:
+    jac = np.empty((3, physics.model.nv), dtype=dtype)
+    err = np.empty(3, dtype=dtype)
+    if target_pos is not None:
+      jac_pos, jac_rot = jac, None
+      err_pos, err_rot = err, None
+    elif target_quat is not None:
+      jac_pos, jac_rot = None, jac
+      err_pos, err_rot = None, err
+    else:
+      raise ValueError(_REQUIRE_TARGET_POS_OR_QUAT)
+
+  update_nv = np.zeros(physics.model.nv, dtype=dtype)
+
+  if target_quat is not None:
+    site_xquat = np.empty(4, dtype=dtype)
+    neg_site_xquat = np.empty(4, dtype=dtype)
+    err_rot_quat = np.empty(4, dtype=dtype)
+
+  if not inplace:
+    physics = physics.copy(share_model=True)
+
+  # Ensure that the Cartesian position of the site is up to date.
+  mjlib.mj_fwdPosition(physics.model.ptr, physics.data.ptr)
+
+  # Convert site name to index.
+  site_id = physics.model.name2id(site_name, 'site')
+
+  # These are views onto the underlying MuJoCo buffers. mj_fwdPosition will
+  # update them in place, so we can avoid indexing overhead in the main loop.
+  site_xpos = physics.named.data.site_xpos[site_name]
+  site_xmat = physics.named.data.site_xmat[site_name]
+
+  # This is an index into the entries of `update_nv` and the columns of `jac`
+  # that selects DOFs associated with joints that we are allowed to manipulate.
+  if joint_names is None:
+    dof_indices = slice(None)  # Update all DOFs.
+  elif isinstance(joint_names, (list, np.ndarray, tuple)):
+    if isinstance(joint_names, tuple):
+      joint_names = list(joint_names)
+    # Find the indices of the DOFs belonging to each named joint. Note that
+    # these are not necessarily the same as the joint IDs, since a single joint
+    # may have >1 DOF (e.g. ball joints).
+    indexer = physics.named.model.dof_jntid.axes.row
+    # `dof_jntid` is an `(nv,)` array indexed by joint name. We use its row
+    # indexer to map each joint name to the indices of its corresponding DOFs.
+    dof_indices = indexer.convert_key_item(joint_names)
+  else:
+    raise ValueError(_INVALID_JOINT_NAMES_TYPE.format(type(joint_names)))
+
+  steps = 0
+  success = False
+
+  for steps in range(max_steps):
+
+    err_norm = 0.0
+
+    if target_pos is not None:
+      # Translational error.
+      err_pos[:] = target_pos - site_xpos
+      err_norm += np.linalg.norm(err_pos)
+    if target_quat is not None:
+      # Rotational error.
+      mjlib.mju_mat2Quat(site_xquat, site_xmat)
+      mjlib.mju_negQuat(neg_site_xquat, site_xquat)
+      mjlib.mju_mulQuat(err_rot_quat, target_quat, neg_site_xquat)
+      mjlib.mju_quat2Vel(err_rot, err_rot_quat, 1)
+      err_norm += np.linalg.norm(err_rot) * rot_weight
+
+    if err_norm < tol:
+      logging.debug('Converged after %i steps: err_norm=%3g', steps, err_norm)
+      success = True
+      break
+    else:
+      # TODO(b/112141670): Generalize this to other entities besides sites.
+      mjlib.mj_jacSite(
+          physics.model.ptr, physics.data.ptr, jac_pos, jac_rot, site_id)
+      jac_joints = jac[:, dof_indices]
+
+      # TODO(b/112141592): This does not take joint limits into consideration.
+      reg_strength = (
+          regularization_strength if err_norm > regularization_threshold
+          else 0.0)
+      update_joints = nullspace_method(
+          jac_joints, err, regularization_strength=reg_strength)
+
+      update_norm = np.linalg.norm(update_joints)
+
+      # Check whether we are still making enough progress, and halt if not.
+      progress_criterion = err_norm / update_norm
+      if progress_criterion > progress_thresh:
+        logging.debug('Step %2i: err_norm / update_norm (%3g) > '
+                      'tolerance (%3g). Halting due to insufficient progress',
+                      steps, progress_criterion, progress_thresh)
+        break
+
+      if update_norm > max_update_norm:
+        update_joints *= max_update_norm / update_norm
+
+      # Write the entries for the specified joints into the full `update_nv`
+      # vector.
+      update_nv[dof_indices] = update_joints
+
+      # Update `physics.data.qpos`, taking quaternions into account.
+      mjlib.mj_integratePos(physics.model.ptr, physics.data.qpos, update_nv, 1)
+
+      # Compute the new Cartesian position of the site.
+      mjlib.mj_fwdPosition(physics.model.ptr, physics.data.ptr)
+
+      logging.debug('Step %2i: err_norm=%-10.3g update_norm=%-10.3g',
+                    steps, err_norm, update_norm)
+
+  if not success and steps == max_steps - 1:
+    logging.warning('Failed to converge after %i steps: err_norm=%3g',
+                    steps, err_norm)
+
+  if not inplace:
+    # Our temporary copy of physics.data is about to go out of scope, and when
+    # it does the underlying mjData pointer will be freed and physics.data.qpos
+    # will be a view onto a block of deallocated memory. We therefore need to
+    # make a copy of physics.data.qpos while physics.data is still alive.
+    qpos = physics.data.qpos.copy()
+  else:
+    # If we're modifying physics.data in place then it's fine to return a view.
+    qpos = physics.data.qpos
+
+  return IKResult(qpos=qpos, err_norm=err_norm, steps=steps, success=success)
+
+
+def nullspace_method(jac_joints, delta, regularization_strength=0.0):
+  """Calculates the joint velocities to achieve a specified end effector delta.
+
+  Args:
+    jac_joints: The Jacobian of the end effector with respect to the joints. A
+      numpy array of shape `(ndelta, nv)`, where `ndelta` is the size of `delta`
+      and `nv` is the number of degrees of freedom.
+    delta: The desired end-effector delta. A numpy array of shape `(3,)` or
+      `(6,)` containing either position deltas, rotation deltas, or both.
+    regularization_strength: (optional) Coefficient of the quadratic penalty
+      on joint movements. Default is zero, i.e. no regularization.
+
+  Returns:
+    An `(nv,)` numpy array of joint velocities.
+
+  Reference:
+    Buss, S. R. S. (2004). Introduction to inverse kinematics with jacobian
+    transpose, pseudoinverse and damped least squares methods.
+    https://www.math.ucsd.edu/~sbuss/ResearchWeb/ikmethods/iksurvey.pdf
+  """
+  hess_approx = jac_joints.T.dot(jac_joints)
+  joint_delta = jac_joints.T.dot(delta)
+  if regularization_strength > 0:
+    # L2 regularization
+    hess_approx += np.eye(hess_approx.shape[0]) * regularization_strength
+    return np.linalg.solve(hess_approx, joint_delta)
+  # Unregularized: least-squares solve; explicit `rcond` avoids FutureWarning.
+  return np.linalg.lstsq(hess_approx, joint_delta, rcond=-1)[0]
diff --git a/dm_control/utils/inverse_kinematics_test.py b/dm_control/utils/inverse_kinematics_test.py