Add steering policies for turtlebot and F1tenth

MIT-REALM · Mar 2, 2024 · 2df38bd · 2df38bd
1 parent 450e802
commit 2df38bd
Show file tree

Hide file tree

Showing 10 changed files with 341 additions and 3 deletions.
diff --git a/.docker/Dockerfile b/.docker/Dockerfile
@@ -7,13 +7,14 @@ RUN apt-get update && apt-get install -y \
     git \
     python3-pip \
     python3-dev \
+    python3-tk \
     ros-noetic-driver-base \
     ros-noetic-sophus \
     ros-noetic-robot-pose-ekf \
     ros-noetic-ackermann-msgs \
     ros-noetic-urg-node
 
-RUN pip3 install numpy jax pyyaml rospkg transforms3d
+RUN pip3 install numpy jax pyyaml rospkg transforms3d equinox scipy matplotlib
 
 # Install updated cmake
 RUN apt-get update \

diff --git a/pyproject.toml b/pyproject.toml
@@ -0,0 +1,4 @@
+[tool.ruff]
+select = ["F", "E", "W", "I001"]
+ignore = ["E721", "E731", "F722"]
+ignore-init-module-imports = true
diff --git a/realm_gc/rgc_control/CMakeLists.txt b/realm_gc/rgc_control/CMakeLists.txt
@@ -204,4 +204,4 @@ include_directories(
 
 ## Add folders to be run by python nosetests
 # catkin_add_nosetests(test)
-catkin_install_python(PROGRAMS scripts/robot_control_class.py DESTINATION ${CATKIN_PACKAGE_BIN_DESTINATION})
+# catkin_install_python(PROGRAMS scripts/robot_control_class.py DESTINATION ${CATKIN_PACKAGE_BIN_DESTINATION})
diff --git a/realm_gc/rgc_control/setup.py b/realm_gc/rgc_control/setup.py
@@ -5,7 +5,7 @@
 
 # fetch values from package.xml
 setup_args = generate_distutils_setup(
-    packages=["rgc_state_estimators"],
+    packages=["rgc_control"],
     package_dir={"": "src"},
 )
 

diff --git a/realm_gc/rgc_control/src/rgc_control/policies/__init__.py b/realm_gc/rgc_control/src/rgc_control/policies/__init__.py
diff --git a/realm_gc/rgc_control/src/rgc_control/policies/policy.py b/realm_gc/rgc_control/src/rgc_control/policies/policy.py
@@ -0,0 +1,28 @@
+"""Define generic control policy interface."""
+from abc import ABC, abstractmethod
+from dataclasses import dataclass
+
+
+@dataclass
+class Observation:
+    """Base type for the observations consumed by control policies.
+
+    It declares no fields of its own; concrete observations subclass it.
+    """
+
+
+@dataclass
+class ControlAction:
+    """Base type for the actions produced by control policies.
+
+    It declares no fields of its own; concrete actions subclass it.
+    """
+
+
+class ControlPolicy(ABC):
+    """Abstract interface shared by all control policies.
+
+    Subclasses must implement `compute_action`. The two properties report which
+    observation and action classes a policy works with; here they default to the
+    generic base types.
+    """
+
+    @property
+    def observation_type(self):
+        """The class of observation this policy consumes."""
+        return Observation
+
+    @property
+    def action_type(self):
+        """The class of action this policy produces."""
+        return ControlAction
+
+    @abstractmethod
+    def compute_action(self, observation: Observation) -> ControlAction:
+        """Takes in an observation and returns a control action."""
diff --git a/realm_gc/rgc_control/src/rgc_control/policies/tracking/__init__.py b/realm_gc/rgc_control/src/rgc_control/policies/tracking/__init__.py
diff --git a/realm_gc/rgc_control/src/rgc_control/policies/tracking/policy.py b/realm_gc/rgc_control/src/rgc_control/policies/tracking/policy.py
@@ -0,0 +1,44 @@
+"""Define a policy for trajectory tracking."""
+from dataclasses import dataclass
+
+from rgc_control.policies.policy import ControlAction, ControlPolicy, Observation
+from rgc_control.policies.tracking.steering_policies import Pose2DObservation
+from rgc_control.policies.tracking.trajectory import MultiAgentTrajectoryLinear
+
+
+@dataclass
+class TimedPose2DObservation(Pose2DObservation):
+    """The observation for a single robot's 2D pose with a timestamp."""
+
+    # Without @dataclass this annotation would not become a constructor field.
+    # The value is passed to the trajectory to look up the waypoint to track.
+    t: float
+
+
+@dataclass
+class TrackingObservation(Observation):
+    """The observation for a single robot's 2D pose relative to some goal."""
+
+    # Without @dataclass these annotations would not become constructor fields.
+    pose: Pose2DObservation  # where the robot currently is
+    goal: Pose2DObservation  # where the robot should be
+
+
+class TrajectoryTrackingPolicy(ControlPolicy):
+    """Tracks a trajectory given a steering controller.
+
+    args:
+        trajectory: the trajectory to track
+        steering_controller: the controller to use to steer towards waypoints
+    """
+
+    trajectory: MultiAgentTrajectoryLinear
+    steering_controller: ControlPolicy
+
+    def __init__(
+        self,
+        trajectory: MultiAgentTrajectoryLinear,
+        steering_controller: ControlPolicy,
+    ):
+        # The class-level annotations above do not create attributes on their own
+        # (this class is not a dataclass), so store both collaborators explicitly.
+        self.trajectory = trajectory
+        self.steering_controller = steering_controller
+
+    @property
+    def observation_type(self):
+        """The class of observation this policy consumes."""
+        return TimedPose2DObservation
+
+    @property
+    def action_type(self):
+        """The class of action produced, as reported by the steering controller."""
+        return self.steering_controller.action_type
+
+    def compute_action(self, observation: TimedPose2DObservation) -> ControlAction:
+        """Takes in an observation and returns a control action."""
+        # Compute the desired waypoint at the time stamped on the observation
+        waypoint = self.trajectory(observation.t)
+
+        # Compute the control action to steer towards the waypoint
+        # NOTE(review): ControlPolicy.compute_action is declared with a single
+        # observation argument; confirm that the steering controller accepts the
+        # waypoint as a second argument, or wrap pose and goal in one observation.
+        return self.steering_controller.compute_action(observation, waypoint)
diff --git a/realm_gc/rgc_control/src/rgc_control/policies/tracking/steering_policies.py b/realm_gc/rgc_control/src/rgc_control/policies/tracking/steering_policies.py
@@ -0,0 +1,215 @@
+"""Define policies for steering different dynamical systems towards waypoints."""
+from dataclasses import dataclass
+
+import numpy as np
+import scipy
+
+from rgc_control.policies.policy import ControlAction, ControlPolicy, Observation
+
+
+@dataclass
+class Pose2DObservation(Observation):
+    """The observation for a single robot's 2D pose (position and heading)."""
+
+    x: float  # position along the x-axis
+    y: float  # position along the y-axis
+    theta: float  # heading angle in radians (it is fed directly to np.cos/np.sin)
+
+
+@dataclass
+class SteeringObservation(Observation):
+    """The observation for a single robot's 2D pose relative to some goal."""
+
+    pose: Pose2DObservation  # the robot's current pose
+    goal: Pose2DObservation  # the pose the steering policy should drive towards
+
+
+@dataclass
+class TurtlebotSteeringAction(ControlAction):
+    """The action for a turtlebot steering controller."""
+
+    linear_velocity: float  # commanded speed along the turtlebot's x-axis
+    angular_velocity: float  # commanded turning rate
+
+
+class TurtlebotSteeringPolicy(ControlPolicy):
+    """Steer a turtlebot towards a waypoint using a proportional controller."""
+
+    @property
+    def observation_type(self):
+        """The class of observation this policy consumes."""
+        return SteeringObservation
+
+    @property
+    def action_type(self):
+        """The class of action this policy produces."""
+        return TurtlebotSteeringAction
+
+    def compute_action(
+        self, observation: SteeringObservation
+    ) -> TurtlebotSteeringAction:
+        """Takes in an observation and returns a control action.
+
+        args:
+            observation: the current pose of the turtlebot and the goal pose
+        returns:
+            the linear and angular velocity commands
+        """
+        pose, goal = observation.pose, observation.goal
+
+        # Compute the position error in the turtlebot's frame by applying the
+        # transpose (i.e. inverse) of the rotation by the current heading.
+        dx = goal.x - pose.x
+        dy = goal.y - pose.y
+        cos_theta, sin_theta = np.cos(pose.theta), np.sin(pose.theta)
+        error_x = cos_theta * dx + sin_theta * dy
+        error_y = -sin_theta * dx + cos_theta * dy
+
+        # Compute the control action
+        linear_velocity = 0.5 * error_x  # projection along the turtlebot x-axis
+
+        # Compute the angular velocity: steer towards the goal if we're far from it
+        # (so the arctan is well defined), and align to the goal orientation
+        if linear_velocity > 0.05:
+            angular_velocity = np.arctan2(error_y, error_x)
+        else:
+            angle_error = goal.theta - pose.theta
+            # Wrap to [-pi, pi] no matter how many full turns the raw difference
+            # contains, so the robot always turns the short way round.
+            angle_error = np.arctan2(np.sin(angle_error), np.cos(angle_error))
+            angular_velocity = 0.1 * angle_error
+
+        # float() accepts both Python floats and numpy scalars, whereas .item()
+        # fails when the observation holds plain Python floats.
+        return TurtlebotSteeringAction(
+            linear_velocity=float(linear_velocity),
+            angular_velocity=float(angular_velocity),
+        )
+
+
+@dataclass
+class F1TenthSteeringAction(ControlAction):
+    """The action for a F1Tenth steering controller."""
+
+    # Without @dataclass these annotations would not become constructor fields,
+    # and building the action with keyword arguments would raise a TypeError.
+    steering_angle: float
+    acceleration: float
+
+
+class F1TenthSteeringPolicy(ControlPolicy):
+    """Steer a F1Tenth towards a waypoint using an LQR controller.
+
+    The feedback gain is computed once, at construction, from the dynamics
+    linearized about `equilibrium_state` with zero steering angle and zero
+    acceleration.
+
+    args:
+        equilibrium_state: the state [x, y, theta, v] around which to linearize
+            the dynamics
+        axle_length: the distance between the front and rear axles
+        dt: the time step for the controller
+    """
+
+    def __init__(self, equilibrium_state: np.ndarray, axle_length: float, dt: float):
+        # Import the submodule explicitly: a bare `import scipy` is not guaranteed
+        # to expose `scipy.linalg` on every SciPy version.
+        import scipy.linalg
+
+        self.axle_length = axle_length
+        self.dt = dt
+
+        # Linearize the dynamics
+        self.equilibrium_state = equilibrium_state
+        A, B = self.get_AB(equilibrium_state, 0.0, 0.0)
+
+        # Compute the LQR controller about the equilibrium
+        Q = np.eye(4)
+        R = np.eye(2)
+        X = scipy.linalg.solve_discrete_are(A, B, Q, R)
+        # K = (B^T X B + R)^-1 (B^T X A), obtained with a linear solve rather than
+        # an explicit inverse, using plain ndarrays and `@` instead of np.matrix.
+        self.K = scipy.linalg.solve(B.T @ X @ B + R, B.T @ X @ A)
+
+    @property
+    def observation_type(self):
+        """The class of observation this policy consumes."""
+        return SteeringObservation
+
+    @property
+    def action_type(self):
+        """The class of action this policy produces."""
+        return F1TenthSteeringAction
+
+    def get_AB(self, state, delta, a):
+        """
+        Compute the linearized dynamics matrices.
+
+        The matrices are the identity plus `dt` times the Jacobians of
+        x' = v cos(theta), y' = v sin(theta), theta' = (v / L) tan(delta), v' = a
+        evaluated at the given state and input, where L is the axle length.
+
+        Args:
+            state (np.ndarray): The current state [x, y, theta, v]
+            delta (float): The steering angle command
+            a (float): The acceleration command (does not appear in the Jacobians)
+
+        Returns:
+            The pair (A, B) with A of shape (4, 4) and B of shape (4, 2).
+        """
+        # Extract the state variables
+        _, _, theta, v = state
+
+        # Compute the linearized dynamics matrices
+        A = np.eye(4)
+        A[0, 2] = -v * np.sin(theta) * self.dt
+        A[0, 3] = np.cos(theta) * self.dt
+        A[1, 2] = v * np.cos(theta) * self.dt
+        A[1, 3] = np.sin(theta) * self.dt
+        A[2, 3] = (1.0 / self.axle_length) * np.tan(delta) * self.dt
+
+        B = np.zeros((4, 2))
+        B[2, 0] = (v / self.axle_length) * self.dt / np.cos(delta) ** 2
+        B[3, 1] = self.dt
+
+        return A, B
+
+    def compute_action(self, observation: SteeringObservation) -> F1TenthSteeringAction:
+        """Takes in an observation and returns a control action.
+
+        args:
+            observation: the current pose of the car and the goal pose
+        returns:
+            the steering angle and acceleration commands
+        """
+        pose, goal = observation.pose, observation.goal
+
+        # The observation carries no speed, so the equilibrium speed is used for
+        # both the state and the goal (the speed error is therefore always zero).
+        speed = self.equilibrium_state[3]
+        state = np.array([pose.x, pose.y, pose.theta, speed], dtype=float)
+        target = np.array([goal.x, goal.y, goal.theta, speed], dtype=float)
+
+        error = (state - target).reshape(-1, 1)
+        # Wrap the heading error to [-pi, pi] so that headings on either side of
+        # the +/-pi discontinuity do not command a turn the long way round.
+        error[2, 0] = np.arctan2(np.sin(error[2, 0]), np.cos(error[2, 0]))
+
+        u = -(self.K @ error)
+
+        return F1TenthSteeringAction(
+            steering_angle=float(u[0, 0]), acceleration=float(u[1, 0])
+        )
+
+
+if __name__ == "__main__":
+    # Smoke test for the turtlebot steering policy: roll the policy forward in a
+    # simple simulation and save a plot of the resulting path.
+    controller = TurtlebotSteeringPolicy()
+    target = Pose2DObservation(x=0.0, y=0.0, theta=0.0)
+    step = 0.05
+
+    state = np.array([-1.0, -1.0, 1.0])  # [x, y, theta]
+    history = [state.tolist()]
+    for _ in range(500):
+        current = Pose2DObservation(x=state[0], y=state[1], theta=state[2])
+        action = controller.compute_action(
+            SteeringObservation(pose=current, goal=target)
+        )
+
+        # Integrate the commanded velocities over one step
+        heading = state[2]
+        velocity = np.array(
+            [
+                action.linear_velocity * np.cos(heading),
+                action.linear_velocity * np.sin(heading),
+                action.angular_velocity,
+            ]
+        )
+        state += velocity * step
+        history.append(state.tolist())
+
+    import matplotlib
+    import matplotlib.pyplot as plt
+
+    matplotlib.use("Agg")
+
+    path = np.array(history)
+    start_x, start_y = path[0, 0], path[0, 1]
+    plt.plot(path[:, 0], path[:, 1])
+    plt.scatter(0.0, 0.0, c="r", label="Goal")
+    plt.scatter(start_x, start_y, c="g", label="Start")
+    plt.legend()
+    plt.savefig("src/realm_gc/turtlebot_steering.png")
diff --git a/realm_gc/rgc_control/src/rgc_control/policies/tracking/trajectory.py b/realm_gc/rgc_control/src/rgc_control/policies/tracking/trajectory.py
@@ -0,0 +1,46 @@
+"""Define linearly interpolated trajectories."""
+import equinox as eqx
+import jax.numpy as jnp
+from jaxtyping import Array, Float
+
+
+class LinearTrajectory2D(eqx.Module):
+    """
+    A single robot's path, defined by linear interpolation between control points.
+
+    The control points are spaced evenly over the normalized time interval [0, 1].
+
+    args:
+        p: the array of control points for the trajectory
+    """
+
+    p: Float[Array, "T 2"]
+
+    def __call__(self, t: Float[Array, ""]) -> Float[Array, "2"]:
+        """Return the point along the trajectory at the given time"""
+        # One evenly spaced knot per control point, shared by both axes
+        knots = jnp.linspace(0, 1, self.p.shape[0])
+
+        # Interpolate each axis separately
+        x = jnp.interp(t, knots, self.p[:, 0])
+        y = jnp.interp(t, knots, self.p[:, 1])
+        return jnp.array([x, y])
+
+
+class MultiAgentTrajectoryLinear(eqx.Module):
+    """
+    A bundle of per-robot trajectories that are all evaluated at the same time.
+
+    args:
+        trajectories: the list of trajectories for each robot.
+    """
+
+    trajectories: list[LinearTrajectory2D]
+
+    def __call__(self, t: Float[Array, ""]) -> Float[Array, "N 2"]:
+        """Return the waypoints for each agent at a given time (linear interpolate)"""
+        # Evaluate every agent's trajectory at t, then stack one row per agent
+        waypoints = [trajectory(t) for trajectory in self.trajectories]
+        return jnp.array(waypoints)