Merge branch 'main' into sample_gradient_v2

thowell · web-flow · commit 7eaf68d75b65 · 2024-01-31T18:40:58.000-08:00
diff --git a/mjpc/CMakeLists.txt b/mjpc/CMakeLists.txt
@@ -177,6 +177,28 @@ if(APPLE)
   target_link_libraries(mjpc "-framework Cocoa")
 endif()
 
+# Stand-alone `testspeed` executable, built from the command-line entry point
+# (testspeed_app.cc) and the TestSpeed implementation (testspeed.h/.cc).
+add_executable(
+  testspeed
+  testspeed_app.cc
+  testspeed.h
+  testspeed.cc
+)
+# Libraries the executable links against: Abseil (flags, random, strings), the
+# libmjpc library, MuJoCo, the thread pool and the platform thread library.
+target_link_libraries(
+  testspeed
+  absl::flags
+  absl::flags_parse
+  absl::random_random
+  absl::strings
+  libmjpc
+  mujoco::mujoco
+  threadpool
+  Threads::Threads
+)
+# Add the parent of this directory to the include path, so that includes of
+# the form "mjpc/..." resolve.
+target_include_directories(testspeed PRIVATE ${CMAKE_CURRENT_SOURCE_DIR}/..)
+# Apply the project-wide MJPC compile and link options to this target.
+target_compile_options(testspeed PUBLIC ${MJPC_COMPILE_OPTIONS})
+target_link_options(testspeed PRIVATE ${MJPC_LINK_OPTIONS})
+target_compile_definitions(testspeed PRIVATE MJSIMULATE_STATIC)
+
 add_subdirectory(tasks)
 
 if(BUILD_TESTING AND MJPC_BUILD_TESTS)
diff --git a/mjpc/tasks/cube/cube_3x3x3.xml.patch b/mjpc/tasks/cube/cube_3x3x3.xml.patch
@@ -23,7 +23,7 @@ diff --git a/cube_3x3x3_modified.xml b/cube_3x3x3_modified.xml
      <default class="cubelet">
 -      <joint type="ball" armature="0.0001" damping="0.0005" frictionloss="0.001"/>
 -      <geom type="mesh" condim="1" mesh="cubelet" euler="0 0 90"/>
-+      <joint type="ball" armature="0.00005" damping="0.0001" frictionloss="0.00005"/>
++      <joint type="ball" armature="0.0001" damping="0.0005" frictionloss="0.00005"/>
 +      <geom type="mesh" condim="1" mesh="cubelet" quat="1 0 0 1"/>
      </default>
      <default class="core">
diff --git a/mjpc/tasks/cube/solve.cc b/mjpc/tasks/cube/solve.cc
@@ -15,6 +15,7 @@
 #include "mjpc/tasks/cube/solve.h"
 
 #include <algorithm>
+#include <iostream>
 #include <random>
 #include <string>
 
@@ -131,6 +132,7 @@ void CubeSolve::ResidualFn::Residual(const mjModel* model, const mjData* data,
 void CubeSolve::TransitionLocked(mjModel* model, mjData* data) {
   if (transition_model_) {
     if (mode == kModeWait) {
+      weight[11] = .01;  // add penalty on joint movement
       // wait
     } else if (mode == kModeScramble) {  // scramble
       double scramble_param = parameters[6];
@@ -190,9 +192,11 @@ void CubeSolve::TransitionLocked(mjModel* model, mjData* data) {
 
       // set face goal index
       goal_index_ = num_scramble - 1;
+      std::cout << "rotations required: " << num_scramble << "\n";
 
       // set to solve
       mode = kModeSolve;
+      weight[11] = 0;  // remove penalty on joint movement
     } else if (mode == kModeSolve) {  // solve
       // set goal
       mju_copy(parameters.data(), goal_cache_.data() + 6 * goal_index_, 6);
@@ -204,7 +208,9 @@ void CubeSolve::TransitionLocked(mjModel* model, mjData* data) {
       if (mju_norm(error, 6) < 0.085) {
         if (goal_index_ == 0) {
           mode = kModeWait;
+          std::cout << "solved!\n";
         } else {
+          std::cout << "rotations remaining: " << goal_index_ << "\n";
           goal_index_--;
         }
       }
@@ -213,11 +219,10 @@ void CubeSolve::TransitionLocked(mjModel* model, mjData* data) {
 
   // check for drop
   if (data->qpos[6] < kResetHeight) {
-    // reset cube position + orientation
-    mju_copy(data->qpos, model->key_qpos, 7);
+    if (mode != kModeWait) { std::cout << "cube fell\n"; }
 
-    // reset cube velocity
-    mju_zero(data->qvel, 6);
+    // stop optimization
+    mode = kModeWait;
   }
 
   // check goal index
diff --git a/mjpc/tasks/cube/task.xml b/mjpc/tasks/cube/task.xml
@@ -12,8 +12,8 @@
     <numeric name="agent_policy_width" data="0.0035" />
     <numeric name="sampling_spline_points" data="6" />
     <numeric name="sampling_exploration" data="0.1" />
-    <numeric name="sampling_trajectories" data="20" />
-    <numeric name="sampling_representation" data="0" />
+    <numeric name="sampling_trajectories" data="60" />
+    <numeric name="sampling_representation" data="1" />
     <!-- manual face goals -->
     <numeric name="residual_Red" data="0 -3.14 3.14"/>
     <numeric name="residual_Orange" data="0 -3.14 3.14"/>
diff --git a/mjpc/tasks/tasks.cc b/mjpc/tasks/tasks.cc
@@ -17,6 +17,7 @@
 #include <memory>
 #include <vector>
 
+#include "mjpc/task.h"
 #include "mjpc/tasks/acrobot/acrobot.h"
 #include "mjpc/tasks/cube/solve.h"
 #include "mjpc/tasks/cartpole/cartpole.h"
diff --git a/mjpc/testspeed.cc b/mjpc/testspeed.cc
@@ -0,0 +1,128 @@
+// Copyright 2024 DeepMind Technologies Limited
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "mjpc/testspeed.h"
+
+#include <chrono>
+#include <cmath>
+#include <iostream>
+#include <string>
+#include <vector>
+
+#include <mujoco/mujoco.h>
+
+#include "mjpc/agent.h"
+#include "mjpc/states/state.h"
+#include "mjpc/task.h"
+#include "mjpc/threadpool.h"
+#include "mjpc/utilities.h"
+#include "mjpc/tasks/tasks.h"
+
+namespace mjpc {
+
+namespace {
+// Task used by residual_callback. TestSpeed assigns it before installing the
+// callback.
+Task* task = nullptr;
+
+// MuJoCo sensor callback: at the acceleration stage, invokes the current
+// task's Residual, passing data->sensordata. All other stages are ignored.
+void residual_callback(const mjModel* model, mjData* data, int stage) {
+  if (stage != mjSTAGE_ACC) {
+    return;
+  }
+  task->Residual(model, data, data->sensordata);
+}
+}  // namespace
+
+// Runs synchronous planning on a task and prints timing info.
+//
+// Arguments:
+//   task_name: name of the task to run; must be one of the names known to the
+//     agent's task list.
+//   planner_thread_count: number of threads in the planning thread pool.
+//   steps_per_planning_iteration: one planning iteration is run every this
+//     many physics steps; must be at least 1.
+//   total_time: simulated time to run for, in seconds.
+//
+// Returns 0 if nothing failed, -1 if an argument is invalid (unknown task name
+// or non-positive steps_per_planning_iteration), 1 if the model fails to load.
+int TestSpeed(std::string task_name, int planner_thread_count,
+              int steps_per_planning_iteration, double total_time) {
+  // the step index is taken modulo this value below, so it must be positive
+  if (steps_per_planning_iteration < 1) {
+    std::cerr << "Invalid steps_per_planning_iteration: "
+              << steps_per_planning_iteration << " (must be at least 1)\n";
+    return -1;
+  }
+
+  std::cout << "Test MJPC Speed\n";
+  std::cout << " MuJoCo version " << mj_versionString() << "\n";
+  if (mjVERSION_HEADER != mj_version()) {
+    mju_error("Headers and library have Different versions");
+  }
+  std::cout << " Hardware threads:  " << NumAvailableHardwareThreads() << "\n";
+
+  Agent agent;
+  agent.SetTaskList(GetTasks());
+  agent.gui_task_id = agent.GetTaskIdByName(task_name);
+  if (agent.gui_task_id == -1) {
+    std::cerr << "Invalid --task flag: '" << task_name
+              << "'. Valid values:\n";
+    std::cerr << agent.GetTaskNames();
+    return -1;
+  }
+  auto load_model = agent.LoadModel();
+  // ownership of the model is taken here; it is freed with mj_deleteModel below
+  mjModel* model = load_model.model.release();
+  if (!model) {
+    std::cerr << load_model.error << "\n";
+    return 1;
+  }
+  mjData* data = mj_makeData(model);
+  mj_forward(model, data);
+
+  // start from the "home" keyframe when the model defines one
+  int home_id = mj_name2id(model, mjOBJ_KEY, "home");
+  if (home_id >= 0) {
+    std::cout << "home_id: " << home_id << "\n";
+    mj_resetDataKeyframe(model, data, home_id);
+  }
+
+  // the planner and its initial configuration are set in the XML
+  agent.estimator_enabled = false;
+  agent.Initialize(model);
+  agent.Allocate();
+  agent.Reset(data->ctrl);
+  agent.plan_enabled = true;
+
+  // make task available for global callback, remembering the previously
+  // installed sensor callback so that it can be restored before returning
+  auto previous_sensor_callback = mjcb_sensor;
+  task = agent.ActiveTask();
+  mjcb_sensor = &residual_callback;
+
+  std::cout << " Planning threads:  " << planner_thread_count << "\n";
+  ThreadPool pool(planner_thread_count);
+
+  int total_steps = static_cast<int>(std::ceil(total_time / model->opt.timestep));
+  int current_time = 0;
+  int planning_steps = 0;  // number of planning iterations actually run
+  double total_cost = 0;
+  auto loop_start = std::chrono::steady_clock::now();
+  for (int i = 0; i < total_steps; i++) {
+    agent.ActiveTask()->Transition(model, data);
+    agent.state.Set(model, data);
+
+    agent.ActivePlanner().ActionFromPolicy(
+        data->ctrl, agent.state.state().data(),
+        agent.state.time(), /*use_previous=*/false);
+    mj_step(model, data);
+    double cost = agent.ActiveTask()->CostValue(data->sensordata);
+    total_cost += cost;
+
+    if (i % steps_per_planning_iteration == 0) {
+      agent.PlanIteration(&pool);
+      planning_steps++;
+    }
+
+    // report the current cost once per elapsed second of simulated time
+    if (std::floor(data->time) > current_time) {
+      current_time++;
+      std::cout << "sim time: " << current_time << ", cost: " << cost << "\n";
+    }
+  }
+  auto wall_run_time = std::chrono::duration_cast<std::chrono::microseconds>(
+                            std::chrono::steady_clock::now() - loop_start)
+                            .count() /
+                        1e6;
+  std::cout << "Total wall time (" << planning_steps
+            << " planning steps): " << wall_run_time << " s ("
+            << total_time / wall_run_time << "x realtime)\n";
+  std::cout << "Average cost per step (lower is better): "
+            << total_cost / total_steps << "\n";
+
+  // `agent` is destroyed when this function returns; uninstall the callback so
+  // that later MuJoCo calls do not use a task pointer obtained from it
+  mjcb_sensor = previous_sensor_callback;
+  task = nullptr;
+
+  mj_deleteData(data);
+  mj_deleteModel(model);
+  return 0;
+}
+}  // namespace mjpc
diff --git a/mjpc/testspeed.h b/mjpc/testspeed.h
@@ -0,0 +1,25 @@
+// Copyright 2024 DeepMind Technologies Limited
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef MJPC_MJPC_TESTSPEED_H_
+#define MJPC_MJPC_TESTSPEED_H_
+
+#include <string>
+
+namespace mjpc {
+// Runs synchronous planning on the task named `task_name` and prints timing
+// information. Planning uses a pool of `planner_thread_count` threads, and a
+// planning iteration is run every `steps_per_planning_iteration` physics
+// steps, for `total_time` seconds of simulated time.
+// Returns 0 if nothing failed and a non-zero value otherwise.
+int TestSpeed(std::string task_name, int planner_thread_count,
+              int steps_per_planning_iteration, double total_time);
+}  // namespace mjpc
+
+#endif  // MJPC_MJPC_TESTSPEED_H_
diff --git a/mjpc/testspeed_app.cc b/mjpc/testspeed_app.cc
@@ -0,0 +1,39 @@
+// Copyright 2024 DeepMind Technologies Limited
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include <string>
+
+#include <absl/flags/parse.h>
+#include <absl/flags/flag.h>
+
+#include "mjpc/testspeed.h"
+#include "mjpc/utilities.h"
+
+// Command-line flags; their values are forwarded to mjpc::TestSpeed by main.
+ABSL_FLAG(std::string, task, "Cube Solving", "Which model to load on startup.");
+// The default keeps five hardware threads out of the planner pool, but never
+// drops below one planner thread on machines with five or fewer threads.
+ABSL_FLAG(int, planner_thread,
+          mjpc::NumAvailableHardwareThreads() > 5
+              ? mjpc::NumAvailableHardwareThreads() - 5
+              : 1,
+          "Number of planner threads to use.");
+ABSL_FLAG(int, steps_per_planning_iteration, 4,
+          "How many physics steps to take between planning iterations.");
+ABSL_FLAG(double, total_time, 10, "Total time to simulate (seconds).");
+
+// Parses the command-line flags and forwards their values to mjpc::TestSpeed;
+// the process exit code is TestSpeed's return value.
+int main(int argc, char** argv) {
+  absl::ParseCommandLine(argc, argv);
+
+  const std::string name = absl::GetFlag(FLAGS_task);
+  const int threads = absl::GetFlag(FLAGS_planner_thread);
+  const int steps_between_plans =
+      absl::GetFlag(FLAGS_steps_per_planning_iteration);
+  const double seconds = absl::GetFlag(FLAGS_total_time);
+
+  return mjpc::TestSpeed(name, threads, steps_between_plans, seconds);
+}
diff --git a/mjpc/testspeed_test.cc b/mjpc/testspeed_test.cc
@@ -0,0 +1,27 @@
+// Copyright 2024 DeepMind Technologies Limited
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "mjpc/testspeed.h"
+
+#include "gtest/gtest.h"
+
+namespace {
+
+// Smoke test: a synchronous planning run on the Cartpole task must complete
+// and report success (return value 0).
+TEST(TestSpeed, Test) {
+  EXPECT_EQ(
+      mjpc::TestSpeed("Cartpole", /*planner_thread_count=*/10,
+                      /*steps_per_planning_iteration=*/10, /*total_time=*/10),
+      0);
+}
+}  // namespace