sim control

solve conflicts
update strong pointnet++
2025-04-09 15:17:24 +08:00 · 2025-03-13 14:49:35 +08:00 · 2025-03-13 14:48:15 +08:00 · 2025-01-23 08:58:10 +00:00 · 2025-01-07 19:32:02 +08:00 · 2025-01-05 23:57:43 +08:00
17 changed files with 725 additions and 88 deletions
--- a/app_sim.py
+++ b/app_sim.py
@@ -0,0 +1,11 @@
 from PytorchBoot.application import PytorchBootApplication
 from runners.simulator import Simulator
@PytorchBootApplication("sim")
class SimulateApp:
    """PytorchBoot application registered as "sim" that drives the Simulator runner."""

    @staticmethod
    def start():
        """Build the simulator from the local config and run its two commands in order."""
        sim = Simulator("configs/local/simulation_config.yaml")
        # "create" is issued first, then "simulate"; the order is fixed.
        for command in ("create", "simulate"):
            sim.run(command)
--- a/configs/local/inference_config.yaml
+++ b/configs/local/inference_config.yaml
@@ -6,16 +6,16 @@ runner:
    cuda_visible_devices: "0,1,2,3,4,5,6,7"
  experiment:
-    name: train_ab_global_only
+    name: train_ab_global_only_p++_wp
    root_dir: "experiments"
-    epoch: -1 # -1 stands for last epoch
+    epoch: 922 # -1 stands for last epoch
  test:
    dataset_list:
      - OmniObject3d_test
  blender_script_path: "/media/hofee/data/project/python/nbv_reconstruction/blender/data_renderer.py"
-  output_dir: "/media/hofee/data/results/nbv_rec_inference/global_only_ycb_241204"
+  output_dir: "/media/hofee/data/data/p++_wp"
  pipeline: nbv_reconstruction_pipeline
  voxel_size: 0.003
  min_new_area: 1.0
@@ -34,8 +34,8 @@ dataset:
  #   load_from_preprocess: True
  OmniObject3d_test:
-    root_dir: "/media/hofee/data/results/ycb_preprocessed_dataset"
+    root_dir: "/media/hofee/data/data/new_testset_output"
-    model_dir: "/media/hofee/data/data/ycb_obj"
+    model_dir: "/media/hofee/data/data/scaled_object_meshes"
    source: seq_reconstruction_dataset_preprocessed
    # split_file: "C:\\Document\\Datasets\\data_list\\OmniObject3d_test.txt"
    type: test
@@ -52,7 +52,7 @@ dataset:
 pipeline:
  nbv_reconstruction_pipeline:
    modules:
-      pts_encoder: pointnet_encoder
+      pts_encoder: pointnet++_encoder
      seq_encoder: transformer_seq_encoder
      pose_encoder: pose_encoder
      view_finder: gf_view_finder
@@ -60,6 +60,10 @@ pipeline:
    global_scanned_feat: True
 module:
  pointnet++_encoder:
    in_dim: 3
    params_name: light
  pointnet_encoder:
    in_dim: 3
    out_dim: 1024
--- a/configs/local/simulation_config.yaml
+++ b/configs/local/simulation_config.yaml
@@ -0,0 +1,36 @@
 runner:
  general:
    seed: 0
    device: cuda
    cuda_visible_devices: "0,1,2,3,4,5,6,7"
  experiment:
    name: simulation_debug
    root_dir: "experiments"
 simulation:
  robot:
    urdf_path: "assets/franka_panda/panda.urdf"
    initial_position: [0, 0, 0]  # robot arm base position
    initial_orientation: [0, 0, 0]  # robot arm base orientation (Euler angles)
  turntable:
    radius: 0.3  # turntable radius (meters)
    height: 0.1  # turntable height
    center_position: [0.8, 0, 0.4]  
  target:
    obj_dir: /media/hofee/data/project/python/nbv_reconstruction/nbv_reconstruction/assets/object_meshes
    obj_name: "google_scan-box_0185"        
    scale: 1.0  # scale factor
    mass: 0.1   # mass (kg)
    rgba_color: [0.8, 0.8, 0.8, 1.0]  # target object color
  camera:
    width: 640
    height: 480
    fov: 40
    near: 0.01
    far: 5.0
 displaytable:
--- a/configs/local/strategy_generate_config.yaml
+++ b/configs/local/strategy_generate_config.yaml
@@ -15,13 +15,13 @@ runner:
    overlap_area_threshold: 30
    compute_with_normal: False
    scan_points_threshold: 10
-    overwrite: False
+    overwrite: False  
    seq_num: 10
    dataset_list:
      - OmniObject3d
 datasets:
    OmniObject3d:
-      root_dir: /media/hofee/data/results/ycb_view_data
+      root_dir: /media/hofee/data/data/test_bottle/view 
      from: 0
      to: -1 # ..-1 means end
--- a/configs/local/view_generate_config.yaml
+++ b/configs/local/view_generate_config.yaml
@@ -8,16 +8,16 @@ runner:
    root_dir: experiments
  generate:
    port: 5002
-    from: 1
+    from: 0
    to: 50 # -1 means all
-    object_dir: /media/hofee/data/data/ycb_obj
+    object_dir: /media/hofee/data/data/test_bottle/bottle_mesh
    table_model_path: /media/hofee/data/data/others/table.obj
-    output_dir: /media/hofee/data/results/ycb_view_data
+    output_dir: /media/hofee/data/data/test_bottle/view
    binocular_vision: true
    plane_size: 10
    max_views: 512
    min_views: 128
-    random_view_ratio: 0.02
+    random_view_ratio: 0.002
    min_cam_table_included_degree: 20
    max_diag: 0.7
    min_diag: 0.01
@@ -34,7 +34,7 @@ runner:
        max_y: 0.05
        min_z: 0.01
        max_z: 0.01
-        random_rotation_ratio: 0.3
+        random_rotation_ratio: 0.0
      random_objects:
        num: 4
        cluster: 0.9
--- a/configs/server/server_train_config.yaml
+++ b/configs/server/server_train_config.yaml
@@ -7,19 +7,19 @@ runner:
    parallel: False
  experiment:
-    name: train_ab_global_only_with_wp_p++_dense
+    name: train_ab_global_only_with_wp_p++_strong
    root_dir: "experiments"
    use_checkpoint: False
    epoch: -1 # -1 stands for last epoch
    max_epochs: 5000
    save_checkpoint_interval: 1
-    test_first: True  
+    test_first: False  
  train:
    optimizer:
      type: Adam
      lr: 0.0001
-    losses: 
+    losses:   
      - gf_loss
    dataset: OmniObject3d_train
  test:
@@ -39,7 +39,7 @@ dataset:
    type: train
    cache: True
    ratio: 1
-    batch_size: 80
+    batch_size: 64
    num_workers: 128
    pts_num: 8192
    load_from_preprocess: True
@@ -98,7 +98,7 @@ module:
  pointnet++_encoder:
    in_dim: 3
-    params_name: dense
+    params_name: strong
  transformer_seq_encoder:
    embed_dim: 256
@@ -110,7 +110,7 @@ module:
  gf_view_finder:
    t_feat_dim: 128
    pose_feat_dim: 256
-    main_feat_dim: 2048
+    main_feat_dim: 5120
    regression_head: Rx_Ry_and_T
    pose_mode: rot_matrix
    per_point_feature: False
--- a/core/pipeline.py
+++ b/core/pipeline.py
@@ -75,6 +75,8 @@ class NBVReconstructionPipeline(nn.Module):
    def forward_test(self, data):
        main_feat = self.get_main_feat(data)
        repeat_num = data.get("repeat_num", 1)
        main_feat = main_feat.repeat(repeat_num, 1)
        estimated_delta_rot_9d, in_process_sample = self.view_finder.next_best_view(
            main_feat
        )
--- a/core/seq_dataset.py
+++ b/core/seq_dataset.py
@@ -64,11 +64,15 @@ class SeqReconstructionDataset(BaseDataset):
            scene_max_cr_idx = 0
            frame_len = DataLoadUtil.get_scene_seq_length(self.root_dir, scene_name)
-            for i in range(frame_len):
+            for i in range(10,frame_len):
                path = DataLoadUtil.get_path(self.root_dir, scene_name, i)
                pts = DataLoadUtil.load_from_preprocessed_pts(path, "npy")
                print(pts.shape)
                if pts.shape[0] == 0:
                    continue
                else:
                    break
            print(i)
            datalist.append({
                "scene_name": scene_name,
                "first_frame": i,
@@ -180,9 +184,9 @@ if __name__ == "__main__":
    np.random.seed(seed)
    config = {
-        "root_dir": "/media/hofee/data/results/ycb_view_data",
+        "root_dir": "/media/hofee/data/data/test_bottle/view",
        "source": "seq_reconstruction_dataset",
-        "split_file": "/media/hofee/data/results/ycb_test.txt",
+        "split_file": "/media/hofee/data/data/test_bottle/test_bottle.txt",
        "load_from_preprocess": True,
        "filter_degree": 75,
        "num_workers": 0,
@@ -190,7 +194,7 @@ if __name__ == "__main__":
        "type": namespace.Mode.TEST,
    }
-    output_dir = "/media/hofee/data/results/ycb_preprocessed_dataset"
+    output_dir = "/media/hofee/data/data/test_bottle/preprocessed_dataset"
    os.makedirs(output_dir, exist_ok=True)
    ds = SeqReconstructionDataset(config)
--- a/core/seq_dataset_preprocessed.py
+++ b/core/seq_dataset_preprocessed.py
@@ -21,7 +21,7 @@ class SeqReconstructionDatasetPreprocessed(BaseDataset):
        super(SeqReconstructionDatasetPreprocessed, self).__init__(config)
        self.config = config
        self.root_dir = config["root_dir"]
-        self.real_root_dir = r"/media/hofee/data/results/ycb_view_data"
+        self.real_root_dir = r"/media/hofee/data/data/new_testset"
        self.item_list = os.listdir(self.root_dir)
    def __getitem__(self, index):
@@ -66,7 +66,7 @@ if __name__ == "__main__":
    load_from_preprocess: True
    '''
    config = {
-        "root_dir": "H:\\AI\\Datasets\\packed_test_data",
+        "root_dir": "/media/hofee/data/data/test_bottle/preprocessed_dataset",
        "source": "seq_reconstruction_dataset",
        "split_file": "H:\\AI\\Datasets\\data_list\\OmniObject3d_test.txt",
        "load_from_preprocess": True,
--- a/modules/pointnet++_encoder.py
+++ b/modules/pointnet++_encoder.py
@@ -33,6 +33,30 @@ ClsMSG_CFG_Light = {
    'DP_RATIO': 0.5,
 }
 # Parameter set returned by select_params('light_2048').
 # Every list has four entries (one per level) and each level holds two
 # radius / sample-count / MLP groups. The last level uses None for NPOINTS,
 # RADIUS and NSAMPLE -- presumably a global grouping over all remaining
 # points; confirm against PointNet2Encoder.
 # NOTE(review): both last-level MLPs end in 1024 channels, so the name
 # suggests a 2 x 1024 = 2048-dim output -- TODO confirm.
 ClsMSG_CFG_Light_2048 = {
    'NPOINTS': [512, 256, 128, None],
    'RADIUS': [[0.02, 0.04], [0.04, 0.08], [0.08, 0.16], [None, None]],
    'NSAMPLE': [[16, 32], [16, 32], [16, 32], [None, None]],
    'MLPS': [[[16, 16, 32], [32, 32, 64]],
         [[64, 64, 128], [64, 96, 128]],
         [[128, 196, 256], [128, 196, 256]],
         [[256, 256, 1024], [256, 512, 1024]]],
    'DP_RATIO': 0.5,
 }
 # Parameter set returned by select_params('strong').
 # Every list has five entries (one per level) and each level holds two
 # radius / sample-count / MLP groups; the radii double from level to level
 # (0.02/0.04 up to 0.16/0.32). The last level uses None for NPOINTS, RADIUS
 # and NSAMPLE -- presumably a global grouping over all remaining points;
 # confirm against PointNet2Encoder.
 # NOTE(review): both last-level MLPs end in 2048 channels; any consumer that
 # hard-codes the encoder feature width must match -- TODO confirm.
 ClsMSG_CFG_Strong = {
    'NPOINTS': [512, 256, 128, 64, None],
    'RADIUS': [[0.02, 0.04], [0.04, 0.08], [0.08, 0.16],[0.16, 0.32], [None, None]],
    'NSAMPLE': [[16, 32], [16, 32], [16, 32], [16, 32], [None, None]],
    'MLPS': [[[16, 16, 32], [32, 32, 64]],
         [[64, 64, 128], [64, 96, 128]],
         [[128, 196, 256], [128, 196, 256]],
         [[256, 256, 512], [256, 512, 512]],
         [[512, 512, 2048], [512, 1024, 2048]]
         ],
    'DP_RATIO': 0.5,
 }
 ClsMSG_CFG_Lighter = {
    'NPOINTS': [512, 256, 128, 64, None],
    'RADIUS': [[0.01], [0.02], [0.04], [0.08], [None]],
@@ -53,6 +77,10 @@ def select_params(name):
        return ClsMSG_CFG_Lighter
    elif name == 'dense':
        return ClsMSG_CFG_Dense
    elif name == 'light_2048':
        return ClsMSG_CFG_Light_2048
    elif name == 'strong':
        return ClsMSG_CFG_Strong
    else:
        raise NotImplementedError
@@ -114,8 +142,8 @@ if __name__ == '__main__':
    seed = 100
    torch.manual_seed(seed)
    torch.cuda.manual_seed(seed)
-    net = PointNet2Encoder(config={"in_dim": 3, "params_name": "light"}).cuda()
+    net = PointNet2Encoder(config={"in_dim": 3, "params_name": "strong"}).cuda()
-    pts = torch.randn(2, 1024, 3).cuda()
+    pts = torch.randn(2, 2444, 3).cuda()
    print(torch.mean(pts, dim=1))
    pre = net.encode_points(pts)
    print(pre.shape)
--- a/preprocess/preprocessor.py
+++ b/preprocess/preprocessor.py
@@ -164,7 +164,7 @@ def save_scene_data(root, scene, scene_idx=0, scene_total=1,file_type="txt"):
 if __name__ == "__main__":
    #root = "/media/hofee/repository/new_data_with_normal"
-    root = r"/media/hofee/data/results/ycb_view_data"
+    root = r"/media/hofee/data/data/test_bottle/view"
    scene_list = os.listdir(root)
    from_idx = 0 # 1000
    to_idx = len(scene_list) # 1500
--- a/runners/inference_server.py
+++ b/runners/inference_server.py
@@ -12,6 +12,7 @@ from PytorchBoot.runners.runner import Runner
 from PytorchBoot.utils import Log
 from utils.pts import PtsUtil
 from beans.predict_result import PredictResult
@stereotype.runner("inferencer_server")
 class InferencerServer(Runner):
@@ -50,6 +51,7 @@ class InferencerServer(Runner):
    def get_result(self, output_data):
        pred_pose_9d = output_data["pred_pose_9d"]
        pred_pose_9d = np.asarray(PredictResult(pred_pose_9d.cpu().numpy(), None, cluster_params=dict(eps=0.25, min_samples=3)).candidate_9d_poses, dtype=np.float32)
        result = {
            "pred_pose_9d": pred_pose_9d.tolist()
        }
--- a/runners/inferencer.py
+++ b/runners/inferencer.py
@@ -83,6 +83,7 @@ class Inferencer(Runner):
                        data = test_set.__getitem__(i)
                        scene_name = data["scene_name"]
                        inference_result_path = os.path.join(self.output_dir, test_set_name, f"{scene_name}.pkl")
                        if os.path.exists(inference_result_path):
                            Log.info(f"Inference result already exists for scene: {scene_name}")
                            continue
@@ -136,81 +137,98 @@ class Inferencer(Runner):
        pred_cr_seq = [last_pred_cr]
        success = 0
        last_pts_num = PtsUtil.voxel_downsample_point_cloud(data["first_scanned_pts"][0], voxel_threshold).shape[0]
-        import time
+        #import time
        while len(pred_cr_seq) < max_iter and retry < max_retry and success < max_success:
            Log.green(f"iter: {len(pred_cr_seq)}, retry: {retry}/{max_retry}, success: {success}/{max_success}")
            combined_scanned_pts = np.vstack(scanned_view_pts)
            voxel_downsampled_combined_scanned_pts_np, inverse =  self.voxel_downsample_with_mapping(combined_scanned_pts, voxel_threshold)
            output = self.pipeline(input_data)
            pred_pose_9d = output["pred_pose_9d"]
            import ipdb; ipdb.set_trace()
            pred_pose = torch.eye(4, device=pred_pose_9d.device)
-
+            # # save pred_pose_9d ------
-            pred_pose[:3,:3] = PoseUtil.rotation_6d_to_matrix_tensor_batch(pred_pose_9d[:,:6])[0]
+            # root = "/media/hofee/data/project/python/nbv_reconstruction/nbv_reconstruction/temp_output_result"
-            pred_pose[:3,3] = pred_pose_9d[0,6:]
+            # scene_dir = os.path.join(root, scene_name)
-            
+            # if not os.path.exists(scene_dir):
-            try:
+            #     os.makedirs(scene_dir)
-                new_target_pts, new_target_normals, new_scan_points_indices = RenderUtil.render_pts(pred_pose, scene_path, self.script_path, scan_points, voxel_threshold=voxel_threshold, filter_degree=filter_degree, nO_to_nL_pose=O_to_L_pose)
+            # pred_9d_path = os.path.join(scene_dir,f"pred_pose_9d_{len(pred_cr_seq)}.npy")
            # pts_path = os.path.join(scene_dir,f"combined_scanned_pts_{len(pred_cr_seq)}.txt")
            # np_combined_scanned_pts = input_data["combined_scanned_pts"][0].cpu().numpy()
            # np.save(pred_9d_path, pred_pose_9d.cpu().numpy())
            # np.savetxt(pts_path, np_combined_scanned_pts)
            # # ----- ----- -----
            predict_result = PredictResult(pred_pose_9d.cpu().numpy(), input_pts=input_data["combined_scanned_pts"][0].cpu().numpy(), cluster_params=dict(eps=0.25, min_samples=3))
            # -----------------------
            # import ipdb; ipdb.set_trace()
            # predict_result.visualize()
            # -----------------------
            pred_pose_9d_candidates = predict_result.candidate_9d_poses
            for pred_pose_9d in pred_pose_9d_candidates:
                #import ipdb; ipdb.set_trace()
-                if not ReconstructionUtil.check_scan_points_overlap(history_indices, new_scan_points_indices, scan_points_threshold):
+                pred_pose_9d = torch.tensor(pred_pose_9d, dtype=torch.float32).to(self.device).unsqueeze(0)
-                    curr_overlap_area_threshold = overlap_area_threshold
+                pred_pose[:3,:3] = PoseUtil.rotation_6d_to_matrix_tensor_batch(pred_pose_9d[:,:6])[0]
-                else:
+                pred_pose[:3,3] = pred_pose_9d[0,6:]
-                    curr_overlap_area_threshold = overlap_area_threshold * 0.5  
+                try:
                    new_target_pts, new_target_normals, new_scan_points_indices = RenderUtil.render_pts(pred_pose, scene_path, self.script_path, scan_points, voxel_threshold=voxel_threshold, filter_degree=filter_degree, nO_to_nL_pose=O_to_L_pose)
                    #import ipdb; ipdb.set_trace()
                    if not ReconstructionUtil.check_scan_points_overlap(history_indices, new_scan_points_indices, scan_points_threshold):
                        curr_overlap_area_threshold = overlap_area_threshold
                    else:
                        curr_overlap_area_threshold = overlap_area_threshold * 0.5  
-                downsampled_new_target_pts = PtsUtil.voxel_downsample_point_cloud(new_target_pts, voxel_threshold)
+                    downsampled_new_target_pts = PtsUtil.voxel_downsample_point_cloud(new_target_pts, voxel_threshold)
-                overlap, _ = ReconstructionUtil.check_overlap(downsampled_new_target_pts, voxel_downsampled_combined_scanned_pts_np, overlap_area_threshold = curr_overlap_area_threshold, voxel_size=voxel_threshold, require_new_added_pts_num = True)
+                    overlap, _ = ReconstructionUtil.check_overlap(downsampled_new_target_pts, voxel_downsampled_combined_scanned_pts_np, overlap_area_threshold = curr_overlap_area_threshold, voxel_size=voxel_threshold, require_new_added_pts_num = True)
-                if not overlap:
+                    if not overlap:
-                    Log.yellow("no overlap!")
+                        Log.yellow("no overlap!")
                        retry += 1
                        retry_overlap_pose.append(pred_pose.cpu().numpy().tolist())
                        continue
                    history_indices.append(new_scan_points_indices)
                except Exception as e:
                    Log.error(f"Error in scene {scene_path}, {e}")
                    print("current pose: ", pred_pose)
                    print("curr_pred_cr: ", last_pred_cr)
                    retry_no_pts_pose.append(pred_pose.cpu().numpy().tolist())
                    retry += 1
                    retry_overlap_pose.append(pred_pose.cpu().numpy().tolist())
                    continue
-                history_indices.append(new_scan_points_indices)
+                if new_target_pts.shape[0] == 0:
-            except Exception as e:
+                    Log.red("no pts in new target")
-                Log.error(f"Error in scene {scene_path}, {e}")
+                    retry_no_pts_pose.append(pred_pose.cpu().numpy().tolist())
-                print("current pose: ", pred_pose)
+                    retry += 1
-                print("curr_pred_cr: ", last_pred_cr)
+                    continue
                retry_no_pts_pose.append(pred_pose.cpu().numpy().tolist())
                retry += 1
                continue
            if new_target_pts.shape[0] == 0:
                Log.red("no pts in new target")
                retry_no_pts_pose.append(pred_pose.cpu().numpy().tolist())
                retry += 1
                continue
            pred_cr, _ = self.compute_coverage_rate(scanned_view_pts, new_target_pts, down_sampled_model_pts, threshold=voxel_threshold)
            Log.yellow(f"{pred_cr}, {last_pred_cr}, max: , {data['seq_max_coverage_rate']}")
            if pred_cr >= data["seq_max_coverage_rate"] - 1e-3:
                print("max coverage rate reached!: ", pred_cr)
-        
+                pred_cr, _ = self.compute_coverage_rate(scanned_view_pts, new_target_pts, down_sampled_model_pts, threshold=voxel_threshold)
-
+                Log.yellow(f"{pred_cr}, {last_pred_cr}, max: , {data['seq_max_coverage_rate']}")
-            pred_cr_seq.append(pred_cr)
+                if pred_cr >= data["seq_max_coverage_rate"] - 1e-3:
-            scanned_view_pts.append(new_target_pts)
+                    print("max coverage rate reached!: ", pred_cr)
            input_data["scanned_n_to_world_pose_9d"] = [torch.cat([input_data["scanned_n_to_world_pose_9d"][0], pred_pose_9d], dim=0)]
            combined_scanned_pts = np.vstack(scanned_view_pts)
            voxel_downsampled_combined_scanned_pts_np = PtsUtil.voxel_downsample_point_cloud(combined_scanned_pts, voxel_threshold)
            random_downsampled_combined_scanned_pts_np = PtsUtil.random_downsample_point_cloud(voxel_downsampled_combined_scanned_pts_np, input_pts_N)
            input_data["combined_scanned_pts"] = torch.tensor(random_downsampled_combined_scanned_pts_np, dtype=torch.float32).unsqueeze(0).to(self.device)
-            
+                pred_cr_seq.append(pred_cr)
-            last_pred_cr = pred_cr
+                scanned_view_pts.append(new_target_pts)
-            pts_num = voxel_downsampled_combined_scanned_pts_np.shape[0]
+                
-            Log.info(f"delta pts num:,{pts_num - last_pts_num },{pts_num}, {last_pts_num}")
+                input_data["scanned_n_to_world_pose_9d"] = [torch.cat([input_data["scanned_n_to_world_pose_9d"][0], pred_pose_9d], dim=0)]
                combined_scanned_pts = np.vstack(scanned_view_pts)
                voxel_downsampled_combined_scanned_pts_np = PtsUtil.voxel_downsample_point_cloud(combined_scanned_pts, voxel_threshold)
                random_downsampled_combined_scanned_pts_np = PtsUtil.random_downsample_point_cloud(voxel_downsampled_combined_scanned_pts_np, input_pts_N)
                input_data["combined_scanned_pts"] = torch.tensor(random_downsampled_combined_scanned_pts_np, dtype=torch.float32).unsqueeze(0).to(self.device)
-            if pts_num - last_pts_num < self.min_new_pts_num and pred_cr <= data["seq_max_coverage_rate"] - 1e-2:
+                
-                retry += 1
+                last_pred_cr = pred_cr
-                retry_duplication_pose.append(pred_pose.cpu().numpy().tolist())
+                pts_num = voxel_downsampled_combined_scanned_pts_np.shape[0]
-                Log.red(f"delta pts num < {self.min_new_pts_num}:, {pts_num}, {last_pts_num}")
+                Log.info(f"delta pts num:,{pts_num - last_pts_num },{pts_num}, {last_pts_num}")
            elif pts_num - last_pts_num < self.min_new_pts_num and pred_cr > data["seq_max_coverage_rate"] - 1e-2:
                success += 1
                Log.success(f"delta pts num < {self.min_new_pts_num}:, {pts_num}, {last_pts_num}")
-            last_pts_num = pts_num
+                if pts_num - last_pts_num < self.min_new_pts_num and pred_cr <= data["seq_max_coverage_rate"] - 1e-2:
                    retry += 1
                    retry_duplication_pose.append(pred_pose.cpu().numpy().tolist())
                    Log.red(f"delta pts num < {self.min_new_pts_num}:, {pts_num}, {last_pts_num}")
                elif pts_num - last_pts_num < self.min_new_pts_num and pred_cr > data["seq_max_coverage_rate"] - 1e-2:
                    success += 1
                    Log.success(f"delta pts num < {self.min_new_pts_num}:, {pts_num}, {last_pts_num}")
                last_pts_num = pts_num
        input_data["scanned_n_to_world_pose_9d"] = input_data["scanned_n_to_world_pose_9d"][0].cpu().numpy().tolist()
--- a/runners/simulator.py
+++ b/runners/simulator.py
@@ -0,0 +1,456 @@
 import pybullet as p
 import pybullet_data
 import numpy as np
 import os
 import time
 from PytorchBoot.runners.runner import Runner
 import PytorchBoot.stereotype as stereotype
 from PytorchBoot.config import ConfigManager
 from utils.control import ControlUtil
@stereotype.runner("simulator")
 class Simulator(Runner):
    # Command names accepted by run().
    CREATE: str = "create"
    SIMULATE: str = "simulate"
    # 4x4 homogeneous matrix (last row 0, 0, 0, 1). Presumably the initial
    # gripper pose; it is not referenced in the visible part of this class --
    # TODO confirm the frame it is expressed in.
    INIT_GRIPPER_POSE:np.ndarray = np.asarray(
        [[0.41869126  ,0.87596275 , 0.23951774 , 0.36005292],
        [ 0.70787907 ,-0.4800251  , 0.51813998 ,-0.40499909],
        [ 0.56884584, -0.04739109 ,-0.82107382  ,0.76881103],
        [ 0.         , 0.    ,      0.      ,    1.        ]])
    # 4x4 homogeneous transform with identity rotation and translation
    # (0.8, 0, 0.5). By its name it relates the turntable world frame to the
    # PyBullet world frame -- TODO confirm the direction of the mapping.
    TURNTABLE_WORLD_TO_PYBULLET_WORLD:np.ndarray = np.asarray(
        [[1, 0, 0, 0.8],
        [0, 1, 0, 0],
        [0, 0, 1, 0.5],
        [0, 0, 0, 1]])
    # Hard-coded 4x4 pose read by simulate() for debugging.
    debug_pose = np.asarray([
        [
            0.992167055606842,
            -0.10552699863910675,
            0.06684812903404236,
            -0.07388903945684433
        ],
        [
            0.10134342312812805,
            0.3670985698699951,
            -0.9246448874473572,
            -0.41582486033439636
        ],
        [
            0.07303514331579208,
            0.9241767525672913,
            0.37491756677627563,
            1.0754833221435547
        ],
        [
            0.0,
            0.0,
            0.0,
            1.0
        ]])
    def __init__(self, config_path):
        """Initialise the runner and cache the simulation settings.

        Args:
            config_path: Path of the configuration file; forwarded to the
                Runner base class and kept on the instance.
        """
        super().__init__(config_path)
        self.config_path = config_path

        # PyBullet body handles; create_env() fills them in.
        self.robot_id = None
        self.turntable_id = None
        self.target_id = None

        # Copy just the camera fields into a plain dict.
        camera_section = ConfigManager.get("simulation", "camera")
        camera_fields = ("width", "height", "fov", "near", "far")
        self.camera_params = {
            field: camera_section[field] for field in camera_fields
        }

        self.sim_config = ConfigManager.get("simulation")
    def run(self, cmd):
        """Execute one simulator command.

        Args:
            cmd: Simulator.CREATE connects to PyBullet and builds the scene;
                Simulator.SIMULATE runs the simulation loop. Any other value
                is only echoed and otherwise ignored.
        """
        print(f"Simulator run {cmd}")

        if cmd == self.CREATE:
            self.prepare_env()
            self.create_env()
            return

        if cmd == self.SIMULATE:
            self.simulate()
    def simulate(self):
        """Run the debug loop: command a fixed pose, let physics settle, take a picture.

        After reset() and init(), each cycle calls move_to() with the same
        hard-coded pose (identity with element [0, 0] set to -1 and a z
        translation of 0.5), steps the simulation a few times, calls
        take_picture() and steps once more.

        NOTE(review): reset(), init(), move_to() and take_picture() are
        defined outside this block; their contracts are assumed, not verified
        here. The class-level ``debug_pose`` is intentionally not read: the
        previous code multiplied it by an axis-flip matrix but never used the
        result.
        """
        cycles = 10000
        settle_steps = 20        # simulation steps run after each move
        settle_delay_s = 0.001   # pause between settle steps

        self.reset()
        self.init()

        for _cycle in range(cycles):
            # Rebuilt every cycle in case move_to() modifies its argument.
            target_pose = np.eye(4)
            target_pose[0, 0] = -1
            target_pose[2, 3] = 0.5
            self.move_to(target_pose)

            # Let the system stabilise before capturing.
            for _step in range(settle_steps):
                p.stepSimulation()
                time.sleep(settle_delay_s)

            # The captured images are not consumed by this debug loop.
            self.take_picture()
            p.stepSimulation()
    def prepare_env(self):
        """Connect to PyBullet in GUI mode and load the ground plane with zero gravity."""
        p.connect(p.GUI)

        # Lets loadURDF() resolve assets bundled with pybullet_data.
        bundled_assets = pybullet_data.getDataPath()
        p.setAdditionalSearchPath(bundled_assets)

        gravity = (0, 0, 0)
        p.setGravity(*gravity)

        p.loadURDF("plane.urdf")
    def create_env(self):
        """Load the robot, the turntable and the target object into PyBullet.

        Reads the "robot", "turntable" and "target" sections of the cached
        simulation config, creates the three bodies (all with zero mass),
        stores their ids on the instance and links the target to the
        turntable with a fixed constraint.

        Raises:
            AssertionError: If the target mesh file does not exist.
        """

        def zero_out_dynamics(body_id):
            # Same settings for every body: zero mass, no damping, no friction
            # on the base link (-1).
            p.changeDynamics(
                body_id,
                -1,
                mass=0,
                linearDamping=0,
                angularDamping=0,
                lateralFriction=0
            )

        print(self.config)
        robot_cfg = self.sim_config["robot"]
        table_cfg = self.sim_config["turntable"]
        target_cfg = self.sim_config["target"]

        # --- Robot (fixed base) ---
        self.robot_id = p.loadURDF(
            robot_cfg["urdf_path"],
            robot_cfg["initial_position"],
            p.getQuaternionFromEuler(robot_cfg["initial_orientation"]),
            useFixedBase=True
        )
        zero_out_dynamics(self.robot_id)

        # --- Turntable: a grey cylinder used for both visual and collision ---
        table_visual = p.createVisualShape(
            shapeType=p.GEOM_CYLINDER,
            radius=table_cfg["radius"],
            length=table_cfg["height"],
            rgbaColor=[0.7, 0.7, 0.7, 1]
        )
        table_collision = p.createCollisionShape(
            shapeType=p.GEOM_CYLINDER,
            radius=table_cfg["radius"],
            height=table_cfg["height"]
        )
        self.turntable_id = p.createMultiBody(
            baseMass=0,  # zero mass makes the body static
            baseCollisionShapeIndex=table_collision,
            baseVisualShapeIndex=table_visual,
            basePosition=table_cfg["center_position"]
        )
        zero_out_dynamics(self.turntable_id)

        # --- Target object loaded from <obj_dir>/<obj_name>/mesh.obj ---
        obj_path = os.path.join(target_cfg["obj_dir"], target_cfg["obj_name"], "mesh.obj")
        assert os.path.exists(obj_path), f"Error: File not found at {obj_path}"

        target_visual = p.createVisualShape(
            shapeType=p.GEOM_MESH,
            fileName=obj_path,
            rgbaColor=target_cfg["rgba_color"],
            specularColor=[0.4, 0.4, 0.4],
            meshScale=[target_cfg["scale"]] * 3
        )
        # The collision shape uses the same mesh, flagged as a concave trimesh.
        target_collision = p.createCollisionShape(
            shapeType=p.GEOM_MESH,
            fileName=obj_path,
            meshScale=[target_cfg["scale"]] * 3,
            flags=p.GEOM_FORCE_CONCAVE_TRIMESH
        )

        # Placed at the turntable centre, raised by the turntable height and
        # rotated by pi/2 about X.
        target_position = [
            table_cfg["center_position"][0],
            table_cfg["center_position"][1],
            table_cfg["height"] + table_cfg["center_position"][2]
        ]
        self.target_id = p.createMultiBody(
            baseMass=0,  # zero mass makes the body static
            baseCollisionShapeIndex=target_collision,
            baseVisualShapeIndex=target_visual,
            basePosition=target_position,
            baseOrientation=p.getQuaternionFromEuler([np.pi/2, 0, 0])
        )
        zero_out_dynamics(self.target_id)

        # --- Fixed constraint between the turntable base and the target base ---
        constraint_id = p.createConstraint(
            parentBodyUniqueId=self.turntable_id,
            parentLinkIndex=-1,  # base link
            childBodyUniqueId=self.target_id,
            childLinkIndex=-1,  # base link
            jointType=p.JOINT_FIXED,
            jointAxis=[0, 0, 0],
            parentFramePosition=[0, 0, 0],  # offset in the turntable frame
            childFramePosition=[0, 0, 0]  # offset in the target frame
        )
        # Cap the force the constraint may apply.
        p.changeConstraint(constraint_id, maxForce=100)
    def move_robot_to_pose(self, target_matrix):
        """Drive the arm towards an end-effector pose given as a 4x4 matrix.

        The pose is split into a position and an (x, y, z, w) quaternion, a
        joint solution is requested from PyBullet's inverse kinematics, and
        the first seven joints are moved there in 50 linearly interpolated
        position-control steps. After every step the contact points between
        the robot and the turntable are queried.

        Args:
            target_matrix: 4x4 homogeneous transform (NumPy array); the upper
                left 3x3 block is assumed to be a proper rotation matrix.

        Returns:
            True if all interpolation steps ran, False as soon as a contact
            between the robot and the turntable is reported.
        """
        ee_link_index = 7         # end-effector link used for IK
        arm_joint_count = 7       # joints driven by this method
        interpolation_steps = 50

        position = target_matrix[:3, 3]
        orientation = self._rotation_matrix_to_quaternion(target_matrix[:3, :3])

        # Joint limits for the IK call; getJointInfo fields 8 and 9 are the
        # lower and upper limit.
        # NOTE(review): limits are collected for every joint, including fixed
        # ones. PyBullet's null-space IK expects one entry per movable degree
        # of freedom -- confirm the list lengths match for this URDF.
        num_joints = p.getNumJoints(self.robot_id)
        lower_limits = []
        upper_limits = []
        for joint_index in range(num_joints):
            joint_info = p.getJointInfo(self.robot_id, joint_index)
            lower_limits.append(joint_info[8])
            upper_limits.append(joint_info[9])
        joint_ranges = [hi - lo for lo, hi in zip(lower_limits, upper_limits)]
        rest_poses = [0] * num_joints  # all-zero rest pose

        # The IK call itself does not consider collisions; contacts are only
        # checked while stepping below.
        joint_poses = p.calculateInverseKinematics(
            self.robot_id,
            ee_link_index,
            position,
            orientation,
            lowerLimits=lower_limits,
            upperLimits=upper_limits,
            jointRanges=joint_ranges,
            restPoses=rest_poses,
            maxNumIterations=100,
            residualThreshold=1e-4
        )

        current_poses = [
            p.getJointState(self.robot_id, i)[0] for i in range(arm_joint_count)
        ]
        for step in range(1, interpolation_steps + 1):
            fraction = step / interpolation_steps
            # Linear interpolation between the start and the IK solution.
            intermediate_poses = [
                current + (target - current) * fraction
                for current, target in zip(current_poses, joint_poses)
            ]
            for i in range(arm_joint_count):
                p.setJointMotorControl2(
                    self.robot_id,
                    i,
                    p.POSITION_CONTROL,
                    intermediate_poses[i]
                )
            p.stepSimulation()

            # Only robot/turntable contacts are checked.
            if p.getContactPoints(self.robot_id, self.turntable_id):
                print("检测到潜在碰撞，停止移动")
                return False
        return True

    @staticmethod
    def _rotation_matrix_to_quaternion(R):
        """Convert a 3x3 rotation matrix to an (x, y, z, w) quaternion with w >= 0.

        Divides by the largest quaternion component, chosen from the trace and
        the diagonal, so the result stays accurate for rotations at or near
        180 degrees, where w is close to zero and the antisymmetric terms
        R[i, j] - R[j, i] no longer determine the signs of x, y and z.
        """
        trace = R[0, 0] + R[1, 1] + R[2, 2]
        if trace > 0:
            s = 2.0 * np.sqrt(1.0 + trace)  # s == 4 * w
            w = 0.25 * s
            x = (R[2, 1] - R[1, 2]) / s
            y = (R[0, 2] - R[2, 0]) / s
            z = (R[1, 0] - R[0, 1]) / s
        elif R[0, 0] >= R[1, 1] and R[0, 0] >= R[2, 2]:
            s = 2.0 * np.sqrt(1.0 + R[0, 0] - R[1, 1] - R[2, 2])  # s == 4 * x
            w = (R[2, 1] - R[1, 2]) / s
            x = 0.25 * s
            y = (R[0, 1] + R[1, 0]) / s
            z = (R[0, 2] + R[2, 0]) / s
        elif R[1, 1] >= R[2, 2]:
            s = 2.0 * np.sqrt(1.0 + R[1, 1] - R[0, 0] - R[2, 2])  # s == 4 * y
            w = (R[0, 2] - R[2, 0]) / s
            x = (R[0, 1] + R[1, 0]) / s
            y = 0.25 * s
            z = (R[1, 2] + R[2, 1]) / s
        else:
            s = 2.0 * np.sqrt(1.0 + R[2, 2] - R[0, 0] - R[1, 1])  # s == 4 * z
            w = (R[1, 0] - R[0, 1]) / s
            x = (R[0, 2] + R[2, 0]) / s
            y = (R[1, 2] + R[2, 1]) / s
            z = 0.25 * s
        # q and -q describe the same rotation; keep w non-negative.
        if w < 0:
            x, y, z, w = -x, -y, -z, -w
        return (x, y, z, w)
    def rotate_turntable(self, angle_degrees):
        """Rotate the turntable and the target object about the world Z axis.

        The turntable keeps its position and gets the angle added to the third
        Euler component of its orientation. The target gets the same
        orientation change and its position is rotated around the turntable
        position.

        Args:
            angle_degrees: Rotation increment in degrees.
        """
        delta = np.radians(angle_degrees)

        def with_added_yaw(quaternion):
            # Quaternion -> Euler, bump the third component, back to quaternion.
            euler = list(p.getEulerFromQuaternion(quaternion))
            euler[2] += delta
            return p.getQuaternionFromEuler(euler)

        # Turntable: orientation change only.
        table_pos, table_quat = p.getBasePositionAndOrientation(self.turntable_id)
        p.resetBasePositionAndOrientation(
            self.turntable_id,
            table_pos,
            with_added_yaw(table_quat)
        )

        # Target: same orientation change ...
        target_pos, target_quat = p.getBasePositionAndOrientation(self.target_id)
        rotated_target_quat = with_added_yaw(target_quat)

        # ... and its offset from the turntable is rotated about Z.
        cos_t = np.cos(delta)
        sin_t = np.sin(delta)
        z_rotation = np.array([
            [cos_t, -sin_t, 0],
            [sin_t, cos_t, 0],
            [0, 0, 1]
        ])
        offset_from_table = np.array(target_pos) - np.array(table_pos)
        rotated_target_pos = np.array(table_pos) + z_rotation @ offset_from_table

        p.resetBasePositionAndOrientation(
            self.target_id,
            rotated_target_pos,
            rotated_target_quat
        )
    def get_camera_pose(self):
        """Derive look-at parameters for the camera from the state of link 7.

        The camera looks along the link's local z axis, sits 0.12 in front of
        the link position along that axis, and uses the link's local x axis
        as its up vector.

        Returns:
            tuple: ``(camera_pos, camera_target, camera_up)`` as NumPy
            vectors. ``camera_target`` is one unit ahead of ``camera_pos``
            along the viewing direction.
        """
        # Link 7 is used as the end effector (the original note says this is
        # the Franka end-effector link -- TODO confirm against the URDF).
        ee_link_index = 7
        link_state = p.getLinkState(self.robot_id, ee_link_index)
        ee_position, ee_quaternion = link_state[0], link_state[1]

        # Flat 9-element rotation from PyBullet -> 3x3 matrix.
        ee_rotation = np.array(p.getMatrixFromQuaternion(ee_quaternion)).reshape(3, 3)

        # Viewing direction: the link's local z axis expressed in the world frame.
        view_dir = ee_rotation @ np.array([0, 0, 1])
        # Up vector: the link's local x axis expressed in the world frame.
        camera_up = ee_rotation @ np.array([1, 0, 0])

        # The camera is mounted 0.12 ahead of the link along the viewing direction.
        mount_offset = 0.12
        camera_pos = np.array(ee_position) + view_dir * mount_offset
        camera_target = camera_pos + view_dir
        return camera_pos, camera_target, camera_up
    def take_picture(self):
        """Render a depth image and a segmentation mask from the current camera pose.

        The view matrix comes from ``get_camera_pose`` and the projection
        matrix from ``self.camera_params`` (keys ``fov``, ``width``,
        ``height``, ``near``, ``far``).

        Returns:
            tuple: ``(depth_img, segm_img)`` as ``(height, width)`` NumPy
            arrays. ``depth_img`` holds the depth buffer converted with the
            near/far planes; ``segm_img`` is the segmentation buffer returned
            by PyBullet.
        """
        camera_pos, camera_target, camera_up = self.get_camera_pose()
        params = self.camera_params
        width, height = params['width'], params['height']
        near, far = params['near'], params['far']

        view_matrix = p.computeViewMatrix(
            cameraEyePosition=camera_pos,
            cameraTargetPosition=camera_target,
            cameraUpVector=camera_up
        )
        projection_matrix = p.computeProjectionMatrixFOV(
            fov=params['fov'],
            aspect=width / height,
            nearVal=near,
            farVal=far
        )
        # The RGB buffer (third element) is not used by callers of this method.
        _, _, _, depth_buffer, segm_img = p.getCameraImage(
            width=width,
            height=height,
            viewMatrix=view_matrix,
            projectionMatrix=projection_matrix,
            renderer=p.ER_BULLET_HARDWARE_OPENGL
        )
        # Convert to arrays BEFORE doing arithmetic: PyBullet builds without
        # NumPy support return plain flat sequences, on which the depth
        # formula below would raise a TypeError. The reshape is a no-op when
        # PyBullet already returned (height, width) arrays.
        depth_buffer = np.asarray(depth_buffer).reshape(height, width)
        segm_img = np.array(segm_img).reshape(height, width)

        # Map the non-linear depth buffer to distances using the clip planes.
        depth_img = far * near / (far - (far - near) * depth_buffer)
        return depth_img, segm_img
    def reset(self):
        """Send the robot to the fixed reset pose.

        The pose is position ``[0.5, 0, 1]`` with the orientation given by
        Euler angles ``[pi, 0, 0]``. It is packed into a 4x4 homogeneous
        matrix and handed to ``move_robot_to_pose``, whose result is not
        propagated.
        """
        reset_quat = p.getQuaternionFromEuler([np.pi, 0, 0])
        reset_rotation = np.asarray(p.getMatrixFromQuaternion(reset_quat)).reshape(3, 3)

        reset_pose = np.eye(4)
        reset_pose[:3, :3] = reset_rotation
        reset_pose[:3, 3] = [0.5, 0, 1]
        self.move_robot_to_pose(reset_pose)
    def init(self):
        """Move to the class-level initial pose ``Simulator.INIT_GRIPPER_POSE``.

        The pose is passed to ``move_to`` as-is.
        """
        # NOTE(review): the constant is named a *gripper* pose, but move_to
        # forwards it to move_to_cam_pose as a camera pose -- confirm which
        # frame is intended.
        initial_pose = Simulator.INIT_GRIPPER_POSE
        self.move_to(initial_pose)
    def move_to(self, pose: np.ndarray):
        """Move the camera to ``pose`` after converting it to the PyBullet world frame.

        Args:
            pose: Pose matrix that is left-multiplied by
                ``Simulator.TURNTABLE_WORLD_TO_PYBULLET_WORLD``; presumably a
                4x4 camera pose expressed in the turntable world frame --
                TODO confirm against callers.
        """
        # NOTE: turntable-assisted planning is currently disabled. The
        # ControlUtil.solve_display_table_rot_and_cam_to_world(pose) call and
        # the follow-up rotate_turntable(delta_degree) step were commented
        # out, so the pose is executed directly without rotating the table.
        cam_to_pybullet_world = Simulator.TURNTABLE_WORLD_TO_PYBULLET_WORLD @ pose
        self.move_to_cam_pose(cam_to_pybullet_world)
    def __del__(self):
        """Disconnect from the PyBullet physics server when the object is collected."""
        # disconnect() raises when there is no active connection (for example
        # if connecting failed or the client was already closed), so only
        # call it while a connection is actually open.
        if p.isConnected():
            p.disconnect()
    def create_experiment(self, backup_name=None):
        """Create the experiment by delegating to the parent class.

        Args:
            backup_name: Forwarded unchanged to the parent implementation.

        Returns:
            Whatever the parent's ``create_experiment`` returns.
        """
        created = super().create_experiment(backup_name)
        return created
    def load_experiment(self, backup_name=None):
        """Load the experiment by delegating to the parent class.

        Args:
            backup_name: Forwarded unchanged to the parent implementation.
                The parent's return value is discarded.
        """
        parent = super()
        parent.load_experiment(backup_name)
    def move_to_cam_pose(self, camera_pose: np.ndarray):
        """Move the robot so that the camera ends up at ``camera_pose``.

        The gripper pose is derived from the camera pose with a fixed
        relation: identical orientation, and a position 0.12 behind the
        camera along the camera's z (viewing) axis.

        Args:
            camera_pose: Homogeneous camera pose; the upper-left 3x3 block is
                read as the rotation and the last column as the position.

        Returns:
            The result of ``move_robot_to_pose`` for the derived gripper pose.
        """
        cam_rotation = camera_pose[:3, :3]
        cam_position = camera_pose[:3, 3]

        # Viewing direction is the third column (z axis) of the rotation.
        view_dir = cam_rotation[:, 2]

        # Same orientation as the camera; step back 0.12 along the view axis
        # to get from the camera position to the gripper position.
        gripper_pose = np.eye(4)
        gripper_pose[:3, :3] = cam_rotation
        gripper_pose[:3, 3] = cam_position - view_dir * 0.12
        print(gripper_pose)

        return self.move_robot_to_pose(gripper_pose)
--- a/utils/control.py
+++ b/utils/control.py
@@ -0,0 +1,59 @@
 import numpy as np
 from scipy.spatial.transform import Rotation as R
 import time
 class ControlUtil:
    """Helpers for choosing a display-table rotation that makes a camera pose acceptable.

    A pose is acceptable when ``check_limit`` accepts its translation. When
    it is not, ``solve_display_table_rot_and_cam_to_world`` searches for the
    smallest rotation about z that makes it acceptable.
    """

    # Absolute table rotation (degrees) chosen by the last successful search.
    # This is class-level state shared by every caller.
    curr_rotation = 0

    @staticmethod
    def check_limit(new_cam_to_world):
        """Return True if the pose's translation lies inside the allowed sector.

        The translation ``(x, y)`` is read from ``[0, 3]`` and ``[1, 3]``.
        It is accepted when ``x >= 0``, ``y <= 0`` and the angle
        ``atan2(|y|, |x|)`` lies within ``[0, 90]`` degrees (inclusive).

        Args:
            new_cam_to_world: Pose matrix indexable as ``[row, col]``.

        Returns:
            bool: Whether the position is within the limits.
        """
        x_pos = new_cam_to_world[0, 3]
        y_pos = new_cam_to_world[1, 3]
        if x_pos < 0 or y_pos > 0:
            return False
        min_angle = 0 / 180 * np.pi
        max_angle = 90 / 180 * np.pi
        # arctan2 instead of comparing y/x against tan(angle): it avoids the
        # division by zero at x == 0 and the meaningless tan(90 deg) bound,
        # so the x == 0 boundary is treated as exactly 90 degrees.
        angle = np.arctan2(abs(y_pos), abs(x_pos))
        return bool(min_angle <= angle <= max_angle)

    @staticmethod
    def solve_display_table_rot_and_cam_to_world(cam_to_world: np.ndarray) -> tuple:
        """Find the smallest table rotation that brings the pose within limits.

        If ``cam_to_world`` already passes ``check_limit`` it is returned
        unchanged with a rotation of 0. Otherwise rotations about z are
        sampled over (0, 360] degrees, each is applied by left-multiplying
        the pose, and the valid rotation with the smallest magnitude is kept.
        Rotations above 180 are expressed as negative angles.

        Args:
            cam_to_world: 4x4 camera pose.

        Returns:
            tuple: ``(delta_degree, new_cam_to_world)``. When a search was
            needed, ``delta_degree`` is the chosen rotation minus
            ``ControlUtil.curr_rotation``, and ``curr_rotation`` is updated
            to the chosen rotation.

        Raises:
            ValueError: If no sampled rotation yields a valid pose.
        """
        if ControlUtil.check_limit(cam_to_world):
            # NOTE(review): this early return reports a delta of 0 without
            # consulting or updating curr_rotation -- confirm that is the
            # intended behaviour when the table is already rotated.
            return 0, cam_to_world

        best_rot = None
        best_cam_to_world = None
        for display_table_rot in np.linspace(0.1, 360, 1800):
            new_world_to_world = ControlUtil.get_z_axis_rot_mat(display_table_rot)
            new_cam_to_world = new_world_to_world @ cam_to_world
            if not ControlUtil.check_limit(new_cam_to_world):
                continue
            # Express the rotation in (-180, 180] so that magnitudes are
            # comparable. Comparing magnitudes (not signed values) is what
            # lets a later, smaller wrap-around rotation replace an earlier
            # one; the signed comparison used before got stuck on the first
            # negative candidate.
            if display_table_rot <= 180:
                signed_rot = display_table_rot
            else:
                signed_rot = display_table_rot - 360
            if best_rot is None or abs(signed_rot) < abs(best_rot):
                best_rot, best_cam_to_world = signed_rot, new_cam_to_world

        if best_cam_to_world is None:
            raise ValueError("No valid display table rotation found")

        delta_degree = best_rot - ControlUtil.curr_rotation
        ControlUtil.curr_rotation = best_rot
        return delta_degree, best_cam_to_world

    @staticmethod
    def get_z_axis_rot_mat(degree):
        """Return the 4x4 homogeneous matrix for a rotation of ``degree`` degrees about z."""
        radian = np.radians(degree)
        cos_r, sin_r = np.cos(radian), np.sin(radian)
        return np.array([
            [cos_r, -sin_r, 0, 0],
            [sin_r, cos_r, 0, 0],
            [0, 0, 1, 0],
            [0, 0, 0, 1]
            ])
--- a/utils/render.py
+++ b/utils/render.py
@@ -70,7 +70,7 @@ class RenderUtil:
    @staticmethod
    def render_pts(cam_pose, scene_path, script_path, scan_points, voxel_threshold=0.005, filter_degree=75, nO_to_nL_pose=None, require_full_scene=False):
-        
+        import ipdb; ipdb.set_trace()
        nO_to_world_pose = DataLoadUtil.get_real_cam_O_from_cam_L(cam_pose, nO_to_nL_pose, scene_path=scene_path)
@@ -88,6 +88,7 @@ class RenderUtil:
                '/home/hofee/blender-4.0.2-linux-x64/blender', '-b', '-P', script_path, '--', temp_dir
            ], capture_output=True, text=True)
            #print(result)
            #import ipdb; ipdb.set_trace()
            path = os.path.join(temp_dir, "tmp")
            cam_info = DataLoadUtil.load_cam_info(path, binocular=True)
            depth_L, depth_R = DataLoadUtil.load_depth(
--- a/utils/vis.py
+++ b/utils/vis.py
@@ -7,6 +7,7 @@ import trimesh
 sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
 from utils.data_load import DataLoadUtil
 from utils.pts import PtsUtil
 from utils.pose import PoseUtil
 class visualizeUtil:
@@ -33,7 +34,22 @@ class visualizeUtil:
        all_cam_axis = np.array(all_cam_axis).reshape(-1, 3)
        np.savetxt(os.path.join(output_dir, "all_cam_pos.txt"), all_cam_pos)
        np.savetxt(os.path.join(output_dir, "all_cam_axis.txt"), all_cam_axis)
-        
+    
    @staticmethod
    def get_cam_pose_and_cam_axis(cam_pose, is_6d_pose):
        if is_6d_pose:
            matrix_cam_pose = np.eye(4)
            matrix_cam_pose[:3,:3] = PoseUtil.rotation_6d_to_matrix_numpy(cam_pose[:6])
            matrix_cam_pose[:3, 3] = cam_pose[6:]
        else:
            matrix_cam_pose = cam_pose
        cam_pos = matrix_cam_pose[:3, 3]
        cam_axis = matrix_cam_pose[:3, 2]
        num_samples = 10
        sample_points = [cam_pos + 0.02*t * cam_axis for t in range(num_samples)]
        sample_points = np.array(sample_points)
        return cam_pos, sample_points
    @staticmethod
    def save_all_combined_pts(root, scene, output_dir):
        length = DataLoadUtil.get_scene_seq_length(root, scene)
Author	SHA1	Message	Date
hofee	1a0e3c8042	sim control	2025-04-09 15:17:24 +08:00
hofee	2fcc650eb7	solve conflicts	2025-03-13 14:49:35 +08:00
hofee	b20fa8bb75	update strong pointnet++	2025-03-13 14:48:15 +08:00
hofee	d7fb64ed13	update strong p++	2025-01-23 08:58:10 +00:00
hofee	5a03659112	update inference server	2025-01-07 19:32:02 +08:00
hofee	fca984e76b	Merge branch 'ab_global_only' of http://git.hofee.top/hofee/nbv_reconstruction into ab_global_only	2025-01-05 23:57:43 +08:00
hofee	dec67e8255	upd inference	2025-01-05 23:57:33 +08:00
hofee	9c2625b11e	upd	2024-12-31 02:52:46 +08:00
hofee	2dfb6c57ce	upd	2024-12-31 02:51:42 +08:00