krishauser
diff --git a/GEMstack/scripts/geotag_from_files.py b/GEMstack/offboard/geo_tagging/geotag_from_files.py
rename from GEMstack/scripts/geotag_from_files.py
rename to GEMstack/offboard/geo_tagging/geotag_from_files.py
diff --git a/GEMstack/scripts/geotag_from_rosbag.py b/GEMstack/offboard/geo_tagging/geotag_from_rosbag.py
rename from GEMstack/scripts/geotag_from_rosbag.py
rename to GEMstack/offboard/geo_tagging/geotag_from_rosbag.py
diff --git a/GEMstack/scripts/register_lidar_scans.py b/GEMstack/offboard/geo_tagging/register_lidar_scans.py
rename from GEMstack/scripts/register_lidar_scans.py
rename to GEMstack/offboard/geo_tagging/register_lidar_scans.py
diff --git a/GEMstack/offboard/mast3r_3d_reconstruction/mast3r_runner.py b/GEMstack/offboard/mast3r_3d_reconstruction/mast3r_runner.py
Lines changed: 8 additions & 8 deletions
diff --git a/GEMstack/offboard/mast3r_3d_reconstruction/scale_pointcloud_based_on_geotag.py b/GEMstack/offboard/mast3r_3d_reconstruction/scale_pointcloud_based_on_geotag.py
Lines changed: 44 additions & 36 deletions
diff --git a/GEMstack/scripts/__init__.py b/GEMstack/scripts/__init__.py
@@ -23,12 +23,12 @@
 from mast3r.retrieval.processor import Retriever
 
 import mast3r.utils.path_to_dust3r  # noqa
-from dust3r.dust3r.utils.geometry import inv, geotrf  # noqa
-from dust3r.dust3r.utils.image import load_images
-from dust3r.dust3r.utils.device import to_numpy
-from dust3r.dust3r.viz import add_scene_cam, CAM_COLORS, OPENGL, pts3d_to_trimesh, cat_meshes
-from dust3r.dust3r.demo import get_args_parser as dust3r_get_args_parser
-from dust3r.dust3r.cloud_opt.base_opt import clean_pointcloud
+from dust3r.utils.geometry import inv, geotrf  # noqa
+from dust3r.utils.image import load_images
+from dust3r.utils.device import to_numpy
+from dust3r.viz import add_scene_cam, CAM_COLORS, OPENGL, pts3d_to_trimesh, cat_meshes
+from dust3r.demo import get_args_parser as dust3r_get_args_parser
+from dust3r.cloud_opt.base_opt import clean_pointcloud
 
 import matplotlib.pyplot as pl
 import open3d as o3d
@@ -314,9 +314,9 @@ def convert_scene_output_to_ply_impl(outfile, imgs, pts3d, mask, scale=1.0, appl
     pcd = o3d.geometry.PointCloud()
     pcd.points = o3d.utility.Vector3dVector(all_pts)
     pcd.colors = o3d.utility.Vector3dVector(all_colors)
-
+    print('cwd', os.getcwd())
     # Save to .ply
-    o3d.io.write_point_cloud(outfile, pcd)
+    o3d.io.write_point_cloud(os.path.join(os.getcwd(), outfile), pcd)
     if not silent:
         print(f"✅ Exported scaled point cloud to: {outfile}")
 
 
@@ -2,8 +2,8 @@
 from itertools import combinations
 from pathlib import Path
 import numpy as np
-from mast3r.mast3r.model import AsymmetricMASt3R
-from mast3r.mast3r.utils.misc import hash_md5
+from mast3r.model import AsymmetricMASt3R
+from mast3r.utils.misc import hash_md5
 from pyproj import Transformer
 import numpy as np
 from PIL import Image
@@ -23,7 +23,7 @@
 import open3d as o3d
 from scipy.spatial.transform import Rotation
 
-from mast3r.mast3r.demo import get_args_parser, main_demo
+from mast3r.demo import get_args_parser, main_demo
 import argparse
 from mast3r_runner import get_reconstructed_scene, convert_scene_output_to_ply
 
@@ -238,34 +238,35 @@ def get_context(tmp_dir):
                                   args.scenegraph_type, args.winsize, args.win_cyclic, args.refid, 0, args.shared_intrinsics)
     return scene_state, outfile
 
-def add_parse_args(parser):
-    parser.add_argument('--folder_path', type=str, required=True)
-    parser.add_argument('--output_path', type=str, required=True)
-    parser.add_argument('--scale_method', type=str, required=True)
-
-    parser.add_argument('--weights_path', type=str, required=True, help='Path to the core mast3rweights file')
-    parser.add_argument('--retrieval_model', type=str, required=True, help='Retrieval model weights path that is used to make image pairs')
-    parser.add_argument('--device', type=str, required=True, help='Device to run the model on')
-    parser.add_argument('--silent', type=bool, required=True, help='Whether to run the model silently')
-    parser.add_argument('--image_size', type=int, required=True, help='Image size')
-    parser.add_argument('--optim_level', type=int, required=True, help='Optimization level')
-    parser.add_argument('--lr1', type=float, required=True, help='Learning rate for the first refinement iteration stage')
-    parser.add_argument('--niter1', type=int, required=True, help='Number of iterations for the first refinement iteration stage')
-    parser.add_argument('--lr2', type=float, required=True, help='Learning rate for the second refinement iteration stage')
-    parser.add_argument('--niter2', type=int, required=True, help='Number of iterations for the second refinement iteration stage')
-    parser.add_argument('--min_conf_thr', type=float, required=True, help='Minimum confidence threshold')
-    parser.add_argument('--matching_conf_thr', type=float, required=True, help='Matching confidence threshold')
-    # parser.add_argument('--as_pointcloud', type=bool, required=True, help='Whether to output a pointcloud')
-    # parser.add_argument('--mask_sky', type=bool, required=True, help='Whether to mask the sky')
-    parser.add_argument('--clean_depth', type=bool, required=True, help='Whether to clean the depth')
-    parser.add_argument('--transparent_cams', type=bool, required=True, help='Whether to make the cameras transparent')
-    parser.add_argument('--cam_size', type=float, required=True, help='Camera size')
-    parser.add_argument('--scenegraph_type', type=str, required=True, help='Scenegraph type')
-    parser.add_argument('--winsize', type=int, required=True, help='Window size for sliding window pair making scenegraph_type')
-    parser.add_argument('--win_cyclic', type=bool, required=True, help='Whether to use a cyclic sliding window')
-    parser.add_argument('--refid', type=str, required=True, help='Reference image for retrieval')
-    # parser.add_argument('--TSDF_thresh', type=float, required=True, help='TSDF refinement threshold')
-    parser.add_argument('--shared_intrinsics', type=bool, required=True, help='Whether to use a shared intrinsics model')
+def add_parse_args(parser, is_scene_path=False):
+    parser.add_argument('--folder_path', type=str, required=True, help='Path to the folder containing the images')
+    parser.add_argument('--output_path', type=str, required=True, help='Path to the output file')
+    parser.add_argument('--scale_method', type=str, required=True, help='Method to use for scale estimation')
+    parser.add_argument('--scene_path', type=str, required=False, help='Path to the scene file')
+    if not is_scene_path:
+        parser.add_argument('--weights_path', type=str, required=True, help='Path to the core mast3rweights file')
+        # parser.add_argument('--retrieval_model', type=str, required=True, help='Retrieval model weights path that is used to make image pairs')
+        # parser.add_argument('--device', type=str, required=True, help='Device to run the model on')
+        # parser.add_argument('--silent', type=bool, required=True, help='Whether to run the model silently')
+        # parser.add_argument('--image_size', type=int, required=True, help='Image size')
+        parser.add_argument('--optim_level', type=int, required=True, help='Optimization level')
+        parser.add_argument('--lr1', type=float, required=True, help='Learning rate for the first refinement iteration stage')
+        parser.add_argument('--niter1', type=int, required=True, help='Number of iterations for the first refinement iteration stage')
+        parser.add_argument('--lr2', type=float, required=True, help='Learning rate for the second refinement iteration stage')
+        parser.add_argument('--niter2', type=int, required=True, help='Number of iterations for the second refinement iteration stage')
+        parser.add_argument('--min_conf_thr', type=float, required=True, help='Minimum confidence threshold')
+        parser.add_argument('--matching_conf_thr', type=float, required=True, help='Matching confidence threshold')
+        # parser.add_argument('--as_pointcloud', type=bool, required=True, help='Whether to output a pointcloud')
+        # parser.add_argument('--mask_sky', type=bool, required=True, help='Whether to mask the sky')
+        parser.add_argument('--clean_depth', type=bool, required=True, help='Whether to clean the depth')
+        parser.add_argument('--transparent_cams', type=bool, required=True, help='Whether to make the cameras transparent')
+        parser.add_argument('--cam_size', type=float, required=True, help='Camera size')
+        parser.add_argument('--scenegraph_type', type=str, required=True, help='Scenegraph type')
+        parser.add_argument('--winsize', type=int, required=True, help='Window size for sliding window pair making scenegraph_type')
+        parser.add_argument('--win_cyclic', type=bool, required=True, help='Whether to use a cyclic sliding window')
+        parser.add_argument('--refid', type=str, required=True, help='Reference image for retrieval')
+        # parser.add_argument('--TSDF_thresh', type=float, required=True, help='TSDF refinement threshold')
+        parser.add_argument('--shared_intrinsics', type=bool, required=True, help='Whether to use a shared intrinsics model')
 
 
     return parser
@@ -281,16 +282,16 @@ def scale_pointcloud_based_on_geotag():
 
     if not args.scene_path:
         args_parser = get_args_parser()
-        args_parser = add_parse_args(args_parser)
+        args_parser = add_parse_args(args_parser, is_scene_path=False)
         args = args_parser.parse_args()
         scene, outfile = run_mast3r(args)
         scene.get_dense_pts3d()
         data = scene
     else:
         args_parser = argparse.ArgumentParser()
-        args_parser = add_parse_args(args_parser)
+        args_parser = add_parse_args(args_parser, is_scene_path=True)
         args = args_parser.parse_args()
-    
+        print('cwd', os.getcwd())
         with open(args.scene_path, 'rb') as f:
                     data = pickle.load(f)
 
@@ -305,11 +306,18 @@ def scale_pointcloud_based_on_geotag():
     }
     image_names = extract_image_names(data.img_paths)
     xyz_lookup = gps_to_xyz(gps_lookup)
+    scale = 1.0
     for method in ['ransac', 'median']:
         if method == 'ransac':
-            scale, sfm_dists, gps_dists = estimate_scale_ransac(camera_centers, xyz_lookup, image_names)
+            # print('camera_centers', camera_centers, )
+            # print('xyz_lookup', xyz_lookup)
+            # print('image_names', image_names)
+            scale, sfm_dists, gps_dists = estimate_scale_ransac(camera_centers.cpu().numpy(), xyz_lookup, image_names)
+            print('scale', scale)
+            print('sfm_dists', sfm_dists)
+            print('gps_dists', gps_dists)
         else:
-            scale, sfm_dists, gps_dists = estimate_3d_scale_from_gps(camera_centers, xyz_lookup, image_names)
+            scale, sfm_dists, gps_dists = estimate_3d_scale_from_gps(camera_centers.cpu().numpy(), xyz_lookup, image_names)
         print(f"Estimated scale: {scale}")
     convert_scene_output_to_ply(args.output_path, data, scale=scale, apply_y_flip=False)