app.py
    CHANGED
    
@@ -116,6 +116,7 @@ def generate_monocular_depth_maps(img_list, depth_prior_name):
         depth = pipe(image)["predicted_depth"].numpy()
         depth = cv2.resize(depth[0], image.size, interpolation=cv2.INTER_LANCZOS4)
         focallength_px = 200
+        print(depth.max(),depth.min())
         depth_list.append(depth)
         focallength_px_list.append(focallength_px)
         #np.savez_compressed(path_depthanything, depth=depth)
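
The only functional change in this hunk is the added print of the depth range, a quick sanity check against all-zero or NaN maps before the result is appended. A minimal sketch of the step in isolation, assuming `pipe` is a Hugging Face "depth-estimation" pipeline (the checkpoint name below is illustrative, not taken from this diff):

import cv2
from PIL import Image
from transformers import pipeline

# Assumed checkpoint; any depth-estimation model that returns a
# "predicted_depth" tensor behaves the same way here.
pipe = pipeline("depth-estimation", model="LiheYoung/depth-anything-small-hf")

image = Image.open("example/bear/00000.jpg")
depth = pipe(image)["predicted_depth"].numpy()  # shape (1, H', W'), hence depth[0] below
depth = cv2.resize(depth[0], image.size, interpolation=cv2.INTER_LANCZOS4)
print(depth.max(), depth.min())  # the debug line this hunk adds
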
@@ -138,6 +139,7 @@ def local_get_reconstructed_scene(filelist, min_conf_thr, as_pointcloud, mask_sk
     model = AsymmetricCroCo3DStereo.from_pretrained(weights_path).to(device)
     output = inference(pairs, model, device, batch_size=batch_size, verbose=not silent)
     mode = GlobalAlignerMode.PointCloudOptimizer
+    print(output)
     scene = global_aligner(output, device=device, mode=mode, verbose=not silent, shared_focal = True, temporal_smoothing_weight=0.01, translation_weight=1.0,
                            flow_loss_weight=0.01, flow_loss_start_epoch=0.1, flow_loss_thre=25, use_self_mask=True,
                            num_total_iter=300, empty_cache= len(filelist) > 72)
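
Here `print(output)` lands between pairwise inference and global alignment, so it dumps the raw pairwise predictions that `global_aligner` consumes. Since that dict holds full tensors, `print(output.keys())` is usually the gentler probe. A sketch of the surrounding flow, assuming the DUSt3R-style module layout this code follows (the import paths and the `make_pairs` call are assumptions, not shown in the diff):

from dust3r.image_pairs import make_pairs
from dust3r.inference import inference
from dust3r.cloud_opt import global_aligner, GlobalAlignerMode

# imgs: preprocessed frames; model and device as in the hunk above.
pairs = make_pairs(imgs, scene_graph='complete', symmetrize=True)
output = inference(pairs, model, device, batch_size=1, verbose=True)
print(output.keys())  # DUSt3R-style outputs expose 'view1', 'view2', 'pred1', 'pred2'

scene = global_aligner(output, device=device,
                       mode=GlobalAlignerMode.PointCloudOptimizer, verbose=True)
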
@@ -192,13 +194,6 @@ with gradio.Blocks(css=css, title=title, delete_cache=(gradio_delete_cache, grad
                     [os.path.join(HERE_PATH, 'example/bear/00000.jpg'),
                      os.path.join(HERE_PATH, 'example/bear/00001.jpg'),
                      os.path.join(HERE_PATH, 'example/bear/00002.jpg'),
-                     os.path.join(HERE_PATH, 'example/bear/00003.jpg'),
-                     os.path.join(HERE_PATH, 'example/bear/00004.jpg'),
-                     os.path.join(HERE_PATH, 'example/bear/00005.jpg'),
-                     os.path.join(HERE_PATH, 'example/bear/00006.jpg'),
-                     os.path.join(HERE_PATH, 'example/bear/00007.jpg'),
-                     os.path.join(HERE_PATH, 'example/bear/00008.jpg'),
-                     os.path.join(HERE_PATH, 'example/bear/00009.jpg'),
                      ]
                ],
                [
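
This hunk only trims the bear example from ten frames to three. Each inner list is one row of a gradio examples table, and the innermost list is the value handed to a multi-file input. A minimal sketch of the pattern, with the widget name assumed for illustration:

import os
import gradio

HERE_PATH = os.path.dirname(os.path.abspath(__file__))

with gradio.Blocks() as demo:
    inputfiles = gradio.File(file_count="multiple")  # assumed input widget
    # One example row; its single entry is the list of frame paths.
    frames = [os.path.join(HERE_PATH, f'example/bear/{i:05d}.jpg') for i in range(3)]
    gradio.Examples(examples=[[frames]], inputs=[inputfiles])
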
croco/models/__pycache__/pos_embed.cpython-311.pyc
    CHANGED

    Binary files a/croco/models/__pycache__/pos_embed.cpython-311.pyc and b/croco/models/__pycache__/pos_embed.cpython-311.pyc differ

third_party/RAFT/core/__pycache__/extractor.cpython-311.pyc
    CHANGED

    Binary files a/third_party/RAFT/core/__pycache__/extractor.cpython-311.pyc and b/third_party/RAFT/core/__pycache__/extractor.cpython-311.pyc differ

        third_party/RAFT/core/extractor.py
    CHANGED
    
@@ -312,7 +312,7 @@ class ResNetFPN(nn.Module):
                 nn.init.constant_(m.weight, 1)
             if m.bias is not None:
                 nn.init.constant_(m.bias, 0)
-
+        #print('****',args.pretrain, self.init_weight)
         if self.init_weight:
             from torchvision.models import resnet18, ResNet18_Weights, resnet34, ResNet34_Weights
             if args.pretrain == 'resnet18':
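
The touched block is `ResNetFPN`'s weight initialization: norm layers are reset to unit scale and zero bias, then, when `self.init_weight` is set, the backbone is seeded from torchvision's ImageNet checkpoints. The added line is a commented-out print that would log which pretrain branch runs. A hedged sketch of the pattern (the class internals are assumed, not copied from the file):

import torch.nn as nn
from torchvision.models import resnet18, ResNet18_Weights

def reset_norm_layers(module: nn.Module) -> None:
    # Mirrors the context lines above: unit scale, zero bias on norm layers.
    for m in module.modules():
        if isinstance(m, (nn.BatchNorm2d, nn.InstanceNorm2d, nn.GroupNorm)):
            if m.weight is not None:
                nn.init.constant_(m.weight, 1)
            if m.bias is not None:
                nn.init.constant_(m.bias, 0)

# The 'resnet18' branch then loads pretrained weights, roughly:
backbone = resnet18(weights=ResNet18_Weights.IMAGENET1K_V1)
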
