Python-Depth-Est-AV2/dp-av2.py at main · computervisionpro/Python-Depth-Est-AV2 · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
import cv2
import torch
import numpy as np
#import matplotlib.pyplot as plt

from depth_anything_v2.dpt import DepthAnythingV2

DEVICE = 'cuda' if torch.cuda.is_available() else 'mps' if torch.backends.mps.is_available() else 'cpu'
#DEVICE='cpu'
print(DEVICE)


model_configs = {
    'vits': {'encoder': 'vits', 'features': 64, 'out_channels': [48, 96, 192, 384]},
    'vitb': {'encoder': 'vitb', 'features': 128, 'out_channels': [96, 192, 384, 768]},
    'vitl': {'encoder': 'vitl', 'features': 256, 'out_channels': [256, 512, 1024, 1024]},
    'vitg': {'encoder': 'vitg', 'features': 384, 'out_channels': [1536, 1536, 1536, 1536]}
}

encoder = 'vits' # or 'vits', 'vitb', 'vitg'

model = DepthAnythingV2(**model_configs[encoder])
model.load_state_dict(torch.load(f'checkpoints/depth_anything_v2_{encoder}.pth',  weights_only=True)) #, map_location='cpu'))
model = model.to(DEVICE).eval()

raw_img = cv2.imread('./assets/examples/demo03.jpg')
print(raw_img.shape)


depth = model.infer_image(raw_img) # HxW raw depth map in numpy
print(depth.shape)
print(depth.dtype)


# Normalize to [0, 255]
depth_normalized = cv2.normalize(depth, None, 0, 255, cv2.NORM_MINMAX)
depth_scaled = depth_normalized.astype(np.uint8)

depth_c = cv2.applyColorMap(depth_scaled, cv2.COLORMAP_INFERNO)
cv2.imwrite('oop.jpg', depth_c)


#cv2.imshow('gg', depth_c)

print(depth)