File size: 2,024 Bytes
79a1f97 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 |
{
"add_projection": false,
"architectures": [
"ZoeDepthForDepthEstimation"
],
"attractor_alpha": 1000,
"attractor_gamma": 2,
"attractor_kind": "mean",
"backbone": null,
"backbone_config": {
"hidden_size": 1024,
"image_size": 384,
"intermediate_size": 4096,
"model_type": "beit",
"num_attention_heads": 16,
"num_hidden_layers": 24,
"out_features": [
"stage6",
"stage12",
"stage18",
"stage24"
],
"out_indices": [
6,
12,
18,
24
],
"reshape_hidden_states": false,
"stage_names": [
"stem",
"stage1",
"stage2",
"stage3",
"stage4",
"stage5",
"stage6",
"stage7",
"stage8",
"stage9",
"stage10",
"stage11",
"stage12",
"stage13",
"stage14",
"stage15",
"stage16",
"stage17",
"stage18",
"stage19",
"stage20",
"stage21",
"stage22",
"stage23",
"stage24"
],
"use_relative_position_bias": true
},
"backbone_hidden_size": 1024,
"batch_norm_eps": 1e-05,
"bin_centers_type": "softplus",
"bin_configurations": [
{
"max_depth": 10.0,
"min_depth": 0.001,
"n_bins": 64,
"name": "nyu"
},
{
"max_depth": 80.0,
"min_depth": 0.001,
"n_bins": 64,
"name": "kitti"
}
],
"bin_embedding_dim": 128,
"bottleneck_features": 256,
"fusion_hidden_size": 256,
"head_in_index": -1,
"hidden_act": "gelu",
"initializer_range": 0.02,
"max_temp": 50.0,
"min_temp": 0.0212,
"model_type": "zoedepth",
"neck_hidden_sizes": [
256,
512,
1024,
1024
],
"num_attractors": [
16,
8,
4,
1
],
"readout_type": "project",
"reassemble_factors": [
4,
2,
1,
0.5
],
"torch_dtype": "float32",
"transformers_version": "4.41.0.dev0",
"use_batch_norm_in_fusion_residual": false,
"use_bias_in_fusion_residual": null,
"use_pretrained_backbone": false
}
|