Update config.json
Browse files- config.json +4 -5
config.json
CHANGED
@@ -56,16 +56,16 @@
|
|
56 |
},
|
57 |
"vision_config": {
|
58 |
"model_type": "davit",
|
59 |
-
"drop_path_rate": 0.1,
|
60 |
"patch_size": [7, 3, 3, 3],
|
61 |
"patch_stride": [4, 2, 2, 2],
|
62 |
"patch_padding": [3, 1, 1, 1],
|
63 |
"patch_prenorm": [false, true, true, true],
|
64 |
-
"enable_checkpoint": false,
|
65 |
"dim_embed": [256, 512, 1024, 2048],
|
66 |
"num_heads": [8, 16, 32, 64],
|
67 |
"num_groups": [8, 16, 32, 64],
|
68 |
-
"depths": [1, 1, 9, 1],
|
69 |
"window_size": 12,
|
70 |
"projection_dim": 1024,
|
71 |
"visual_temporal_embedding": {
|
@@ -79,7 +79,6 @@
|
|
79 |
"image_feature_source": ["spatial_avg_pool", "temporal_avg_pool"]
|
80 |
},
|
81 |
"vocab_size": 51289,
|
82 |
-
"
|
83 |
-
"transformers_version": "4.41.0.dev0",
|
84 |
"is_encoder_decoder": true
|
85 |
}
|
|
|
56 |
},
|
57 |
"vision_config": {
|
58 |
"model_type": "davit",
|
59 |
+
"drop_path_rate": 0.1,
|
60 |
"patch_size": [7, 3, 3, 3],
|
61 |
"patch_stride": [4, 2, 2, 2],
|
62 |
"patch_padding": [3, 1, 1, 1],
|
63 |
"patch_prenorm": [false, true, true, true],
|
64 |
+
"enable_checkpoint": false,
|
65 |
"dim_embed": [256, 512, 1024, 2048],
|
66 |
"num_heads": [8, 16, 32, 64],
|
67 |
"num_groups": [8, 16, 32, 64],
|
68 |
+
"depths": [1, 1, 9, 1],
|
69 |
"window_size": 12,
|
70 |
"projection_dim": 1024,
|
71 |
"visual_temporal_embedding": {
|
|
|
79 |
"image_feature_source": ["spatial_avg_pool", "temporal_avg_pool"]
|
80 |
},
|
81 |
"vocab_size": 51289,
|
82 |
+
"transformers_version": "4.48.3",
|
|
|
83 |
"is_encoder_decoder": true
|
84 |
}
|