Commit
·
d60c9ff
1
Parent(s):
e5ecbf3
Add model
Browse files- config.json +45 -56
config.json
CHANGED
|
@@ -2145,51 +2145,19 @@
|
|
| 2145 |
"typical_p": 1.0,
|
| 2146 |
"use_bfloat16": false
|
| 2147 |
},
|
| 2148 |
-
"
|
| 2149 |
-
|
| 2150 |
-
|
| 2151 |
-
|
| 2152 |
-
|
| 2153 |
-
|
| 2154 |
-
|
| 2155 |
-
|
| 2156 |
-
|
| 2157 |
-
|
| 2158 |
-
|
| 2159 |
-
|
| 2160 |
-
|
| 2161 |
-
"pre_norm": false,
|
| 2162 |
-
"query_dec_layers": 2,
|
| 2163 |
-
"use_task_norm": true
|
| 2164 |
-
},
|
| 2165 |
-
"general_config": {
|
| 2166 |
-
"class_weight": 2.0,
|
| 2167 |
-
"contrastive_temperature": 0.07,
|
| 2168 |
-
"contrastive_weight": 0.5,
|
| 2169 |
-
"deep_supervision": true,
|
| 2170 |
-
"dice_weight": 5.0,
|
| 2171 |
-
"ignore_value": 255,
|
| 2172 |
-
"importance_sample_ratio": 0.75,
|
| 2173 |
-
"init_std": 0.02,
|
| 2174 |
-
"init_xavier_std": 1.0,
|
| 2175 |
-
"is_train": false,
|
| 2176 |
-
"layer_norm_eps": 1e-05,
|
| 2177 |
-
"mask_weight": 5.0,
|
| 2178 |
-
"no_object_weight": 0.1,
|
| 2179 |
-
"num_classes": 133,
|
| 2180 |
-
"num_queries": 150,
|
| 2181 |
-
"output_auxiliary_logits": true,
|
| 2182 |
-
"oversample_ratio": 3.0,
|
| 2183 |
-
"strides": [
|
| 2184 |
-
4,
|
| 2185 |
-
8,
|
| 2186 |
-
16,
|
| 2187 |
-
32
|
| 2188 |
-
],
|
| 2189 |
-
"train_num_points": 12544,
|
| 2190 |
-
"use_auxiliary_loss": true
|
| 2191 |
-
},
|
| 2192 |
-
"hidden_size": 256,
|
| 2193 |
"id2label": {
|
| 2194 |
"0": "person",
|
| 2195 |
"1": "bicycle",
|
|
@@ -2325,8 +2293,11 @@
|
|
| 2325 |
"131": "wall-other-merged",
|
| 2326 |
"132": "rug-merged"
|
| 2327 |
},
|
|
|
|
|
|
|
| 2328 |
"init_std": 0.02,
|
| 2329 |
"init_xavier_std": 1.0,
|
|
|
|
| 2330 |
"label2id": {
|
| 2331 |
"airplane": 4,
|
| 2332 |
"apple": 47,
|
|
@@ -2462,21 +2433,39 @@
|
|
| 2462 |
"wine glass": 40,
|
| 2463 |
"zebra": 22
|
| 2464 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2465 |
"model_type": "oneformer",
|
|
|
|
|
|
|
| 2466 |
"num_attention_heads": 8,
|
|
|
|
| 2467 |
"num_hidden_layers": 10,
|
|
|
|
| 2468 |
"output_attentions": true,
|
|
|
|
| 2469 |
"output_hidden_states": true,
|
| 2470 |
-
"
|
| 2471 |
-
|
| 2472 |
-
|
| 2473 |
-
|
| 2474 |
-
|
| 2475 |
-
|
| 2476 |
-
|
| 2477 |
-
|
| 2478 |
-
|
| 2479 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2480 |
"torch_dtype": "float32",
|
| 2481 |
-
"
|
|
|
|
|
|
|
|
|
|
| 2482 |
}
|
|
|
|
| 2145 |
"typical_p": 1.0,
|
| 2146 |
"use_bfloat16": false
|
| 2147 |
},
|
| 2148 |
+
"class_weight": 2.0,
|
| 2149 |
+
"common_stride": 4,
|
| 2150 |
+
"contrastive_temperature": 0.07,
|
| 2151 |
+
"contrastive_weight": 0.5,
|
| 2152 |
+
"conv_dim": 256,
|
| 2153 |
+
"decoder_layers": 10,
|
| 2154 |
+
"dice_weight": 5.0,
|
| 2155 |
+
"dim_feedforward": 2048,
|
| 2156 |
+
"dropout": 0.1,
|
| 2157 |
+
"encoder_feedforward_dim": 1024,
|
| 2158 |
+
"encoder_layers": 6,
|
| 2159 |
+
"enforce_input_proj": false,
|
| 2160 |
+
"hidden_dim": 256,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2161 |
"id2label": {
|
| 2162 |
"0": "person",
|
| 2163 |
"1": "bicycle",
|
|
|
|
| 2293 |
"131": "wall-other-merged",
|
| 2294 |
"132": "rug-merged"
|
| 2295 |
},
|
| 2296 |
+
"ignore_value": 255,
|
| 2297 |
+
"importance_sample_ratio": 0.75,
|
| 2298 |
"init_std": 0.02,
|
| 2299 |
"init_xavier_std": 1.0,
|
| 2300 |
+
"is_training": false,
|
| 2301 |
"label2id": {
|
| 2302 |
"airplane": 4,
|
| 2303 |
"apple": 47,
|
|
|
|
| 2433 |
"wine glass": 40,
|
| 2434 |
"zebra": 22
|
| 2435 |
},
|
| 2436 |
+
"layer_norm_eps": 1e-05,
|
| 2437 |
+
"mask_dim": 256,
|
| 2438 |
+
"mask_weight": 5.0,
|
| 2439 |
+
"max_seq_len": 77,
|
| 2440 |
"model_type": "oneformer",
|
| 2441 |
+
"no_object_weight": 0.1,
|
| 2442 |
+
"norm": "GN",
|
| 2443 |
"num_attention_heads": 8,
|
| 2444 |
+
"num_classes": 133,
|
| 2445 |
"num_hidden_layers": 10,
|
| 2446 |
+
"num_queries": 150,
|
| 2447 |
"output_attentions": true,
|
| 2448 |
+
"output_auxiliary_logits": true,
|
| 2449 |
"output_hidden_states": true,
|
| 2450 |
+
"oversample_ratio": 3.0,
|
| 2451 |
+
"pre_norm": false,
|
| 2452 |
+
"query_dec_layers": 2,
|
| 2453 |
+
"strides": [
|
| 2454 |
+
4,
|
| 2455 |
+
8,
|
| 2456 |
+
16,
|
| 2457 |
+
32
|
| 2458 |
+
],
|
| 2459 |
+
"task_seq_len": 77,
|
| 2460 |
+
"text_encoder_context_length": 77,
|
| 2461 |
+
"text_encoder_n_ctx": 16,
|
| 2462 |
+
"text_encoder_num_layers": 6,
|
| 2463 |
+
"text_encoder_proj_layers": 2,
|
| 2464 |
+
"text_encoder_vocab_size": 49408,
|
| 2465 |
+
"text_encoder_width": 256,
|
| 2466 |
"torch_dtype": "float32",
|
| 2467 |
+
"train_num_points": 12544,
|
| 2468 |
+
"transformers_version": null,
|
| 2469 |
+
"use_auxiliary_loss": true,
|
| 2470 |
+
"use_task_norm": true
|
| 2471 |
}
|