Ryukijano committed on
Commit
f8b8a9c
·
1 Parent(s): 3cc5a79

Upload MaskFormerForInstanceSegmentation

Browse files
Files changed (2) hide show
  1. config.json +437 -0
  2. pytorch_model.bin +3 -0
config.json ADDED
@@ -0,0 +1,437 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_commit_hash": "3325bd616fc2ef1c2e84aedacf8f7e37b8e6e8ce",
3
+ "_name_or_path": "Ryukijano/maskformer-swin-base-sceneparse-instance_collab",
4
+ "architectures": [
5
+ "MaskFormerForInstanceSegmentation"
6
+ ],
7
+ "backbone_config": {
8
+ "_name_or_path": "",
9
+ "add_cross_attention": false,
10
+ "architectures": null,
11
+ "attention_probs_dropout_prob": 0.0,
12
+ "bad_words_ids": null,
13
+ "begin_suppress_tokens": null,
14
+ "bos_token_id": null,
15
+ "chunk_size_feed_forward": 0,
16
+ "cross_attention_hidden_size": null,
17
+ "decoder_start_token_id": null,
18
+ "depths": [
19
+ 2,
20
+ 2,
21
+ 18,
22
+ 2
23
+ ],
24
+ "diversity_penalty": 0.0,
25
+ "do_sample": false,
26
+ "drop_path_rate": 0.3,
27
+ "early_stopping": false,
28
+ "embed_dim": 128,
29
+ "encoder_no_repeat_ngram_size": 0,
30
+ "encoder_stride": 32,
31
+ "eos_token_id": null,
32
+ "exponential_decay_length_penalty": null,
33
+ "finetuning_task": null,
34
+ "forced_bos_token_id": null,
35
+ "forced_eos_token_id": null,
36
+ "hidden_act": "gelu",
37
+ "hidden_dropout_prob": 0.0,
38
+ "hidden_size": 1024,
39
+ "id2label": {
40
+ "0": "LABEL_0",
41
+ "1": "LABEL_1"
42
+ },
43
+ "image_size": 384,
44
+ "in_channels": 3,
45
+ "initializer_range": 0.02,
46
+ "is_decoder": false,
47
+ "is_encoder_decoder": false,
48
+ "label2id": {
49
+ "LABEL_0": 0,
50
+ "LABEL_1": 1
51
+ },
52
+ "layer_norm_eps": 1e-05,
53
+ "length_penalty": 1.0,
54
+ "max_length": 20,
55
+ "min_length": 0,
56
+ "mlp_ratio": 4.0,
57
+ "model_type": "swin",
58
+ "no_repeat_ngram_size": 0,
59
+ "num_beam_groups": 1,
60
+ "num_beams": 1,
61
+ "num_channels": 3,
62
+ "num_heads": [
63
+ 4,
64
+ 8,
65
+ 16,
66
+ 32
67
+ ],
68
+ "num_layers": 4,
69
+ "num_return_sequences": 1,
70
+ "out_features": [
71
+ "stage4"
72
+ ],
73
+ "out_indices": [
74
+ 4
75
+ ],
76
+ "output_attentions": false,
77
+ "output_hidden_states": false,
78
+ "output_scores": false,
79
+ "pad_token_id": null,
80
+ "patch_size": 4,
81
+ "path_norm": true,
82
+ "prefix": null,
83
+ "pretrain_img_size": 384,
84
+ "problem_type": null,
85
+ "pruned_heads": {},
86
+ "qkv_bias": true,
87
+ "remove_invalid_values": false,
88
+ "repetition_penalty": 1.0,
89
+ "return_dict": true,
90
+ "return_dict_in_generate": false,
91
+ "sep_token_id": null,
92
+ "stage_names": [
93
+ "stem",
94
+ "stage1",
95
+ "stage2",
96
+ "stage3",
97
+ "stage4"
98
+ ],
99
+ "suppress_tokens": null,
100
+ "task_specific_params": null,
101
+ "temperature": 1.0,
102
+ "tf_legacy_loss": false,
103
+ "tie_encoder_decoder": false,
104
+ "tie_word_embeddings": true,
105
+ "tokenizer_class": null,
106
+ "top_k": 50,
107
+ "top_p": 1.0,
108
+ "torch_dtype": null,
109
+ "torchscript": false,
110
+ "transformers_version": "4.28.0.dev0",
111
+ "typical_p": 1.0,
112
+ "use_absolute_embeddings": false,
113
+ "use_bfloat16": false,
114
+ "window_size": 12
115
+ },
116
+ "ce_weight": 1.0,
117
+ "cross_entropy_weight": 1.0,
118
+ "decoder_config": {
119
+ "_commit_hash": null,
120
+ "_name_or_path": "",
121
+ "activation_dropout": 0.0,
122
+ "activation_function": "relu",
123
+ "add_cross_attention": false,
124
+ "architectures": null,
125
+ "attention_dropout": 0.0,
126
+ "auxiliary_loss": false,
127
+ "backbone": "resnet50",
128
+ "backbone_config": null,
129
+ "bad_words_ids": null,
130
+ "bbox_cost": 5,
131
+ "bbox_loss_coefficient": 5,
132
+ "begin_suppress_tokens": null,
133
+ "bos_token_id": null,
134
+ "chunk_size_feed_forward": 0,
135
+ "class_cost": 1,
136
+ "cross_attention_hidden_size": null,
137
+ "d_model": 256,
138
+ "decoder_attention_heads": 8,
139
+ "decoder_ffn_dim": 2048,
140
+ "decoder_layerdrop": 0.0,
141
+ "decoder_layers": 6,
142
+ "decoder_start_token_id": null,
143
+ "dice_loss_coefficient": 1,
144
+ "dilation": false,
145
+ "diversity_penalty": 0.0,
146
+ "do_sample": false,
147
+ "dropout": 0.1,
148
+ "early_stopping": false,
149
+ "encoder_attention_heads": 8,
150
+ "encoder_ffn_dim": 2048,
151
+ "encoder_layerdrop": 0.0,
152
+ "encoder_layers": 6,
153
+ "encoder_no_repeat_ngram_size": 0,
154
+ "eos_coefficient": 0.1,
155
+ "eos_token_id": null,
156
+ "exponential_decay_length_penalty": null,
157
+ "finetuning_task": null,
158
+ "forced_bos_token_id": null,
159
+ "forced_eos_token_id": null,
160
+ "giou_cost": 2,
161
+ "giou_loss_coefficient": 2,
162
+ "id2label": {
163
+ "0": "LABEL_0",
164
+ "1": "LABEL_1"
165
+ },
166
+ "init_std": 0.02,
167
+ "init_xavier_std": 1.0,
168
+ "is_decoder": false,
169
+ "is_encoder_decoder": true,
170
+ "label2id": {
171
+ "LABEL_0": 0,
172
+ "LABEL_1": 1
173
+ },
174
+ "length_penalty": 1.0,
175
+ "mask_loss_coefficient": 1,
176
+ "max_length": 20,
177
+ "max_position_embeddings": 1024,
178
+ "min_length": 0,
179
+ "model_type": "detr",
180
+ "no_repeat_ngram_size": 0,
181
+ "num_beam_groups": 1,
182
+ "num_beams": 1,
183
+ "num_channels": 3,
184
+ "num_hidden_layers": 6,
185
+ "num_queries": 100,
186
+ "num_return_sequences": 1,
187
+ "output_attentions": false,
188
+ "output_hidden_states": false,
189
+ "output_scores": false,
190
+ "pad_token_id": null,
191
+ "position_embedding_type": "sine",
192
+ "prefix": null,
193
+ "problem_type": null,
194
+ "pruned_heads": {},
195
+ "remove_invalid_values": false,
196
+ "repetition_penalty": 1.0,
197
+ "return_dict": true,
198
+ "return_dict_in_generate": false,
199
+ "scale_embedding": false,
200
+ "sep_token_id": null,
201
+ "suppress_tokens": null,
202
+ "task_specific_params": null,
203
+ "temperature": 1.0,
204
+ "tf_legacy_loss": false,
205
+ "tie_encoder_decoder": false,
206
+ "tie_word_embeddings": true,
207
+ "tokenizer_class": null,
208
+ "top_k": 50,
209
+ "top_p": 1.0,
210
+ "torch_dtype": null,
211
+ "torchscript": false,
212
+ "transformers_version": "4.17.0.dev0",
213
+ "typical_p": 1.0,
214
+ "use_bfloat16": false,
215
+ "use_pretrained_backbone": true,
216
+ "use_timm_backbone": true
217
+ },
218
+ "dice_weight": 1.0,
219
+ "fpn_feature_size": 256,
220
+ "id2label": {
221
+ "0": "bed",
222
+ "1": "windowpane",
223
+ "2": "cabinet",
224
+ "3": "person",
225
+ "4": "door",
226
+ "5": "table",
227
+ "6": "curtain",
228
+ "7": "chair",
229
+ "8": "car",
230
+ "9": "painting",
231
+ "10": "sofa",
232
+ "11": "shelf",
233
+ "12": "mirror",
234
+ "13": "armchair",
235
+ "14": "seat",
236
+ "15": "fence",
237
+ "16": "desk",
238
+ "17": "wardrobe",
239
+ "18": "lamp",
240
+ "19": "bathtub",
241
+ "20": "railing",
242
+ "21": "cushion",
243
+ "22": "box",
244
+ "23": "column",
245
+ "24": "signboard",
246
+ "25": "chest of drawers",
247
+ "26": "counter",
248
+ "27": "sink",
249
+ "28": "fireplace",
250
+ "29": "refrigerator",
251
+ "30": "stairs",
252
+ "31": "case",
253
+ "32": "pool table",
254
+ "33": "pillow",
255
+ "34": "screen door",
256
+ "35": "bookcase",
257
+ "36": "coffee table",
258
+ "37": "toilet",
259
+ "38": "flower",
260
+ "39": "book",
261
+ "40": "bench",
262
+ "41": "countertop",
263
+ "42": "stove",
264
+ "43": "palm",
265
+ "44": "kitchen island",
266
+ "45": "computer",
267
+ "46": "swivel chair",
268
+ "47": "boat",
269
+ "48": "arcade machine",
270
+ "49": "bus",
271
+ "50": "towel",
272
+ "51": "light",
273
+ "52": "truck",
274
+ "53": "chandelier",
275
+ "54": "awning",
276
+ "55": "streetlight",
277
+ "56": "booth",
278
+ "57": "television receiver",
279
+ "58": "airplane",
280
+ "59": "apparel",
281
+ "60": "pole",
282
+ "61": "bannister",
283
+ "62": "ottoman",
284
+ "63": "bottle",
285
+ "64": "van",
286
+ "65": "ship",
287
+ "66": "fountain",
288
+ "67": "washer",
289
+ "68": "plaything",
290
+ "69": "stool",
291
+ "70": "barrel",
292
+ "71": "basket",
293
+ "72": "bag",
294
+ "73": "minibike",
295
+ "74": "oven",
296
+ "75": "ball",
297
+ "76": "food",
298
+ "77": "step",
299
+ "78": "trade name",
300
+ "79": "microwave",
301
+ "80": "pot",
302
+ "81": "animal",
303
+ "82": "bicycle",
304
+ "83": "dishwasher",
305
+ "84": "screen",
306
+ "85": "sculpture",
307
+ "86": "hood",
308
+ "87": "sconce",
309
+ "88": "vase",
310
+ "89": "traffic light",
311
+ "90": "tray",
312
+ "91": "ashcan",
313
+ "92": "fan",
314
+ "93": "plate",
315
+ "94": "monitor",
316
+ "95": "bulletin board",
317
+ "96": "radiator",
318
+ "97": "glass",
319
+ "98": "clock",
320
+ "99": "flag"
321
+ },
322
+ "init_std": 0.02,
323
+ "init_xavier_std": 1.0,
324
+ "label2id": {
325
+ "airplane": 58,
326
+ "animal": 81,
327
+ "apparel": 59,
328
+ "arcade machine": 48,
329
+ "armchair": 13,
330
+ "ashcan": 91,
331
+ "awning": 54,
332
+ "bag": 72,
333
+ "ball": 75,
334
+ "bannister": 61,
335
+ "barrel": 70,
336
+ "basket": 71,
337
+ "bathtub": 19,
338
+ "bed": 0,
339
+ "bench": 40,
340
+ "bicycle": 82,
341
+ "boat": 47,
342
+ "book": 39,
343
+ "bookcase": 35,
344
+ "booth": 56,
345
+ "bottle": 63,
346
+ "box": 22,
347
+ "bulletin board": 95,
348
+ "bus": 49,
349
+ "cabinet": 2,
350
+ "car": 8,
351
+ "case": 31,
352
+ "chair": 7,
353
+ "chandelier": 53,
354
+ "chest of drawers": 25,
355
+ "clock": 98,
356
+ "coffee table": 36,
357
+ "column": 23,
358
+ "computer": 45,
359
+ "counter": 26,
360
+ "countertop": 41,
361
+ "curtain": 6,
362
+ "cushion": 21,
363
+ "desk": 16,
364
+ "dishwasher": 83,
365
+ "door": 4,
366
+ "fan": 92,
367
+ "fence": 15,
368
+ "fireplace": 28,
369
+ "flag": 99,
370
+ "flower": 38,
371
+ "food": 76,
372
+ "fountain": 66,
373
+ "glass": 97,
374
+ "hood": 86,
375
+ "kitchen island": 44,
376
+ "lamp": 18,
377
+ "light": 51,
378
+ "microwave": 79,
379
+ "minibike": 73,
380
+ "mirror": 12,
381
+ "monitor": 94,
382
+ "ottoman": 62,
383
+ "oven": 74,
384
+ "painting": 9,
385
+ "palm": 43,
386
+ "person": 3,
387
+ "pillow": 33,
388
+ "plate": 93,
389
+ "plaything": 68,
390
+ "pole": 60,
391
+ "pool table": 32,
392
+ "pot": 80,
393
+ "radiator": 96,
394
+ "railing": 20,
395
+ "refrigerator": 29,
396
+ "sconce": 87,
397
+ "screen": 84,
398
+ "screen door": 34,
399
+ "sculpture": 85,
400
+ "seat": 14,
401
+ "shelf": 11,
402
+ "ship": 65,
403
+ "signboard": 24,
404
+ "sink": 27,
405
+ "sofa": 10,
406
+ "stairs": 30,
407
+ "step": 77,
408
+ "stool": 69,
409
+ "stove": 42,
410
+ "streetlight": 55,
411
+ "swivel chair": 46,
412
+ "table": 5,
413
+ "television receiver": 57,
414
+ "toilet": 37,
415
+ "towel": 50,
416
+ "trade name": 78,
417
+ "traffic light": 89,
418
+ "tray": 90,
419
+ "truck": 52,
420
+ "van": 64,
421
+ "vase": 88,
422
+ "wardrobe": 17,
423
+ "washer": 67,
424
+ "windowpane": 1
425
+ },
426
+ "mask_feature_size": 256,
427
+ "mask_weight": 20.0,
428
+ "model_type": "maskformer",
429
+ "no_object_weight": 0.1,
430
+ "num_attention_heads": 8,
431
+ "num_hidden_layers": 6,
432
+ "num_queries": 100,
433
+ "output_auxiliary_logits": null,
434
+ "torch_dtype": "float32",
435
+ "transformers_version": null,
436
+ "use_auxiliary_loss": false
437
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bab885845fb27354507c03644907f705707b13785cfb864a5eb1b2979645715
3
+ size 411491437