Training in progress, epoch 1

Browse files

Files changed (4) hide show

config.json +28 -85
model.safetensors +2 -2
preprocessor_config.json +5 -5
training_args.bin +1 -1

config.json CHANGED Viewed

@@ -1,98 +1,41 @@
 {
-  "_name_or_path": "PekingU/rtdetr_r50vd_coco_o365",
-  "activation_dropout": 0.0,
-  "activation_function": "silu",
-  "anchor_image_size": null,
   "architectures": [
-    "RTDetrForObjectDetection"
   ],
-  "attention_dropout": 0.0,
-  "auxiliary_loss": true,
-  "backbone": null,
-  "backbone_config": {
-    "model_type": "rt_detr_resnet",
-    "out_features": [
-      "stage2",
-      "stage3",
-      "stage4"
-    ],
-    "out_indices": [
-      2,
-      3,
-      4
-    ]
-  },
-  "backbone_kwargs": null,
-  "batch_norm_eps": 1e-05,
-  "box_noise_scale": 1.0,
-  "d_model": 256,
-  "decoder_activation_function": "relu",
-  "decoder_attention_heads": 8,
-  "decoder_ffn_dim": 1024,
-  "decoder_in_channels": [
-    256,
-    256,
-    256
-  ],
-  "decoder_layers": 6,
-  "decoder_n_points": 4,
-  "disable_custom_kernels": true,
-  "dropout": 0.0,
-  "encode_proj_layers": [
-    2
-  ],
-  "encoder_activation_function": "gelu",
-  "encoder_attention_heads": 8,
-  "encoder_ffn_dim": 1024,
-  "encoder_hidden_dim": 256,
-  "encoder_in_channels": [
-    512,
-    1024,
-    2048
-  ],
-  "encoder_layers": 1,
-  "eos_coefficient": 0.0001,
-  "eval_size": null,
-  "feat_strides": [
-    8,
-    16,
-    32
-  ],
-  "focal_loss_alpha": 0.75,
-  "focal_loss_gamma": 2.0,
-  "freeze_backbone_batch_norms": true,
-  "hidden_expansion": 1.0,
   "id2label": {
     "0": "logos",
     "1": "logos"
   },
-  "initializer_bias_prior_prob": null,
-  "initializer_range": 0.01,
-  "is_encoder_decoder": true,
   "label2id": {
     "logos": 1
   },
-  "label_noise_ratio": 0.5,
-  "layer_norm_eps": 1e-05,
-  "learn_initial_query": false,
-  "matcher_alpha": 0.25,
-  "matcher_bbox_cost": 5.0,
-  "matcher_class_cost": 2.0,
-  "matcher_gamma": 2.0,
-  "matcher_giou_cost": 2.0,
-  "model_type": "rt_detr",
-  "normalize_before": false,
-  "num_denoising": 100,
-  "num_feature_levels": 3,
-  "num_queries": 100,
-  "positional_encoding_temperature": 10000,
   "torch_dtype": "float32",
   "transformers_version": "4.49.0.dev0",
-  "use_focal_loss": true,
-  "use_pretrained_backbone": false,
-  "use_timm_backbone": false,
-  "weight_loss_bbox": 5.0,
-  "weight_loss_giou": 2.0,
-  "weight_loss_vfl": 1.0,
-  "with_box_refine": true
 }

 {
+  "_name_or_path": "hustvl/yolos-small",
   "architectures": [
+    "YolosForObjectDetection"
   ],
+  "attention_probs_dropout_prob": 0.0,
+  "auxiliary_loss": false,
+  "bbox_cost": 5,
+  "bbox_loss_coefficient": 5,
+  "class_cost": 1,
+  "eos_coefficient": 0.1,
+  "giou_cost": 2,
+  "giou_loss_coefficient": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 384,
   "id2label": {
     "0": "logos",
     "1": "logos"
   },
+  "image_size": [
+    512,
+    864
+  ],
+  "initializer_range": 0.02,
+  "intermediate_size": 1536,
   "label2id": {
     "logos": 1
   },
+  "layer_norm_eps": 1e-12,
+  "model_type": "yolos",
+  "num_attention_heads": 6,
+  "num_channels": 3,
+  "num_detection_tokens": 100,
+  "num_hidden_layers": 12,
+  "patch_size": 16,
+  "qkv_bias": true,
   "torch_dtype": "float32",
   "transformers_version": "4.49.0.dev0",
+  "use_mid_position_embeddings": true
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:17149cefd33efad8408e8e66fa986e479651eb6f4ab7deea11982173073b8886
-size 171534680

 version https://git-lfs.github.com/spec/v1
+oid sha256:0b4ace90714f68c1152bd750bf67837715f561ef54ce6d7046a6e8bd7c9688d9
+size 122626212

preprocessor_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "do_convert_annotations": true,
-  "do_normalize": false,
-  "do_pad": false,
   "do_rescale": true,
   "do_resize": true,
   "format": "coco_detection",
@@ -10,7 +10,7 @@
     0.456,
     0.406
   ],
-  "image_processor_type": "RTDetrImageProcessor",
   "image_std": [
     0.229,
     0.224,
@@ -20,7 +20,7 @@
   "resample": 2,
   "rescale_factor": 0.00392156862745098,
   "size": {
-    "height": 640,
-    "width": 640
   }
 }

 {
   "do_convert_annotations": true,
+  "do_normalize": true,
+  "do_pad": true,
   "do_rescale": true,
   "do_resize": true,
   "format": "coco_detection",
     0.456,
     0.406
   ],
+  "image_processor_type": "YolosImageProcessor",
   "image_std": [
     0.229,
     0.224,
   "resample": 2,
   "rescale_factor": 0.00392156862745098,
   "size": {
+    "longest_edge": 1333,
+    "shortest_edge": 800
   }
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f564df4b1ac0a59b8e03c08673ba79a8fe4f793ab91a37a50b6ad4a121adc0dd
 size 5368

 version https://git-lfs.github.com/spec/v1
+oid sha256:c1ea256e36e5887705954b5466860ad6f26877d8523a57b6721a0663ce8aa569
 size 5368