_attn_implementation_autoset: value: true _name_or_path: value: facebook/detr-resnet-50-dc5 _wandb: value: cli_version: 0.18.7 m: - "1": train/learning_rate "5": 2 "6": - 1 - 3 "7": [] - "1": train/global_step "6": - 3 "7": [] - "1": eval/mar_100 "5": 2 "6": - 1 - 3 "7": [] - "1": eval/map_50 "5": 2 "6": - 1 - 3 "7": [] - "1": eval/map_medium "5": 2 "6": - 1 - 3 "7": [] - "1": eval/mar_100_balloon "5": 2 "6": - 1 - 3 "7": [] - "1": eval/map_small "5": 2 "6": - 1 - 3 "7": [] - "1": eval/mar_medium "5": 2 "6": - 1 - 3 "7": [] - "1": eval/mar_large "5": 2 "6": - 1 - 3 "7": [] - "1": eval/map_balloon "5": 2 "6": - 1 - 3 "7": [] - "1": eval/map_object "5": 2 "6": - 1 - 3 "7": [] - "1": eval/map "5": 2 "6": - 1 - 3 "7": [] - "1": eval/map_75 "5": 2 "6": - 1 - 3 "7": [] - "1": eval/steps_per_second "5": 2 "6": - 1 - 3 "7": [] - "1": eval/mar_1 "5": 2 "6": - 1 - 3 "7": [] - "1": eval/mar_small "5": 2 "6": - 1 - 3 "7": [] - "1": eval/map_large "5": 2 "6": - 1 - 3 "7": [] - "1": eval/loss "5": 2 "6": - 1 - 3 "7": [] - "1": eval/mar_100_object "5": 2 "6": - 1 - 3 "7": [] - "1": eval/samples_per_second "5": 2 "6": - 1 - 3 "7": [] - "1": eval/mar_10 "5": 2 "6": - 1 - 3 "7": [] - "1": train/loss "5": 2 "6": - 1 - 3 "7": [] - "1": train/grad_norm "5": 2 "6": - 1 - 3 "7": [] - "1": train/epoch "5": 2 "6": - 1 - 3 "7": [] - "1": eval/runtime "5": 2 "6": - 1 - 3 "7": [] python_version: 3.10.14 t: "1": - 1 - 2 - 3 - 5 - 11 - 12 - 41 - 49 - 51 - 53 - 55 - 63 - 71 - 80 - 105 "2": - 1 - 2 - 3 - 5 - 11 - 12 - 41 - 49 - 51 - 53 - 55 - 63 - 71 - 80 - 105 "3": - 7 - 16 - 19 - 23 - 55 - 62 - 66 "4": 3.10.14 "5": 0.18.7 "6": 4.46.3 "8": - 1 - 2 - 5 "9": "1": transformers_trainer "12": 0.18.7 "13": linux-x86_64 accelerator_config: value: dispatch_batches: null even_batches: true gradient_accumulation_kwargs: null non_blocking: false split_batches: false use_seedable_sampler: true activation_dropout: value: 0 activation_function: value: relu adafactor: value: false adam_beta1: value: 0.9 adam_beta2: value: 0.999 adam_epsilon: value: 1e-08 add_cross_attention: value: false architectures: value: - DetrForObjectDetection attention_dropout: value: 0 auto_find_batch_size: value: false auxiliary_loss: value: false average_tokens_across_devices: value: false backbone: value: resnet50 backbone_config: value: null backbone_kwargs: value: in_chans: 3 out_indices: - 1 - 2 - 3 - 4 output_stride: 16 bad_words_ids: value: null batch_eval_metrics: value: true batch_size: value: 4 bbox_cost: value: 5 bbox_loss_coefficient: value: 5 begin_suppress_tokens: value: null bf16: value: false bf16_full_eval: value: false bos_token_id: value: null chunk_size_feed_forward: value: 0 class_cost: value: 1 classifier_dropout: value: 0 cross_attention_hidden_size: value: null d_model: value: 256 data_seed: value: null dataloader_drop_last: value: false dataloader_num_workers: value: 0 dataloader_persistent_workers: value: false dataloader_pin_memory: value: true dataloader_prefetch_factor: value: null ddp_backend: value: null ddp_broadcast_buffers: value: null ddp_bucket_cap_mb: value: null ddp_find_unused_parameters: value: null ddp_timeout: value: 1800 debug: value: [] decoder_attention_heads: value: 8 decoder_ffn_dim: value: 2048 decoder_layerdrop: value: 0 decoder_layers: value: 6 decoder_start_token_id: value: null deepspeed: value: null dice_loss_coefficient: value: 1 dilation: value: true disable_tqdm: value: false dispatch_batches: value: null diversity_penalty: value: 0 do_eval: value: true do_predict: value: false do_sample: value: false do_train: value: false dropout: value: 0.1 early_stopping: value: false encoder_attention_heads: value: 8 encoder_ffn_dim: value: 2048 encoder_layerdrop: value: 0 encoder_layers: value: 6 encoder_no_repeat_ngram_size: value: 0 eos_coefficient: value: 0.1 eos_token_id: value: null eval_accumulation_steps: value: null eval_delay: value: 0 eval_do_concat_batches: value: true eval_on_start: value: false eval_steps: value: 10 eval_strategy: value: steps eval_use_gather_object: value: false evaluation_strategy: value: steps exponential_decay_length_penalty: value: null finetuning_task: value: null forced_bos_token_id: value: null forced_eos_token_id: value: null fp16: value: true fp16_backend: value: auto fp16_full_eval: value: false fp16_opt_level: value: O1 fsdp: value: [] fsdp_config: value: min_num_params: 0 xla: false xla_fsdp_grad_ckpt: false xla_fsdp_v2: false fsdp_min_num_params: value: 0 fsdp_transformer_layer_cls_to_wrap: value: null full_determinism: value: false giou_cost: value: 2 giou_loss_coefficient: value: 2 gradient_accumulation_steps: value: 1 gradient_checkpointing: value: false gradient_checkpointing_kwargs: value: null greater_is_better: value: null group_by_length: value: false half_precision_backend: value: auto hub_always_push: value: false hub_model_id: value: null hub_private_repo: value: false hub_strategy: value: every_save hub_token: value: id2label: value: "0": object "1": balloon ignore_data_skip: value: false include_for_metrics: value: [] include_inputs_for_metrics: value: false include_num_input_tokens_seen: value: false include_tokens_per_second: value: false init_std: value: 0.02 init_xavier_std: value: 1 is_decoder: value: false is_encoder_decoder: value: true jit_mode_eval: value: false label_names: value: null label_smoothing_factor: value: 0 label2id: value: balloon: 1 object: 0 learning_rate: value: 3e-05 length_column_name: value: length length_penalty: value: 1 load_best_model_at_end: value: false local_rank: value: 0 log_level: value: passive log_level_replica: value: warning log_on_each_node: value: true logging_dir: value: ./runs/Nov27_18-03-24_f5b68522d064 logging_first_step: value: false logging_nan_inf_filter: value: true logging_steps: value: 5 logging_strategy: value: steps lr_scheduler_type: value: linear mask_loss_coefficient: value: 1 max_grad_norm: value: 1 max_length: value: 20 max_position_embeddings: value: 1024 max_steps: value: 125 metric_for_best_model: value: null min_length: value: 0 model/num_parameters: value: 41501895 model_type: value: detr mp_parameters: value: "" neftune_noise_alpha: value: null no_cuda: value: false no_repeat_ngram_size: value: 0 num_beam_groups: value: 1 num_beams: value: 1 num_channels: value: 3 num_epochs: value: 10 num_hidden_layers: value: 6 num_queries: value: 100 num_return_sequences: value: 1 num_train_epochs: value: 3 optim: value: adamw_torch optim_args: value: null optim_target_modules: value: null output_attentions: value: false output_dir: value: . output_hidden_states: value: false output_scores: value: false overwrite_output_dir: value: false pad_token_id: value: null past_index: value: -1 per_device_eval_batch_size: value: 4 per_device_train_batch_size: value: 4 per_gpu_eval_batch_size: value: null per_gpu_train_batch_size: value: null position_embedding_type: value: sine prediction_loss_only: value: false prefix: value: null problem_type: value: null push_to_hub: value: true push_to_hub_model_id: value: null push_to_hub_organization: value: null push_to_hub_token: value: ray_scope: value: last remove_invalid_values: value: false remove_unused_columns: value: false repetition_penalty: value: 1 report_to: value: - wandb restore_callback_states_from_checkpoint: value: false resume_from_checkpoint: value: null return_dict: value: true return_dict_in_generate: value: false run_name: value: . save_on_each_node: value: false save_only_model: value: false save_safetensors: value: true save_steps: value: 10 save_strategy: value: steps save_total_limit: value: 2 scale_embedding: value: false seed: value: 42 sep_token_id: value: null skip_memory_metrics: value: true split_batches: value: null suppress_tokens: value: null task_specific_params: value: null temperature: value: 1 tf_legacy_loss: value: false tf32: value: null tie_encoder_decoder: value: false tie_word_embeddings: value: true tokenizer_class: value: null top_k: value: 50 top_p: value: 1 torch_compile: value: false torch_compile_backend: value: null torch_compile_mode: value: null torch_dtype: value: null torch_empty_cache_steps: value: null torchdynamo: value: null torchscript: value: false tpu_metrics_debug: value: false tpu_num_cores: value: null transformers_version: value: 4.46.3 typical_p: value: 1 use_bfloat16: value: false use_cpu: value: false use_ipex: value: false use_legacy_prediction_loop: value: false use_liger_kernel: value: false use_mps_device: value: false use_pretrained_backbone: value: true use_timm_backbone: value: true warmup_ratio: value: 0 warmup_steps: value: 0 weight_decay: value: 0.0001