MalyO2 commited on
Commit
7b8d0ef
·
verified ·
1 Parent(s): 80f66b2

Training in progress, step 10

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29f1460d1b2b606d31b2db9f60bcf4407838dd6e819cf7f1c4e37c24e5df45c8
3
  size 166495852
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d53021adcd538c8a65f88bdb41cbe0eadccdb7a40ef24891b48970c95e59cab2
3
  size 166495852
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96fff52f29b2c66c78c1e5d63fef22d949b3961b285c6678d6697d7535af9632
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9c5c51611eed8d23035fec4b42ac33b6d1ec20f029f82b22506aa4229a06cf3
3
  size 5240
wandb/debug-internal.log CHANGED
@@ -1,17 +1,16 @@
1
- {"time":"2024-11-27T18:41:07.005767698Z","level":"INFO","msg":"using version","core version":"0.18.7"}
2
- {"time":"2024-11-27T18:41:07.005792171Z","level":"INFO","msg":"created symlink","path":"/kaggle/working/wandb/run-20241127_184106-b3av6kjn/logs/debug-core.log"}
3
- {"time":"2024-11-27T18:41:07.108926428Z","level":"INFO","msg":"created new stream","id":"b3av6kjn"}
4
- {"time":"2024-11-27T18:41:07.10895689Z","level":"INFO","msg":"stream: started","id":"b3av6kjn"}
5
- {"time":"2024-11-27T18:41:07.109002548Z","level":"INFO","msg":"writer: Do: started","stream_id":"b3av6kjn"}
6
- {"time":"2024-11-27T18:41:07.1090194Z","level":"INFO","msg":"handler: started","stream_id":"b3av6kjn"}
7
- {"time":"2024-11-27T18:41:07.109088878Z","level":"INFO","msg":"sender: started","stream_id":"b3av6kjn"}
8
- {"time":"2024-11-27T18:41:08.603139546Z","level":"INFO","msg":"Starting system monitor"}
9
- {"time":"2024-11-27T18:41:09.228871854Z","level":"INFO","msg":"Pausing system monitor"}
10
- {"time":"2024-11-27T18:41:09.22893535Z","level":"INFO","msg":"Resuming system monitor"}
11
- {"time":"2024-11-27T18:41:09.228942454Z","level":"INFO","msg":"Pausing system monitor"}
12
- {"time":"2024-11-27T18:41:09.228947627Z","level":"INFO","msg":"Resuming system monitor"}
13
- {"time":"2024-11-27T18:41:09.228952355Z","level":"INFO","msg":"Pausing system monitor"}
14
- {"time":"2024-11-27T18:41:09.233660913Z","level":"INFO","msg":"Resuming system monitor"}
15
- {"time":"2024-11-27T18:41:10.596026715Z","level":"INFO","msg":"Pausing system monitor"}
16
- {"time":"2024-11-27T18:41:10.864229971Z","level":"INFO","msg":"Resuming system monitor"}
17
- {"time":"2024-11-27T18:46:20.059842369Z","level":"INFO","msg":"Pausing system monitor"}
 
1
+ {"time":"2024-11-27T18:49:14.423820992Z","level":"INFO","msg":"using version","core version":"0.18.7"}
2
+ {"time":"2024-11-27T18:49:14.423845654Z","level":"INFO","msg":"created symlink","path":"/kaggle/working/wandb/run-20241127_184914-lig8s4o3/logs/debug-core.log"}
3
+ {"time":"2024-11-27T18:49:14.527132732Z","level":"INFO","msg":"created new stream","id":"lig8s4o3"}
4
+ {"time":"2024-11-27T18:49:14.527165937Z","level":"INFO","msg":"stream: started","id":"lig8s4o3"}
5
+ {"time":"2024-11-27T18:49:14.527203552Z","level":"INFO","msg":"writer: Do: started","stream_id":"lig8s4o3"}
6
+ {"time":"2024-11-27T18:49:14.527212524Z","level":"INFO","msg":"handler: started","stream_id":"lig8s4o3"}
7
+ {"time":"2024-11-27T18:49:14.527250309Z","level":"INFO","msg":"sender: started","stream_id":"lig8s4o3"}
8
+ {"time":"2024-11-27T18:49:16.008654965Z","level":"INFO","msg":"Starting system monitor"}
9
+ {"time":"2024-11-27T18:49:16.637945267Z","level":"INFO","msg":"Pausing system monitor"}
10
+ {"time":"2024-11-27T18:49:16.638015431Z","level":"INFO","msg":"Resuming system monitor"}
11
+ {"time":"2024-11-27T18:49:16.638022617Z","level":"INFO","msg":"Pausing system monitor"}
12
+ {"time":"2024-11-27T18:49:16.638027426Z","level":"INFO","msg":"Resuming system monitor"}
13
+ {"time":"2024-11-27T18:49:16.638031951Z","level":"INFO","msg":"Pausing system monitor"}
14
+ {"time":"2024-11-27T18:49:16.641816205Z","level":"INFO","msg":"Resuming system monitor"}
15
+ {"time":"2024-11-27T18:49:17.996060396Z","level":"INFO","msg":"Pausing system monitor"}
16
+ {"time":"2024-11-27T18:49:18.259742288Z","level":"INFO","msg":"Resuming system monitor"}
 
wandb/debug.log CHANGED
@@ -1,44 +1,42 @@
1
- 2024-11-27 18:41:07,000 INFO MainThread:1986 [wandb_setup.py:_flush():79] Current SDK version is 0.18.7
2
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_setup.py:_flush():79] Configure stats pid to 1986
3
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_setup.py:_flush():79] Loading settings from /root/.config/wandb/settings
4
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_setup.py:_flush():79] Loading settings from /kaggle/working/wandb/settings
5
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_setup.py:_flush():79] Loading settings from environment variables: {}
6
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_setup.py:_flush():79] Applying setup settings: {'mode': None, '_disable_service': None}
7
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_setup.py:_flush():79] Inferring run settings from compute environment: {'program': '<python with no main file>'}
8
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_setup.py:_flush():79] Applying login settings: {}
9
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_init.py:_log_setup():533] Logging user logs to /kaggle/working/wandb/run-20241127_184106-b3av6kjn/logs/debug.log
10
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_init.py:_log_setup():534] Logging internal logs to /kaggle/working/wandb/run-20241127_184106-b3av6kjn/logs/debug-internal.log
11
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_init.py:_jupyter_setup():479] configuring jupyter hooks <wandb.sdk.wandb_init._WandbInit object at 0x7cac14039b40>
12
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_init.py:init():619] calling init triggers
13
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_init.py:init():626] wandb.init called with sweep_config: {}
14
  config: {'batch_size': 4, 'learning_rate': 0.0003, 'num_epochs': 10}
15
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_init.py:init():669] starting backend
16
- 2024-11-27 18:41:07,001 INFO MainThread:1986 [wandb_init.py:init():673] sending inform_init request
17
- 2024-11-27 18:41:07,003 INFO MainThread:1986 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
- 2024-11-27 18:41:07,003 INFO MainThread:1986 [wandb_init.py:init():686] backend started and connected
19
- 2024-11-27 18:41:07,015 INFO MainThread:1986 [wandb_run.py:_label_probe_notebook():1339] probe notebook
20
- 2024-11-27 18:41:08,226 INFO MainThread:1986 [wandb_init.py:init():781] updated telemetry
21
- 2024-11-27 18:41:08,230 INFO MainThread:1986 [wandb_init.py:init():814] communicating run to backend with 90.0 second timeout
22
- 2024-11-27 18:41:08,598 INFO MainThread:1986 [wandb_init.py:init():867] starting run threads in backend
23
- 2024-11-27 18:41:09,190 INFO MainThread:1986 [wandb_run.py:_console_start():2456] atexit reg
24
- 2024-11-27 18:41:09,191 INFO MainThread:1986 [wandb_run.py:_redirect():2305] redirect: wrap_raw
25
- 2024-11-27 18:41:09,191 INFO MainThread:1986 [wandb_run.py:_redirect():2370] Wrapping output streams.
26
- 2024-11-27 18:41:09,191 INFO MainThread:1986 [wandb_run.py:_redirect():2395] Redirects installed.
27
- 2024-11-27 18:41:09,195 INFO MainThread:1986 [wandb_init.py:init():911] run started, returning control to user process
28
- 2024-11-27 18:41:09,196 INFO MainThread:1986 [jupyter.py:save_ipynb():387] not saving jupyter notebook
29
- 2024-11-27 18:41:09,196 INFO MainThread:1986 [wandb_init.py:_pause_backend():444] pausing backend
30
- 2024-11-27 18:41:09,205 INFO MainThread:1986 [wandb_init.py:_resume_backend():449] resuming backend
31
- 2024-11-27 18:41:09,207 INFO MainThread:1986 [jupyter.py:save_ipynb():387] not saving jupyter notebook
32
- 2024-11-27 18:41:09,207 INFO MainThread:1986 [wandb_init.py:_pause_backend():444] pausing backend
33
- 2024-11-27 18:41:09,214 INFO MainThread:1986 [wandb_init.py:_resume_backend():449] resuming backend
34
- 2024-11-27 18:41:09,227 INFO MainThread:1986 [jupyter.py:save_ipynb():387] not saving jupyter notebook
35
- 2024-11-27 18:41:09,228 INFO MainThread:1986 [wandb_init.py:_pause_backend():444] pausing backend
36
- 2024-11-27 18:41:09,233 INFO MainThread:1986 [wandb_init.py:_resume_backend():449] resuming backend
37
- 2024-11-27 18:41:10,595 INFO MainThread:1986 [jupyter.py:save_ipynb():387] not saving jupyter notebook
38
- 2024-11-27 18:41:10,595 INFO MainThread:1986 [wandb_init.py:_pause_backend():444] pausing backend
39
- 2024-11-27 18:41:10,863 INFO MainThread:1986 [wandb_init.py:_resume_backend():449] resuming backend
40
- 2024-11-27 18:41:11,250 INFO MainThread:1986 [wandb_run.py:_config_callback():1387] config_cb None None {'use_timm_backbone': True, 'backbone_config': None, 'num_channels': 3, 'num_queries': 100, 'd_model': 256, 'encoder_ffn_dim': 2048, 'encoder_layers': 6, 'encoder_attention_heads': 8, 'decoder_ffn_dim': 2048, 'decoder_layers': 6, 'decoder_attention_heads': 8, 'dropout': 0.1, 'attention_dropout': 0.0, 'activation_dropout': 0.0, 'activation_function': 'relu', 'init_std': 0.02, 'init_xavier_std': 1.0, 'encoder_layerdrop': 0.0, 'decoder_layerdrop': 0.0, 'num_hidden_layers': 6, 'auxiliary_loss': False, 'position_embedding_type': 'sine', 'backbone': 'resnet50', 'use_pretrained_backbone': True, 'backbone_kwargs': {'output_stride': 16, 'out_indices': [1, 2, 3, 4], 'in_chans': 3}, 'dilation': True, 'class_cost': 1, 'bbox_cost': 5, 'giou_cost': 2, 'mask_loss_coefficient': 1, 'dice_loss_coefficient': 1, 'bbox_loss_coefficient': 5, 'giou_loss_coefficient': 2, 'eos_coefficient': 0.1, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': True, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['DetrForObjectDetection'], 'finetuning_task': None, 'id2label': {0: 'object', 1: 'balloon'}, 'label2id': {'object': 0, 'balloon': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/detr-resnet-50-dc5', '_attn_implementation_autoset': True, 'transformers_version': '4.46.3', 'classifier_dropout': 0.0, 'max_position_embeddings': 1024, 'model_type': 'detr', 'scale_embedding': False, 'output_dir': '.', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 0.0001, 'weight_decay': 0.0001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': 250, 'lr_scheduler_type': 'linear', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.0, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': './runs/Nov27_18-41-09_f5b68522d064', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 10, 'save_total_limit': 2, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': 10, 'dataloader_num_workers': 0, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '.', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'evaluation_strategy': 'steps', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': True, 'eval_on_start': False, 'use_liger_kernel': False, 'eval_use_gather_object': False, 'average_tokens_across_devices': False}
41
- 2024-11-27 18:41:11,258 INFO MainThread:1986 [wandb_config.py:__setitem__():154] config set model/num_parameters = 41501895 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7caab878e680>>
42
- 2024-11-27 18:41:11,258 INFO MainThread:1986 [wandb_run.py:_config_callback():1387] config_cb model/num_parameters 41501895 None
43
- 2024-11-27 18:46:20,059 INFO MainThread:1986 [jupyter.py:save_ipynb():387] not saving jupyter notebook
44
- 2024-11-27 18:46:20,059 INFO MainThread:1986 [wandb_init.py:_pause_backend():444] pausing backend
 
1
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Current SDK version is 0.18.7
2
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Configure stats pid to 2090
3
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Loading settings from /root/.config/wandb/settings
4
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Loading settings from /kaggle/working/wandb/settings
5
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Loading settings from environment variables: {}
6
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Applying setup settings: {'mode': None, '_disable_service': None}
7
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Inferring run settings from compute environment: {'program': '<python with no main file>'}
8
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Applying login settings: {}
9
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:_log_setup():533] Logging user logs to /kaggle/working/wandb/run-20241127_184914-lig8s4o3/logs/debug.log
10
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:_log_setup():534] Logging internal logs to /kaggle/working/wandb/run-20241127_184914-lig8s4o3/logs/debug-internal.log
11
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:_jupyter_setup():479] configuring jupyter hooks <wandb.sdk.wandb_init._WandbInit object at 0x7f50757af550>
12
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:init():619] calling init triggers
13
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:init():626] wandb.init called with sweep_config: {}
14
  config: {'batch_size': 4, 'learning_rate': 0.0003, 'num_epochs': 10}
15
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:init():669] starting backend
16
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:init():673] sending inform_init request
17
+ 2024-11-27 18:49:14,420 INFO MainThread:2090 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
+ 2024-11-27 18:49:14,421 INFO MainThread:2090 [wandb_init.py:init():686] backend started and connected
19
+ 2024-11-27 18:49:14,433 INFO MainThread:2090 [wandb_run.py:_label_probe_notebook():1339] probe notebook
20
+ 2024-11-27 18:49:15,672 INFO MainThread:2090 [wandb_init.py:init():781] updated telemetry
21
+ 2024-11-27 18:49:15,675 INFO MainThread:2090 [wandb_init.py:init():814] communicating run to backend with 90.0 second timeout
22
+ 2024-11-27 18:49:16,004 INFO MainThread:2090 [wandb_init.py:init():867] starting run threads in backend
23
+ 2024-11-27 18:49:16,599 INFO MainThread:2090 [wandb_run.py:_console_start():2456] atexit reg
24
+ 2024-11-27 18:49:16,599 INFO MainThread:2090 [wandb_run.py:_redirect():2305] redirect: wrap_raw
25
+ 2024-11-27 18:49:16,599 INFO MainThread:2090 [wandb_run.py:_redirect():2370] Wrapping output streams.
26
+ 2024-11-27 18:49:16,600 INFO MainThread:2090 [wandb_run.py:_redirect():2395] Redirects installed.
27
+ 2024-11-27 18:49:16,604 INFO MainThread:2090 [wandb_init.py:init():911] run started, returning control to user process
28
+ 2024-11-27 18:49:16,605 INFO MainThread:2090 [jupyter.py:save_ipynb():387] not saving jupyter notebook
29
+ 2024-11-27 18:49:16,605 INFO MainThread:2090 [wandb_init.py:_pause_backend():444] pausing backend
30
+ 2024-11-27 18:49:16,615 INFO MainThread:2090 [wandb_init.py:_resume_backend():449] resuming backend
31
+ 2024-11-27 18:49:16,617 INFO MainThread:2090 [jupyter.py:save_ipynb():387] not saving jupyter notebook
32
+ 2024-11-27 18:49:16,617 INFO MainThread:2090 [wandb_init.py:_pause_backend():444] pausing backend
33
+ 2024-11-27 18:49:16,623 INFO MainThread:2090 [wandb_init.py:_resume_backend():449] resuming backend
34
+ 2024-11-27 18:49:16,635 INFO MainThread:2090 [jupyter.py:save_ipynb():387] not saving jupyter notebook
35
+ 2024-11-27 18:49:16,635 INFO MainThread:2090 [wandb_init.py:_pause_backend():444] pausing backend
36
+ 2024-11-27 18:49:16,641 INFO MainThread:2090 [wandb_init.py:_resume_backend():449] resuming backend
37
+ 2024-11-27 18:49:17,995 INFO MainThread:2090 [jupyter.py:save_ipynb():387] not saving jupyter notebook
38
+ 2024-11-27 18:49:17,995 INFO MainThread:2090 [wandb_init.py:_pause_backend():444] pausing backend
39
+ 2024-11-27 18:49:18,259 INFO MainThread:2090 [wandb_init.py:_resume_backend():449] resuming backend
40
+ 2024-11-27 18:49:18,647 INFO MainThread:2090 [wandb_run.py:_config_callback():1387] config_cb None None {'use_timm_backbone': True, 'backbone_config': None, 'num_channels': 3, 'num_queries': 100, 'd_model': 256, 'encoder_ffn_dim': 2048, 'encoder_layers': 6, 'encoder_attention_heads': 8, 'decoder_ffn_dim': 2048, 'decoder_layers': 6, 'decoder_attention_heads': 8, 'dropout': 0.1, 'attention_dropout': 0.0, 'activation_dropout': 0.0, 'activation_function': 'relu', 'init_std': 0.02, 'init_xavier_std': 1.0, 'encoder_layerdrop': 0.0, 'decoder_layerdrop': 0.0, 'num_hidden_layers': 6, 'auxiliary_loss': False, 'position_embedding_type': 'sine', 'backbone': 'resnet50', 'use_pretrained_backbone': True, 'backbone_kwargs': {'output_stride': 16, 'out_indices': [1, 2, 3, 4], 'in_chans': 3}, 'dilation': True, 'class_cost': 1, 'bbox_cost': 5, 'giou_cost': 2, 'mask_loss_coefficient': 1, 'dice_loss_coefficient': 1, 'bbox_loss_coefficient': 5, 'giou_loss_coefficient': 2, 'eos_coefficient': 0.1, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': True, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['DetrForObjectDetection'], 'finetuning_task': None, 'id2label': {0: 'object', 1: 'balloon'}, 'label2id': {'object': 0, 'balloon': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/detr-resnet-50-dc5', '_attn_implementation_autoset': True, 'transformers_version': '4.46.3', 'classifier_dropout': 0.0, 'max_position_embeddings': 1024, 'model_type': 'detr', 'scale_embedding': False, 'output_dir': '.', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.0001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': 400, 'lr_scheduler_type': 'linear', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.0, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': './runs/Nov27_18-49-17_f5b68522d064', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 10, 'save_total_limit': 2, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': 10, 'dataloader_num_workers': 0, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '.', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'evaluation_strategy': 'steps', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': True, 'eval_on_start': False, 'use_liger_kernel': False, 'eval_use_gather_object': False, 'average_tokens_across_devices': False}
41
+ 2024-11-27 18:49:18,653 INFO MainThread:2090 [wandb_config.py:__setitem__():154] config set model/num_parameters = 41501895 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f507463aad0>>
42
+ 2024-11-27 18:49:18,653 INFO MainThread:2090 [wandb_run.py:_config_callback():1387] config_cb model/num_parameters 41501895 None
 
 
wandb/run-20241127_184106-b3av6kjn/files/config.yaml ADDED
@@ -0,0 +1,653 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _attn_implementation_autoset:
2
+ value: false
3
+ _name_or_path:
4
+ value: facebook/detr-resnet-50-dc5
5
+ _wandb:
6
+ value:
7
+ cli_version: 0.18.7
8
+ m:
9
+ - "1": eval/mar_large
10
+ "5": 2
11
+ "6":
12
+ - 1
13
+ - 3
14
+ "7": []
15
+ - "1": train/global_step
16
+ "6":
17
+ - 3
18
+ "7": []
19
+ - "1": eval/mar_medium
20
+ "5": 2
21
+ "6":
22
+ - 1
23
+ - 3
24
+ "7": []
25
+ - "1": eval/map_small
26
+ "5": 2
27
+ "6":
28
+ - 1
29
+ - 3
30
+ "7": []
31
+ - "1": train/grad_norm
32
+ "5": 2
33
+ "6":
34
+ - 1
35
+ - 3
36
+ "7": []
37
+ - "1": eval/map_50
38
+ "5": 2
39
+ "6":
40
+ - 1
41
+ - 3
42
+ "7": []
43
+ - "1": eval/mar_1
44
+ "5": 2
45
+ "6":
46
+ - 1
47
+ - 3
48
+ "7": []
49
+ - "1": eval/mar_100
50
+ "5": 2
51
+ "6":
52
+ - 1
53
+ - 3
54
+ "7": []
55
+ - "1": train/loss
56
+ "5": 2
57
+ "6":
58
+ - 1
59
+ - 3
60
+ "7": []
61
+ - "1": eval/map_medium
62
+ "5": 2
63
+ "6":
64
+ - 1
65
+ - 3
66
+ "7": []
67
+ - "1": eval/steps_per_second
68
+ "5": 2
69
+ "6":
70
+ - 1
71
+ - 3
72
+ "7": []
73
+ - "1": eval/map_75
74
+ "5": 2
75
+ "6":
76
+ - 1
77
+ - 3
78
+ "7": []
79
+ - "1": train/epoch
80
+ "5": 2
81
+ "6":
82
+ - 1
83
+ - 3
84
+ "7": []
85
+ - "1": eval/map_large
86
+ "5": 2
87
+ "6":
88
+ - 1
89
+ - 3
90
+ "7": []
91
+ - "1": eval/mar_10
92
+ "5": 2
93
+ "6":
94
+ - 1
95
+ - 3
96
+ "7": []
97
+ - "1": eval/map
98
+ "5": 2
99
+ "6":
100
+ - 1
101
+ - 3
102
+ "7": []
103
+ - "1": eval/samples_per_second
104
+ "5": 2
105
+ "6":
106
+ - 1
107
+ - 3
108
+ "7": []
109
+ - "1": eval/mar_small
110
+ "5": 2
111
+ "6":
112
+ - 1
113
+ - 3
114
+ "7": []
115
+ - "1": eval/runtime
116
+ "5": 2
117
+ "6":
118
+ - 1
119
+ - 3
120
+ "7": []
121
+ - "1": eval/loss
122
+ "5": 2
123
+ "6":
124
+ - 1
125
+ - 3
126
+ "7": []
127
+ - "1": train/learning_rate
128
+ "5": 2
129
+ "6":
130
+ - 1
131
+ - 3
132
+ "7": []
133
+ python_version: 3.10.14
134
+ t:
135
+ "1":
136
+ - 1
137
+ - 2
138
+ - 3
139
+ - 11
140
+ - 12
141
+ - 41
142
+ - 49
143
+ - 51
144
+ - 55
145
+ - 63
146
+ - 71
147
+ - 80
148
+ - 105
149
+ "2":
150
+ - 1
151
+ - 2
152
+ - 3
153
+ - 5
154
+ - 11
155
+ - 12
156
+ - 41
157
+ - 49
158
+ - 51
159
+ - 53
160
+ - 55
161
+ - 63
162
+ - 71
163
+ - 80
164
+ - 105
165
+ "3":
166
+ - 7
167
+ - 16
168
+ - 19
169
+ - 23
170
+ - 55
171
+ - 66
172
+ "4": 3.10.14
173
+ "5": 0.18.7
174
+ "6": 4.46.3
175
+ "8":
176
+ - 1
177
+ - 2
178
+ - 5
179
+ "9":
180
+ "1": transformers_trainer
181
+ "12": 0.18.7
182
+ "13": linux-x86_64
183
+ accelerator_config:
184
+ value:
185
+ dispatch_batches: null
186
+ even_batches: true
187
+ gradient_accumulation_kwargs: null
188
+ non_blocking: false
189
+ split_batches: false
190
+ use_seedable_sampler: true
191
+ activation_dropout:
192
+ value: 0
193
+ activation_function:
194
+ value: relu
195
+ adafactor:
196
+ value: false
197
+ adam_beta1:
198
+ value: 0.9
199
+ adam_beta2:
200
+ value: 0.999
201
+ adam_epsilon:
202
+ value: 1e-08
203
+ add_cross_attention:
204
+ value: false
205
+ architectures:
206
+ value:
207
+ - DetrForObjectDetection
208
+ attention_dropout:
209
+ value: 0
210
+ auto_find_batch_size:
211
+ value: false
212
+ auxiliary_loss:
213
+ value: false
214
+ average_tokens_across_devices:
215
+ value: false
216
+ backbone:
217
+ value: resnet50
218
+ backbone_config:
219
+ value: null
220
+ backbone_kwargs:
221
+ value:
222
+ in_chans: 3
223
+ out_indices:
224
+ - 1
225
+ - 2
226
+ - 3
227
+ - 4
228
+ output_stride: 16
229
+ bad_words_ids:
230
+ value: null
231
+ batch_eval_metrics:
232
+ value: true
233
+ batch_size:
234
+ value: 4
235
+ bbox_cost:
236
+ value: 5
237
+ bbox_loss_coefficient:
238
+ value: 5
239
+ begin_suppress_tokens:
240
+ value: null
241
+ bf16:
242
+ value: false
243
+ bf16_full_eval:
244
+ value: false
245
+ bos_token_id:
246
+ value: null
247
+ chunk_size_feed_forward:
248
+ value: 0
249
+ class_cost:
250
+ value: 1
251
+ classifier_dropout:
252
+ value: 0
253
+ cross_attention_hidden_size:
254
+ value: null
255
+ d_model:
256
+ value: 256
257
+ data_seed:
258
+ value: null
259
+ dataloader_drop_last:
260
+ value: false
261
+ dataloader_num_workers:
262
+ value: 0
263
+ dataloader_persistent_workers:
264
+ value: false
265
+ dataloader_pin_memory:
266
+ value: true
267
+ dataloader_prefetch_factor:
268
+ value: null
269
+ ddp_backend:
270
+ value: null
271
+ ddp_broadcast_buffers:
272
+ value: null
273
+ ddp_bucket_cap_mb:
274
+ value: null
275
+ ddp_find_unused_parameters:
276
+ value: null
277
+ ddp_timeout:
278
+ value: 1800
279
+ debug:
280
+ value: []
281
+ decoder_attention_heads:
282
+ value: 8
283
+ decoder_ffn_dim:
284
+ value: 2048
285
+ decoder_layerdrop:
286
+ value: 0
287
+ decoder_layers:
288
+ value: 6
289
+ decoder_start_token_id:
290
+ value: null
291
+ deepspeed:
292
+ value: null
293
+ dice_loss_coefficient:
294
+ value: 1
295
+ dilation:
296
+ value: true
297
+ disable_tqdm:
298
+ value: false
299
+ dispatch_batches:
300
+ value: null
301
+ diversity_penalty:
302
+ value: 0
303
+ do_eval:
304
+ value: true
305
+ do_predict:
306
+ value: false
307
+ do_sample:
308
+ value: false
309
+ do_train:
310
+ value: false
311
+ dropout:
312
+ value: 0.1
313
+ early_stopping:
314
+ value: false
315
+ encoder_attention_heads:
316
+ value: 8
317
+ encoder_ffn_dim:
318
+ value: 2048
319
+ encoder_layerdrop:
320
+ value: 0
321
+ encoder_layers:
322
+ value: 6
323
+ encoder_no_repeat_ngram_size:
324
+ value: 0
325
+ eos_coefficient:
326
+ value: 0.1
327
+ eos_token_id:
328
+ value: null
329
+ eval_accumulation_steps:
330
+ value: null
331
+ eval_delay:
332
+ value: 0
333
+ eval_do_concat_batches:
334
+ value: true
335
+ eval_on_start:
336
+ value: false
337
+ eval_steps:
338
+ value: 10
339
+ eval_strategy:
340
+ value: steps
341
+ eval_use_gather_object:
342
+ value: false
343
+ evaluation_strategy:
344
+ value: steps
345
+ exponential_decay_length_penalty:
346
+ value: null
347
+ finetuning_task:
348
+ value: null
349
+ forced_bos_token_id:
350
+ value: null
351
+ forced_eos_token_id:
352
+ value: null
353
+ fp16:
354
+ value: true
355
+ fp16_backend:
356
+ value: auto
357
+ fp16_full_eval:
358
+ value: false
359
+ fp16_opt_level:
360
+ value: O1
361
+ fsdp:
362
+ value: []
363
+ fsdp_config:
364
+ value:
365
+ min_num_params: 0
366
+ xla: false
367
+ xla_fsdp_grad_ckpt: false
368
+ xla_fsdp_v2: false
369
+ fsdp_min_num_params:
370
+ value: 0
371
+ fsdp_transformer_layer_cls_to_wrap:
372
+ value: null
373
+ full_determinism:
374
+ value: false
375
+ giou_cost:
376
+ value: 2
377
+ giou_loss_coefficient:
378
+ value: 2
379
+ gradient_accumulation_steps:
380
+ value: 1
381
+ gradient_checkpointing:
382
+ value: false
383
+ gradient_checkpointing_kwargs:
384
+ value: null
385
+ greater_is_better:
386
+ value: null
387
+ group_by_length:
388
+ value: false
389
+ half_precision_backend:
390
+ value: auto
391
+ hub_always_push:
392
+ value: false
393
+ hub_model_id:
394
+ value: null
395
+ hub_private_repo:
396
+ value: false
397
+ hub_strategy:
398
+ value: every_save
399
+ hub_token:
400
+ value: <HUB_TOKEN>
401
+ id2label:
402
+ value:
403
+ "0": object
404
+ "1": balloon
405
+ ignore_data_skip:
406
+ value: false
407
+ include_for_metrics:
408
+ value: []
409
+ include_inputs_for_metrics:
410
+ value: false
411
+ include_num_input_tokens_seen:
412
+ value: false
413
+ include_tokens_per_second:
414
+ value: false
415
+ init_std:
416
+ value: 0.02
417
+ init_xavier_std:
418
+ value: 1
419
+ is_decoder:
420
+ value: false
421
+ is_encoder_decoder:
422
+ value: true
423
+ jit_mode_eval:
424
+ value: false
425
+ label_names:
426
+ value: null
427
+ label_smoothing_factor:
428
+ value: 0
429
+ label2id:
430
+ value:
431
+ balloon: 1
432
+ object: 0
433
+ learning_rate:
434
+ value: 5e-05
435
+ length_column_name:
436
+ value: length
437
+ length_penalty:
438
+ value: 1
439
+ load_best_model_at_end:
440
+ value: false
441
+ local_rank:
442
+ value: 0
443
+ log_level:
444
+ value: passive
445
+ log_level_replica:
446
+ value: warning
447
+ log_on_each_node:
448
+ value: true
449
+ logging_dir:
450
+ value: ./runs/Nov27_18-46-25_f5b68522d064
451
+ logging_first_step:
452
+ value: false
453
+ logging_nan_inf_filter:
454
+ value: true
455
+ logging_steps:
456
+ value: 5
457
+ logging_strategy:
458
+ value: steps
459
+ lr_scheduler_type:
460
+ value: linear
461
+ mask_loss_coefficient:
462
+ value: 1
463
+ max_grad_norm:
464
+ value: 1
465
+ max_length:
466
+ value: 20
467
+ max_position_embeddings:
468
+ value: 1024
469
+ max_steps:
470
+ value: 250
471
+ metric_for_best_model:
472
+ value: null
473
+ min_length:
474
+ value: 0
475
+ model/num_parameters:
476
+ value: 41501895
477
+ model_type:
478
+ value: detr
479
+ mp_parameters:
480
+ value: ""
481
+ neftune_noise_alpha:
482
+ value: null
483
+ no_cuda:
484
+ value: false
485
+ no_repeat_ngram_size:
486
+ value: 0
487
+ num_beam_groups:
488
+ value: 1
489
+ num_beams:
490
+ value: 1
491
+ num_channels:
492
+ value: 3
493
+ num_epochs:
494
+ value: 10
495
+ num_hidden_layers:
496
+ value: 6
497
+ num_queries:
498
+ value: 100
499
+ num_return_sequences:
500
+ value: 1
501
+ num_train_epochs:
502
+ value: 3
503
+ optim:
504
+ value: adamw_torch
505
+ optim_args:
506
+ value: null
507
+ optim_target_modules:
508
+ value: null
509
+ output_attentions:
510
+ value: false
511
+ output_dir:
512
+ value: .
513
+ output_hidden_states:
514
+ value: false
515
+ output_scores:
516
+ value: false
517
+ overwrite_output_dir:
518
+ value: false
519
+ pad_token_id:
520
+ value: null
521
+ past_index:
522
+ value: -1
523
+ per_device_eval_batch_size:
524
+ value: 4
525
+ per_device_train_batch_size:
526
+ value: 4
527
+ per_gpu_eval_batch_size:
528
+ value: null
529
+ per_gpu_train_batch_size:
530
+ value: null
531
+ position_embedding_type:
532
+ value: sine
533
+ prediction_loss_only:
534
+ value: false
535
+ prefix:
536
+ value: null
537
+ problem_type:
538
+ value: null
539
+ push_to_hub:
540
+ value: true
541
+ push_to_hub_model_id:
542
+ value: null
543
+ push_to_hub_organization:
544
+ value: null
545
+ push_to_hub_token:
546
+ value: <PUSH_TO_HUB_TOKEN>
547
+ ray_scope:
548
+ value: last
549
+ remove_invalid_values:
550
+ value: false
551
+ remove_unused_columns:
552
+ value: false
553
+ repetition_penalty:
554
+ value: 1
555
+ report_to:
556
+ value:
557
+ - wandb
558
+ restore_callback_states_from_checkpoint:
559
+ value: false
560
+ resume_from_checkpoint:
561
+ value: null
562
+ return_dict:
563
+ value: true
564
+ return_dict_in_generate:
565
+ value: false
566
+ run_name:
567
+ value: .
568
+ save_on_each_node:
569
+ value: false
570
+ save_only_model:
571
+ value: false
572
+ save_safetensors:
573
+ value: true
574
+ save_steps:
575
+ value: 10
576
+ save_strategy:
577
+ value: steps
578
+ save_total_limit:
579
+ value: 2
580
+ scale_embedding:
581
+ value: false
582
+ seed:
583
+ value: 42
584
+ sep_token_id:
585
+ value: null
586
+ skip_memory_metrics:
587
+ value: true
588
+ split_batches:
589
+ value: null
590
+ suppress_tokens:
591
+ value: null
592
+ task_specific_params:
593
+ value: null
594
+ temperature:
595
+ value: 1
596
+ tf_legacy_loss:
597
+ value: false
598
+ tf32:
599
+ value: null
600
+ tie_encoder_decoder:
601
+ value: false
602
+ tie_word_embeddings:
603
+ value: true
604
+ tokenizer_class:
605
+ value: null
606
+ top_k:
607
+ value: 50
608
+ top_p:
609
+ value: 1
610
+ torch_compile:
611
+ value: false
612
+ torch_compile_backend:
613
+ value: null
614
+ torch_compile_mode:
615
+ value: null
616
+ torch_dtype:
617
+ value: float32
618
+ torch_empty_cache_steps:
619
+ value: null
620
+ torchdynamo:
621
+ value: null
622
+ torchscript:
623
+ value: false
624
+ tpu_metrics_debug:
625
+ value: false
626
+ tpu_num_cores:
627
+ value: null
628
+ transformers_version:
629
+ value: 4.46.3
630
+ typical_p:
631
+ value: 1
632
+ use_bfloat16:
633
+ value: false
634
+ use_cpu:
635
+ value: false
636
+ use_ipex:
637
+ value: false
638
+ use_legacy_prediction_loop:
639
+ value: false
640
+ use_liger_kernel:
641
+ value: false
642
+ use_mps_device:
643
+ value: false
644
+ use_pretrained_backbone:
645
+ value: true
646
+ use_timm_backbone:
647
+ value: true
648
+ warmup_ratio:
649
+ value: 0
650
+ warmup_steps:
651
+ value: 0
652
+ weight_decay:
653
+ value: 0.0001
wandb/run-20241127_184106-b3av6kjn/files/output.log CHANGED
@@ -6,3 +6,10 @@
6
  self.scaler = torch.cuda.amp.GradScaler(**kwargs)
7
  max_steps is given, it will override any value given in num_train_epochs
8
  wandb: WARNING The `run_name` is currently set to the same value as `TrainingArguments.output_dir`. If this was not intended, please specify a different run name by setting the `TrainingArguments.run_name` parameter.
 
 
 
 
 
 
 
 
6
  self.scaler = torch.cuda.amp.GradScaler(**kwargs)
7
  max_steps is given, it will override any value given in num_train_epochs
8
  wandb: WARNING The `run_name` is currently set to the same value as `TrainingArguments.output_dir`. If this was not intended, please specify a different run name by setting the `TrainingArguments.run_name` parameter.
9
+ /opt/conda/lib/python3.10/site-packages/transformers/training_args.py:1568: FutureWarning: `evaluation_strategy` is deprecated and will be removed in version 4.46 of 🤗 Transformers. Use `eval_strategy` instead
10
+ warnings.warn(
11
+ /tmp/ipykernel_1986/2368586458.py:28: FutureWarning: `tokenizer` is deprecated and will be removed in version 5.0.0 for `Trainer.__init__`. Use `processing_class` instead.
12
+ trainer = Trainer(
13
+ /opt/conda/lib/python3.10/site-packages/accelerate/accelerator.py:494: FutureWarning: `torch.cuda.amp.GradScaler(args...)` is deprecated. Please use `torch.amp.GradScaler('cuda', args...)` instead.
14
+ self.scaler = torch.cuda.amp.GradScaler(**kwargs)
15
+ max_steps is given, it will override any value given in num_train_epochs
wandb/run-20241127_184106-b3av6kjn/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"eval/loss":1.0323222875595093,"eval/runtime":3.2533,"eval/map":0.1805,"_runtime":306.314061416,"_timestamp":1.7327331735901072e+09,"train/loss":0.9611,"eval/map_large":0.28,"train/global_step":160,"train/grad_norm":29.917068481445312,"_wandb":{"runtime":315},"_step":47,"eval/map_medium":0.1997,"train/learning_rate":3.9200000000000004e-05,"eval/mar_10":0.3412,"eval/mar_small":0,"eval/samples_per_second":3.689,"eval/map_50":0.2457,"eval/mar_medium":0.6316,"eval/map_75":0.2118,"eval/map_small":0,"eval/mar_100":0.6618,"eval/mar_large":0.8077,"eval/mar_1":0.0971,"train/epoch":12.307692307692308,"eval/steps_per_second":0.922}
wandb/run-20241127_184106-b3av6kjn/logs/debug-core.log CHANGED
@@ -5,3 +5,10 @@
5
  {"time":"2024-11-27T18:41:06.874677222Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"127.0.0.1:42940"}
6
  {"time":"2024-11-27T18:41:07.005615036Z","level":"INFO","msg":"handleInformInit: received","streamId":"b3av6kjn","id":"127.0.0.1:42940"}
7
  {"time":"2024-11-27T18:41:07.108964635Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"b3av6kjn","id":"127.0.0.1:42940"}
 
 
 
 
 
 
 
 
5
  {"time":"2024-11-27T18:41:06.874677222Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"127.0.0.1:42940"}
6
  {"time":"2024-11-27T18:41:07.005615036Z","level":"INFO","msg":"handleInformInit: received","streamId":"b3av6kjn","id":"127.0.0.1:42940"}
7
  {"time":"2024-11-27T18:41:07.108964635Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"b3av6kjn","id":"127.0.0.1:42940"}
8
+ {"time":"2024-11-27T18:46:59.940406578Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"127.0.0.1:42940"}
9
+ {"time":"2024-11-27T18:46:59.94059889Z","level":"INFO","msg":"connection: Close: initiating connection closure","id":"127.0.0.1:42940"}
10
+ {"time":"2024-11-27T18:46:59.941846038Z","level":"INFO","msg":"connection: Close: connection successfully closed","id":"127.0.0.1:42940"}
11
+ {"time":"2024-11-27T18:46:59.940634315Z","level":"INFO","msg":"server is shutting down"}
12
+ {"time":"2024-11-27T18:47:00.514632054Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"127.0.0.1:42940"}
13
+ {"time":"2024-11-27T18:47:00.514671793Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"127.0.0.1:42940"}
14
+ {"time":"2024-11-27T18:47:00.514696726Z","level":"INFO","msg":"server is closed"}
wandb/run-20241127_184106-b3av6kjn/logs/debug-internal.log CHANGED
@@ -15,3 +15,20 @@
15
  {"time":"2024-11-27T18:41:10.596026715Z","level":"INFO","msg":"Pausing system monitor"}
16
  {"time":"2024-11-27T18:41:10.864229971Z","level":"INFO","msg":"Resuming system monitor"}
17
  {"time":"2024-11-27T18:46:20.059842369Z","level":"INFO","msg":"Pausing system monitor"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
15
  {"time":"2024-11-27T18:41:10.596026715Z","level":"INFO","msg":"Pausing system monitor"}
16
  {"time":"2024-11-27T18:41:10.864229971Z","level":"INFO","msg":"Resuming system monitor"}
17
  {"time":"2024-11-27T18:46:20.059842369Z","level":"INFO","msg":"Pausing system monitor"}
18
+ {"time":"2024-11-27T18:46:25.045944442Z","level":"INFO","msg":"Resuming system monitor"}
19
+ {"time":"2024-11-27T18:46:25.048772709Z","level":"INFO","msg":"Pausing system monitor"}
20
+ {"time":"2024-11-27T18:46:25.369840673Z","level":"INFO","msg":"Resuming system monitor"}
21
+ {"time":"2024-11-27T18:46:25.551999838Z","level":"INFO","msg":"Pausing system monitor"}
22
+ {"time":"2024-11-27T18:46:25.956088136Z","level":"INFO","msg":"Resuming system monitor"}
23
+ {"time":"2024-11-27T18:46:28.327308539Z","level":"INFO","msg":"Pausing system monitor"}
24
+ {"time":"2024-11-27T18:46:59.940516874Z","level":"INFO","msg":"stream: closing","id":"b3av6kjn"}
25
+ {"time":"2024-11-27T18:46:59.940566248Z","level":"INFO","msg":"Stopping system monitor"}
26
+ {"time":"2024-11-27T18:46:59.941409519Z","level":"INFO","msg":"Stopped system monitor"}
27
+ {"time":"2024-11-27T18:47:00.163412552Z","level":"WARN","msg":"No job ingredients found, not creating job artifact"}
28
+ {"time":"2024-11-27T18:47:00.163440799Z","level":"WARN","msg":"No source type found, not creating job artifact"}
29
+ {"time":"2024-11-27T18:47:00.163450516Z","level":"INFO","msg":"sender: sendDefer: no job artifact to save"}
30
+ {"time":"2024-11-27T18:47:00.404989002Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
31
+ {"time":"2024-11-27T18:47:00.51432732Z","level":"INFO","msg":"handler: closed","stream_id":"b3av6kjn"}
32
+ {"time":"2024-11-27T18:47:00.514390088Z","level":"INFO","msg":"sender: closed","stream_id":"b3av6kjn"}
33
+ {"time":"2024-11-27T18:47:00.514385813Z","level":"INFO","msg":"writer: Close: closed","stream_id":"b3av6kjn"}
34
+ {"time":"2024-11-27T18:47:00.514498408Z","level":"INFO","msg":"stream: closed","id":"b3av6kjn"}
wandb/run-20241127_184106-b3av6kjn/logs/debug.log CHANGED
@@ -42,3 +42,16 @@ config: {'batch_size': 4, 'learning_rate': 0.0003, 'num_epochs': 10}
42
  2024-11-27 18:41:11,258 INFO MainThread:1986 [wandb_run.py:_config_callback():1387] config_cb model/num_parameters 41501895 None
43
  2024-11-27 18:46:20,059 INFO MainThread:1986 [jupyter.py:save_ipynb():387] not saving jupyter notebook
44
  2024-11-27 18:46:20,059 INFO MainThread:1986 [wandb_init.py:_pause_backend():444] pausing backend
 
 
 
 
 
 
 
 
 
 
 
 
 
 
42
  2024-11-27 18:41:11,258 INFO MainThread:1986 [wandb_run.py:_config_callback():1387] config_cb model/num_parameters 41501895 None
43
  2024-11-27 18:46:20,059 INFO MainThread:1986 [jupyter.py:save_ipynb():387] not saving jupyter notebook
44
  2024-11-27 18:46:20,059 INFO MainThread:1986 [wandb_init.py:_pause_backend():444] pausing backend
45
+ 2024-11-27 18:46:25,045 INFO MainThread:1986 [wandb_init.py:_resume_backend():449] resuming backend
46
+ 2024-11-27 18:46:25,048 INFO MainThread:1986 [jupyter.py:save_ipynb():387] not saving jupyter notebook
47
+ 2024-11-27 18:46:25,048 INFO MainThread:1986 [wandb_init.py:_pause_backend():444] pausing backend
48
+ 2024-11-27 18:46:25,369 INFO MainThread:1986 [wandb_init.py:_resume_backend():449] resuming backend
49
+ 2024-11-27 18:46:25,551 INFO MainThread:1986 [jupyter.py:save_ipynb():387] not saving jupyter notebook
50
+ 2024-11-27 18:46:25,551 INFO MainThread:1986 [wandb_init.py:_pause_backend():444] pausing backend
51
+ 2024-11-27 18:46:25,955 INFO MainThread:1986 [wandb_init.py:_resume_backend():449] resuming backend
52
+ 2024-11-27 18:46:26,472 INFO MainThread:1986 [wandb_run.py:_config_callback():1387] config_cb None None {'use_timm_backbone': True, 'backbone_config': None, 'num_channels': 3, 'num_queries': 100, 'd_model': 256, 'encoder_ffn_dim': 2048, 'encoder_layers': 6, 'encoder_attention_heads': 8, 'decoder_ffn_dim': 2048, 'decoder_layers': 6, 'decoder_attention_heads': 8, 'dropout': 0.1, 'attention_dropout': 0.0, 'activation_dropout': 0.0, 'activation_function': 'relu', 'init_std': 0.02, 'init_xavier_std': 1.0, 'encoder_layerdrop': 0.0, 'decoder_layerdrop': 0.0, 'num_hidden_layers': 6, 'auxiliary_loss': False, 'position_embedding_type': 'sine', 'backbone': 'resnet50', 'use_pretrained_backbone': True, 'backbone_kwargs': {'output_stride': 16, 'out_indices': [1, 2, 3, 4], 'in_chans': 3}, 'dilation': True, 'class_cost': 1, 'bbox_cost': 5, 'giou_cost': 2, 'mask_loss_coefficient': 1, 'dice_loss_coefficient': 1, 'bbox_loss_coefficient': 5, 'giou_loss_coefficient': 2, 'eos_coefficient': 0.1, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': 'float32', 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': True, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['DetrForObjectDetection'], 'finetuning_task': None, 'id2label': {0: 'object', 1: 'balloon'}, 'label2id': {'object': 0, 'balloon': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/detr-resnet-50-dc5', '_attn_implementation_autoset': False, 'transformers_version': '4.46.3', 'classifier_dropout': 0.0, 'max_position_embeddings': 1024, 'model_type': 'detr', 'scale_embedding': False, 'output_dir': '.', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.0001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': 250, 'lr_scheduler_type': 'linear', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.0, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': './runs/Nov27_18-46-25_f5b68522d064', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 10, 'save_total_limit': 2, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': 10, 'dataloader_num_workers': 0, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '.', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'evaluation_strategy': 'steps', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': True, 'eval_on_start': False, 'use_liger_kernel': False, 'eval_use_gather_object': False, 'average_tokens_across_devices': False}
53
+ 2024-11-27 18:46:26,477 INFO MainThread:1986 [wandb_config.py:__setitem__():154] config set model/num_parameters = 41501895 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7caab878e680>>
54
+ 2024-11-27 18:46:26,478 INFO MainThread:1986 [wandb_run.py:_config_callback():1387] config_cb model/num_parameters 41501895 None
55
+ 2024-11-27 18:46:28,326 INFO MainThread:1986 [jupyter.py:save_ipynb():387] not saving jupyter notebook
56
+ 2024-11-27 18:46:28,326 INFO MainThread:1986 [wandb_init.py:_pause_backend():444] pausing backend
57
+ 2024-11-27 18:46:59,941 WARNING MsgRouterThr:1986 [router.py:message_loop():75] message_loop has been closed
wandb/run-20241127_184106-b3av6kjn/run-b3av6kjn.wandb CHANGED
Binary files a/wandb/run-20241127_184106-b3av6kjn/run-b3av6kjn.wandb and b/wandb/run-20241127_184106-b3av6kjn/run-b3av6kjn.wandb differ
 
wandb/run-20241127_184914-lig8s4o3/files/output.log ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ /opt/conda/lib/python3.10/site-packages/transformers/training_args.py:1568: FutureWarning: `evaluation_strategy` is deprecated and will be removed in version 4.46 of 🤗 Transformers. Use `eval_strategy` instead
2
+ warnings.warn(
3
+ /tmp/ipykernel_2090/2368586458.py:28: FutureWarning: `tokenizer` is deprecated and will be removed in version 5.0.0 for `Trainer.__init__`. Use `processing_class` instead.
4
+ trainer = Trainer(
5
+ /opt/conda/lib/python3.10/site-packages/accelerate/accelerator.py:494: FutureWarning: `torch.cuda.amp.GradScaler(args...)` is deprecated. Please use `torch.amp.GradScaler('cuda', args...)` instead.
6
+ self.scaler = torch.cuda.amp.GradScaler(**kwargs)
7
+ max_steps is given, it will override any value given in num_train_epochs
8
+ wandb: WARNING The `run_name` is currently set to the same value as `TrainingArguments.output_dir`. If this was not intended, please specify a different run name by setting the `TrainingArguments.run_name` parameter.
wandb/run-20241127_184914-lig8s4o3/files/requirements.txt ADDED
@@ -0,0 +1,791 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ brotlipy==0.7.0
2
+ PySocks==1.7.1
3
+ conda-content-trust==0+unknown
4
+ six==1.16.0
5
+ ruamel-yaml-conda==0.15.100
6
+ evaluate==0.4.3
7
+ wandb==0.18.7
8
+ simsimd==6.2.1
9
+ transformers==4.46.3
10
+ datasets==3.1.0
11
+ timm==1.0.11
12
+ torchmetrics==1.6.0
13
+ pycocotools==2.0.8
14
+ stringzilla==3.10.10
15
+ matplotlib==3.9.2
16
+ albumentations==1.4.21
17
+ albucore==0.0.20
18
+ jupyter-lsp==1.5.1
19
+ packaging==21.3
20
+ jupyter_server==2.12.5
21
+ Wand==0.6.13
22
+ pytesseract==0.3.13
23
+ pypdf==5.0.1
24
+ pdf2image==1.17.0
25
+ kaggle-environments==1.14.15
26
+ safetensors==0.4.5
27
+ py-cpuinfo==9.0.0
28
+ qgrid==1.3.1
29
+ woodwork==0.31.0
30
+ gcsfs==2024.6.1
31
+ google-auth-httplib2==0.2.0
32
+ onnx==1.17.0
33
+ pytorch-ignite==0.5.1
34
+ MarkupSafe==2.1.5
35
+ sentry-sdk==2.15.0
36
+ torchinfo==1.8.0
37
+ ndindex==1.9.2
38
+ learntools==0.3.4
39
+ s3fs==2024.6.1
40
+ eval_type_backport==0.2.0
41
+ aiobotocore==2.15.1
42
+ featuretools==1.31.0
43
+ plotly-express==0.4.1
44
+ aiohttp==3.9.5
45
+ easyocr==1.7.2
46
+ slicer==0.0.7
47
+ pyemd==1.0.0
48
+ tsfresh==0.20.3
49
+ vec_noise==1.1.4
50
+ pandasql==0.7.3
51
+ setproctitle==1.3.3
52
+ multiprocess==0.70.16
53
+ opencv-python-headless==4.10.0.84
54
+ gymnasium==0.29.0
55
+ openpyxl==3.1.5
56
+ cesium==0.12.3
57
+ shap==0.44.1
58
+ watchdog==5.0.3
59
+ google-api-python-client==2.147.0
60
+ ghapi==1.0.6
61
+ jieba==0.42.1
62
+ alembic==1.13.3
63
+ docker-pycreds==0.4.0
64
+ scipy==1.14.1
65
+ blinker==1.8.2
66
+ nbdev==2.3.31
67
+ bqplot==0.12.43
68
+ pydub==0.25.1
69
+ python-bidi==0.6.0
70
+ pycryptodome==3.20.0
71
+ tables==3.10.1
72
+ ninja==1.11.1.1
73
+ tokenizers==0.20.0
74
+ pydegensac==0.1.2
75
+ pyclipper==1.3.0.post5
76
+ blosc2==2.7.1
77
+ PyArabic==0.6.15
78
+ fastai==2.7.17
79
+ gym-notices==0.0.8
80
+ itsdangerous==2.2.0
81
+ numpy==1.26.4
82
+ Werkzeug==3.0.4
83
+ traittypes==0.2.1
84
+ optuna==4.0.0
85
+ Pympler==1.1
86
+ scikit-learn==1.2.2
87
+ numba==0.60.0
88
+ pytorch-lightning==2.4.0
89
+ colorlog==6.8.2
90
+ gym==0.26.2
91
+ execnb==0.1.6
92
+ llvmlite==0.43.0
93
+ llvmlite==0.43.0
94
+ earthengine-api==1.1.2
95
+ pettingzoo==1.24.0
96
+ segment_anything==1.0
97
+ aioitertools==0.12.0
98
+ rgf-python==3.12.0
99
+ Flask==3.0.3
100
+ stable-baselines3==2.1.0
101
+ lightning-utilities==0.11.7
102
+ huggingface-hub==0.25.1
103
+ et-xmlfile==1.1.0
104
+ accelerate==0.34.2
105
+ Shapely==1.8.5.post1
106
+ shapely==2.0.6
107
+ Shimmy==1.3.0
108
+ stumpy==1.13.0
109
+ Rtree==1.3.0
110
+ fsspec==2024.6.1
111
+ fsspec==2024.9.0
112
+ fastcore==1.7.10
113
+ fastdownload==0.0.7
114
+ gatspy==0.3
115
+ botocore==1.35.23
116
+ dill==0.3.8
117
+ google-cloud-bigquery==2.34.4
118
+ google-cloud-videointelligence==2.13.5
119
+ google-api-core==2.11.1
120
+ google-api-core==2.20.0
121
+ google-cloud-aiplatform==0.6.0a1
122
+ google-cloud-monitoring==2.21.0
123
+ google-auth==2.30.0
124
+ google-cloud-automl==1.0.1
125
+ google-cloud-storage==1.44.0
126
+ googleapis-common-protos==1.63.1
127
+ google-cloud-translate==3.12.1
128
+ google-cloud-core==2.4.1
129
+ google-generativeai==0.8.2
130
+ google-cloud-vision==2.8.0
131
+ google-cloud-datastore==2.20.1
132
+ google-cloud-artifact-registry==1.11.3
133
+ google-cloud-language==2.14.0
134
+ en-core-web-sm==3.7.1
135
+ en-core-web-lg==3.7.1
136
+ docstring-to-markdown==0.15
137
+ jupyterlab-lsp==5.1.0
138
+ traceml==1.0.8
139
+ qtconsole==5.6.0
140
+ ipywidgets==7.7.1
141
+ pytoolconfig==1.3.1
142
+ rope==1.13.0
143
+ async-lru==2.0.4
144
+ datatile==1.0.3
145
+ pydocstyle==6.3.0
146
+ QtPy==2.4.1
147
+ isort==5.13.2
148
+ tomlkit==0.13.2
149
+ olefile==0.47
150
+ mccabe==0.7.0
151
+ pylint==3.3.1
152
+ jupyter-console==6.6.3
153
+ astroid==3.3.4
154
+ yapf==0.40.2
155
+ jupyterlab==4.2.5
156
+ flake8==7.1.1
157
+ whatthepatch==1.0.6
158
+ pyflakes==3.2.0
159
+ pandas-summary==0.2.0
160
+ nbconvert==6.4.5
161
+ testpath==0.6.0
162
+ nbclient==0.5.13
163
+ python-lsp-server==1.12.0
164
+ kornia==0.7.3
165
+ snowballstemmer==2.2.0
166
+ python-lsp-jsonrpc==1.1.2
167
+ autopep8==2.0.4
168
+ pycodestyle==2.12.1
169
+ isoweek==1.3.3
170
+ widgetsnbextension==3.6.9
171
+ kornia_rs==0.1.5
172
+ mistune==0.8.4
173
+ openslide-python==1.3.1
174
+ html5lib==1.1
175
+ ppft==1.7.6.9
176
+ pathos==0.3.3
177
+ pox==0.3.5
178
+ pandas-datareader==0.10.0
179
+ category-encoders==2.6.4
180
+ mlcrate==0.2.0
181
+ Janome==0.5.0
182
+ annoy==1.17.3
183
+ yellowbrick==1.5
184
+ emoji==2.13.2
185
+ librosa==0.10.2.post1
186
+ soxr==0.5.0.post1
187
+ memory-profiler==0.61.0
188
+ sentencepiece==0.2.0
189
+ audioread==3.0.1
190
+ cufflinks==0.17.3
191
+ soundfile==0.12.1
192
+ lime==0.2.0.1
193
+ colorlover==0.3.0
194
+ CVXcanon==0.1.2
195
+ sklearn-pandas==2.2.0
196
+ scikit-multilearn==0.2.0
197
+ path==17.0.0
198
+ odfpy==1.4.1
199
+ mpld3==0.5.10
200
+ kaggle==1.6.17
201
+ narwhals==1.9.0
202
+ fury==0.11.0
203
+ xarray-einstats==0.8.0
204
+ scikit-surprise==1.1.4
205
+ ydata-profiling==4.10.0
206
+ panel==1.5.1
207
+ plotnine==0.13.6
208
+ py4j==0.10.9.7
209
+ fuzzywuzzy==0.18.0
210
+ fastprogress==1.0.3
211
+ update-checker==0.18.0
212
+ missingno==0.5.2
213
+ catboost==1.2.7
214
+ pyexcel-io==0.6.6
215
+ stopit==1.1.2
216
+ arviz==0.20.0
217
+ branca==0.8.0
218
+ mizani==0.11.4
219
+ nltk==3.2.4
220
+ semver==3.0.2
221
+ SimpleITK==2.4.0
222
+ TPOT==0.12.1
223
+ nibabel==5.2.1
224
+ folium==0.17.0
225
+ gpxpy==1.6.2
226
+ bayesian-optimization==1.5.1
227
+ hyperopt==0.2.7
228
+ python-louvain==0.16
229
+ orderly-set==5.2.2
230
+ typing-inspect==0.9.0
231
+ ecos==2.0.14
232
+ lxml==5.3.0
233
+ trx-python==0.3
234
+ iniconfig==2.0.0
235
+ leven==1.0.4
236
+ path.py==12.5.0
237
+ pymc3==3.11.4
238
+ wavio==0.0.9
239
+ lml==0.1.0
240
+ deap==1.4.1
241
+ marshmallow==3.22.0
242
+ pygltflib==1.16.2
243
+ numexpr==2.10.1
244
+ pyLDAvis==3.4.1
245
+ python-slugify==8.0.4
246
+ pydantic==2.9.2
247
+ langid==1.1.6
248
+ setuptools-scm==8.1.0
249
+ geojson==3.1.0
250
+ scikit-plot==0.3.7
251
+ holidays==0.57
252
+ nose==1.3.7
253
+ pytest==8.3.3
254
+ google-ai-generativelanguage==0.6.10
255
+ text-unidecode==1.3
256
+ Theano-PyMC==1.1.2
257
+ dipy==1.9.0
258
+ h5netcdf==1.3.0
259
+ funcy==2.0
260
+ holoviews==1.19.1
261
+ stanio==0.5.1
262
+ squarify==0.4.4
263
+ mlxtend==0.23.1
264
+ future==1.0.0
265
+ dataclasses-json==0.6.7
266
+ prophet==1.1.5
267
+ imgaug==0.4.0
268
+ nilearn==0.10.4
269
+ deepdiff==8.0.1
270
+ eli5==0.13.0
271
+ pyviz_comms==3.0.3
272
+ pydicom==3.0.1
273
+ mypy-extensions==1.0.0
274
+ haversine==2.8.1
275
+ sphinx-rtd-theme==0.2.4
276
+ altair==5.4.1
277
+ cmdstanpy==1.2.4
278
+ pyexcel-ods==0.6.0
279
+ preprocessing==0.1.13
280
+ matplotlib-venn==1.1.1
281
+ pyaml==24.9.0
282
+ scikit-optimize==0.10.2
283
+ vtk==9.3.1
284
+ xvfbwrapper==0.2.9
285
+ urwid_readline==0.15.1
286
+ scikit-learn-intelex==2024.7.0
287
+ Boruta==0.4.3
288
+ pybind11==2.13.6
289
+ line_profiler==4.1.3
290
+ datashader==0.16.3
291
+ fasttext==0.9.3
292
+ s3transfer==0.6.2
293
+ param==2.1.1
294
+ pudb==2024.1.2
295
+ jmespath==1.0.1
296
+ xarray==2024.9.0
297
+ colorcet==3.1.0
298
+ urwid==2.6.15
299
+ boto3==1.26.100
300
+ imbalanced-learn==0.12.3
301
+ daal4py==2024.7.0
302
+ daal==2024.7.0
303
+ libpysal==4.9.2
304
+ pyct==0.5.0
305
+ tbb==2021.13.1
306
+ gensim==4.3.3
307
+ textblob==0.18.0.post0
308
+ xgboost==2.0.3
309
+ opencv-python==4.10.0.84
310
+ Theano==1.0.5
311
+ hep-ml==0.7.2
312
+ opencv-contrib-python==4.10.0.84
313
+ kagglehub==0.3.1
314
+ keras-core==0.1.7
315
+ keras-nlp==0.15.1
316
+ tensorflow_decision_forests==1.9.1
317
+ wurlitzer==3.1.1
318
+ tensorflow-text==2.16.1
319
+ ydf==0.8.0
320
+ keras-cv==0.9.0
321
+ h2o==3.46.0.5
322
+ polars==1.9.0
323
+ pooch==1.8.2
324
+ igraph==0.11.6
325
+ optax==0.2.2
326
+ orbax-checkpoint==0.6.4
327
+ flax==0.8.4
328
+ chex==0.1.86
329
+ tensorstore==0.1.66
330
+ dask-expr==1.1.15
331
+ python-dateutil==2.9.0.post0
332
+ geographiclib==2.0
333
+ PyUpSet==0.1.1.post7
334
+ pandas==2.2.3
335
+ pandas==2.2.2
336
+ cloudpickle==3.0.0
337
+ ipympl==0.7.0
338
+ PyYAML==6.0.2
339
+ texttable==1.7.0
340
+ geopy==2.4.1
341
+ dask==2024.9.1
342
+ mne==1.8.0
343
+ pynvrtc==9.2
344
+ pycuda==2024.1.2
345
+ pytools==2024.1.14
346
+ Mako==1.3.5
347
+ jaxlib==0.4.26.dev20240620
348
+ jax==0.4.26
349
+ lightgbm==4.2.0
350
+ torchaudio==2.4.0
351
+ torch==2.4.0
352
+ mpmath==1.3.0
353
+ sympy==1.13.3
354
+ torchvision==0.19.0
355
+ pynvml==11.4.1
356
+ annotated-types==0.7.0
357
+ srsly==2.4.8
358
+ catalogue==2.0.10
359
+ partd==1.4.2
360
+ langcodes==3.4.1
361
+ preshed==3.0.9
362
+ pytz==2024.2
363
+ pytz==2024.1
364
+ pynvjitlink-cu12==0.3.0
365
+ spacy-legacy==3.0.12
366
+ spacy==3.7.6
367
+ murmurhash==1.0.10
368
+ thinc==8.2.5
369
+ language_data==1.2.0
370
+ blis==0.7.10
371
+ pydantic_core==2.23.4
372
+ grpcio==1.62.2
373
+ grpcio==1.64.1
374
+ raft-dask==24.8.1
375
+ msgpack==1.1.0
376
+ msgpack==1.0.8
377
+ distributed==2024.7.1
378
+ wrapt==1.16.0
379
+ pylibraft==24.8.1
380
+ cymem==2.0.8
381
+ nvtx==0.2.10
382
+ spacy-loggers==1.0.5
383
+ wasabi==1.1.2
384
+ pyarrow==16.1.0
385
+ cupy==13.3.0
386
+ zict==3.0.0
387
+ bokeh==3.5.2
388
+ dask-cudf==24.8.3
389
+ treelite==4.3.0
390
+ xyzservices==2024.9.0
391
+ cuml==24.8.0
392
+ shellingham==1.5.4
393
+ proto-plus==1.23.0
394
+ locket==1.0.0
395
+ tzdata==2024.2
396
+ tzdata==2024.1
397
+ typer-slim==0.12.5
398
+ pyarrow-hotfix==0.6
399
+ toolz==0.12.1
400
+ rapids-dask-dependency==24.8.0a0
401
+ rmm==24.8.2
402
+ markdown-it-py==3.0.0
403
+ fastrlock==0.8.2
404
+ mdurl==0.1.2
405
+ weasel==0.4.1
406
+ rich==13.9.1
407
+ rich==13.7.1
408
+ cudf==24.8.3
409
+ confection==0.1.4
410
+ tblib==3.0.0
411
+ joblib==1.4.2
412
+ cuda-python==12.6.0
413
+ typer==0.12.5
414
+ typer==0.12.3
415
+ marisa-trie==1.1.0
416
+ distributed-ucxx==0.39.1
417
+ cloudpathlib==0.19.0
418
+ ucx-py==0.39.2
419
+ cytoolz==0.12.3
420
+ smart_open==7.0.4
421
+ click==8.1.7
422
+ dask-cuda==24.8.2
423
+ protobuf==4.25.3
424
+ protobuf==3.20.3
425
+ ucxx==0.39.1
426
+ sortedcontainers==2.4.0
427
+ lz4==4.3.3
428
+ pyparsing==3.1.4
429
+ pyparsing==3.1.2
430
+ zstandard==0.23.0
431
+ unicodedata2==15.1.0
432
+ fonttools==4.54.1
433
+ fonttools==4.53.0
434
+ pyshp==2.3.1
435
+ pillow==10.4.0
436
+ pillow==10.3.0
437
+ cycler==0.12.1
438
+ conda==24.9.0
439
+ certifi==2024.8.30
440
+ pyproj==3.7.0
441
+ pyproj==3.6.1
442
+ libmambapy==1.5.10
443
+ Cartopy==0.23.0
444
+ contourpy==1.3.0
445
+ contourpy==1.2.1
446
+ munkres==1.1.4
447
+ kiwisolver==1.4.7
448
+ kiwisolver==1.4.5
449
+ mamba==1.5.10
450
+ conda-libmamba-solver==23.12.0
451
+ graphviz==0.20.3
452
+ pycparser==2.22
453
+ nbdime==3.2.0
454
+ astunparse==1.6.3
455
+ fastapi-cli==0.0.4
456
+ jsonschema-specifications==2023.12.1
457
+ pandocfilters==1.5.0
458
+ opentelemetry-exporter-otlp==1.25.0
459
+ libclang==18.1.1
460
+ h11==0.14.0
461
+ grpc-google-iam-v1==0.12.7
462
+ rpds-py==0.18.1
463
+ jupyterlab_pygments==0.3.0
464
+ tensorflow-hub==0.16.1
465
+ cryptography==42.0.8
466
+ requests-oauthlib==2.0.0
467
+ pydata-google-auth==1.8.2
468
+ overrides==7.7.0
469
+ ipython-genutils==0.2.0
470
+ y-py==0.6.2
471
+ opentelemetry-proto==1.25.0
472
+ greenlet==3.0.3
473
+ nvidia-ml-py==11.495.46
474
+ tensorflow==2.16.1
475
+ PyJWT==2.8.0
476
+ time-machine==2.14.1
477
+ Cython==3.0.10
478
+ tensorflow-probability==0.24.0
479
+ click-plugins==1.1.1
480
+ google-cloud-pubsub==2.21.3
481
+ jupyter_core==5.7.2
482
+ webcolors==24.6.0
483
+ jupyterlab_server==2.27.2
484
+ grpcio-status==1.48.0
485
+ grpcio-status==1.48.2
486
+ fqdn==1.5.1
487
+ jeepney==0.8.0
488
+ google-cloud-recommendations-ai==0.7.1
489
+ httptools==0.6.1
490
+ ipython-sql==0.5.0
491
+ toml==0.10.2
492
+ ipykernel==6.29.4
493
+ tensorboardX==2.6.2.2
494
+ objsize==0.6.1
495
+ patsy==0.5.6
496
+ immutabledict==4.2.0
497
+ Jinja2==3.1.4
498
+ requests-toolbelt==0.10.1
499
+ statsmodels==0.14.2
500
+ tenacity==8.3.0
501
+ platformdirs==3.11.0
502
+ platformdirs==4.2.2
503
+ google-cloud-iam==2.15.0
504
+ typeguard==4.3.0
505
+ jupyter_server_terminals==0.5.3
506
+ httpcore==1.0.5
507
+ ipython==8.21.0
508
+ ipython==8.25.0
509
+ google-cloud-resource-manager==1.12.3
510
+ tensorflow-estimator==2.15.0
511
+ idna==3.7
512
+ pandas-profiling==3.6.6
513
+ tensorflow-cloud==0.1.16
514
+ distlib==0.3.8
515
+ lazy_loader==0.4
516
+ termcolor==2.4.0
517
+ tensorflow-datasets==4.9.6
518
+ importlib_resources==6.4.0
519
+ opentelemetry-exporter-otlp-proto-grpc==1.25.0
520
+ jupyter-ydoc==0.2.5
521
+ aiofiles==22.1.0
522
+ wordcloud==1.9.3
523
+ opencensus==0.11.4
524
+ jupyterlab_git==0.44.0
525
+ truststore==0.8.0
526
+ linkify-it-py==2.0.3
527
+ isoduration==20.11.0
528
+ google-cloud-bigquery-connection==1.15.3
529
+ setuptools==70.0.0
530
+ opentelemetry-semantic-conventions==0.46b0
531
+ cffi==1.16.0
532
+ pure-eval==0.2.2
533
+ webencodings==0.5.1
534
+ orjson==3.10.4
535
+ wheel==0.43.0
536
+ multidict==6.0.5
537
+ starlette==0.37.2
538
+ ml-dtypes==0.3.2
539
+ Deprecated==1.2.14
540
+ ImageHash==4.3.1
541
+ parso==0.8.4
542
+ psutil==5.9.3
543
+ psutil==5.9.8
544
+ stack-data==0.6.2
545
+ stack-data==0.6.3
546
+ virtualenv==20.21.0
547
+ entrypoints==0.4
548
+ opentelemetry-api==1.25.0
549
+ GitPython==3.1.43
550
+ oauthlib==3.2.2
551
+ jupyter_server_fileid==0.9.2
552
+ smmap==5.0.1
553
+ tensorflow-serving-api==2.16.1
554
+ kernels-mixer==0.0.13
555
+ jedi==0.19.1
556
+ argon2-cffi-bindings==21.2.0
557
+ namex==0.0.8
558
+ textual==0.67.1
559
+ h5py==3.11.0
560
+ pip==24.0
561
+ argon2-cffi==23.1.0
562
+ attrs==23.2.0
563
+ uri-template==1.3.0
564
+ multimethod==1.11.2
565
+ zipp==3.19.2
566
+ menuinst==2.1.1
567
+ pydot==1.4.2
568
+ defusedxml==0.7.1
569
+ decorator==5.1.1
570
+ fastjsonschema==2.19.1
571
+ asttokens==2.4.1
572
+ uvloop==0.19.0
573
+ Markdown==3.6
574
+ google-pasta==0.2.0
575
+ tensorboard_plugin_profile==2.15.1
576
+ parsy==2.1
577
+ google-cloud-jupyter-config==0.0.10
578
+ absl-py==1.4.0
579
+ prometheus_client==0.20.0
580
+ opt-einsum==3.3.0
581
+ charset-normalizer==3.3.2
582
+ kfp-server-api==2.0.5
583
+ ray-cpp==2.24.0
584
+ kfp-pipeline-spec==0.2.2
585
+ appdirs==1.4.4
586
+ google-resumable-media==2.7.1
587
+ pluggy==1.5.0
588
+ fiona==1.9.6
589
+ simpervisor==1.0.0
590
+ pkgutil_resolve_name==1.3.10
591
+ sqlparse==0.5.0
592
+ filelock==3.15.1
593
+ papermill==2.6.0
594
+ blessed==1.20.0
595
+ executing==2.0.1
596
+ watchfiles==0.22.0
597
+ colorful==0.5.6
598
+ wcwidth==0.2.13
599
+ async-timeout==4.0.3
600
+ debugpy==1.8.1
601
+ pexpect==4.9.0
602
+ ptyprocess==0.7.0
603
+ google-cloud-bigtable==1.7.3
604
+ keras==3.3.3
605
+ archspec==0.2.3
606
+ nbformat==5.10.4
607
+ pins==0.8.6
608
+ gast==0.5.4
609
+ opencensus-context==0.1.3
610
+ nest-asyncio==1.6.0
611
+ ypy-websocket==0.8.4
612
+ notebook==6.5.7
613
+ exceptiongroup==1.2.0
614
+ ansicolors==1.1.8
615
+ multipledispatch==1.0.0
616
+ hdfs==2.7.3
617
+ jupyterlab_widgets==3.0.11
618
+ Babel==2.15.0
619
+ simple_parsing==0.1.5
620
+ dacite==1.8.1
621
+ cligj==0.7.2
622
+ fastavro==1.9.4
623
+ tifffile==2024.5.22
624
+ python-json-logger==2.0.7
625
+ cachetools==5.3.3
626
+ cachetools==4.2.4
627
+ tornado==6.4.1
628
+ tangled-up-in-unicode==0.2.0
629
+ anyio==4.4.0
630
+ docstring_parser==0.16
631
+ pickleshare==0.7.5
632
+ sqlglot==19.9.0
633
+ bigframes==0.22.0
634
+ bleach==6.1.0
635
+ keyrings.google-artifactregistry-auth==1.1.2
636
+ tinycss2==1.3.0
637
+ cached-property==1.5.2
638
+ pymongo==3.13.0
639
+ atpublic==4.1.0
640
+ cloud-tpu-client==0.10
641
+ tensorflow-metadata==0.14.0
642
+ urllib3==1.26.18
643
+ urllib3==2.2.1
644
+ pyu2f==0.1.5
645
+ mdit-py-plugins==0.4.1
646
+ terminado==0.18.1
647
+ Brotli==1.1.0
648
+ grpc-interceptor==0.15.4
649
+ uvicorn==0.30.1
650
+ tensorflow-io-gcs-filesystem==0.37.0
651
+ nb_conda==2.2.1
652
+ httplib2==0.21.0
653
+ gpustat==1.0.0
654
+ yarl==1.9.4
655
+ importlib-metadata==7.0.0
656
+ httpx==0.27.0
657
+ distro==1.9.0
658
+ PyWavelets==1.6.0
659
+ jupyter_server_ydoc==0.8.0
660
+ pyasn1==0.6.0
661
+ phik==0.12.4
662
+ cloud-tpu-profiler==2.4.0
663
+ email_validator==2.1.1
664
+ keras-tuner==1.4.7
665
+ array_record==0.5.1
666
+ fasteners==0.19
667
+ colorama==0.4.6
668
+ matplotlib-inline==0.1.7
669
+ nb_conda_kernels==2.5.1
670
+ beautifulsoup4==4.12.3
671
+ apache-beam==2.46.0
672
+ tabulate==0.9.0
673
+ tomli==2.0.1
674
+ notebook_shim==0.2.4
675
+ kfp==2.5.0
676
+ jupyter-http-over-ws==0.0.8
677
+ jsonpatch==1.33
678
+ threadpoolctl==3.5.0
679
+ ujson==5.10.0
680
+ tensorboard==2.16.2
681
+ aiosqlite==0.20.0
682
+ jaraco.classes==3.4.0
683
+ soupsieve==2.5
684
+ visions==0.7.5
685
+ scikit-image==0.23.2
686
+ gitdb==4.0.11
687
+ pendulum==3.0.0
688
+ memray==1.12.0
689
+ notebook_executor==0.2
690
+ google-crc32c==1.5.0
691
+ frozendict==2.4.4
692
+ geopandas==0.14.4
693
+ jax-jumpy==1.0.0
694
+ optree==0.11.0
695
+ pyzmq==26.0.3
696
+ opentelemetry-exporter-otlp-proto-common==1.25.0
697
+ uc-micro-py==1.0.3
698
+ xxhash==3.4.1
699
+ pyasn1_modules==0.4.0
700
+ uritemplate==3.0.1
701
+ more-itertools==10.3.0
702
+ prettytable==3.10.0
703
+ promise==2.3
704
+ pycosat==0.6.6
705
+ google-auth-oauthlib==1.2.0
706
+ traitlets==5.14.3
707
+ conda_package_streaming==0.10.0
708
+ ruamel.yaml==0.18.6
709
+ google-cloud-spanner==3.47.0
710
+ rfc3986-validator==0.1.1
711
+ Send2Trash==1.8.3
712
+ prompt_toolkit==3.0.47
713
+ sniffio==1.3.1
714
+ keyring==25.2.1
715
+ referencing==0.35.1
716
+ google-cloud-dlp==3.18.0
717
+ conda-package-handling==2.3.0
718
+ websockets==12.0
719
+ flatbuffers==24.3.25
720
+ jupyter-server-mathjax==0.2.6
721
+ comm==0.2.2
722
+ opentelemetry-exporter-otlp-proto-http==1.25.0
723
+ websocket-client==1.8.0
724
+ requests==2.32.3
725
+ retrying==1.3.3
726
+ retrying==1.3.4
727
+ google-cloud-pubsublite==1.10.0
728
+ explainable-ai-sdk==1.3.3
729
+ jsonpointer==2.4
730
+ typing_extensions==4.12.2
731
+ backports.tarfile==1.2.0
732
+ dnspython==2.6.1
733
+ Farama-Notifications==0.0.4
734
+ opentelemetry-sdk==1.25.0
735
+ docopt==0.6.2
736
+ ibis-framework==7.1.0
737
+ jaraco.functools==4.0.1
738
+ gviz-api==1.10.0
739
+ frozenlist==1.4.1
740
+ google-apitools==0.5.31
741
+ python-multipart==0.0.9
742
+ SQLAlchemy==2.0.30
743
+ kubernetes==26.1.0
744
+ witwidget==1.8.1
745
+ docker==7.1.0
746
+ bidict==0.23.1
747
+ jupyter-events==0.10.0
748
+ beatrix_jupyterlab==2024.66.154055
749
+ imageio==2.34.1
750
+ arrow==1.3.0
751
+ nbclassic==1.1.0
752
+ tqdm==4.66.4
753
+ networkx==3.3
754
+ python-dotenv==1.0.1
755
+ tf_keras==2.16.0
756
+ oauth2client==4.1.3
757
+ kt-legacy==1.0.5
758
+ fastapi==0.111.0
759
+ db-dtypes==1.2.0
760
+ SecretStorage==3.3.3
761
+ seaborn==0.12.2
762
+ rfc3339-validator==0.1.4
763
+ tensorflow-io==0.37.0
764
+ typing-utils==0.1.0
765
+ jupytext==1.16.2
766
+ jsonschema==4.22.0
767
+ humanize==4.9.0
768
+ google-cloud-functions==1.16.3
769
+ jaraco.context==5.3.0
770
+ htmlmin==0.1.12
771
+ tensorflow-transform==0.14.0
772
+ jupyter_server_proxy==4.2.0
773
+ crcmod==1.7
774
+ boltons==24.0.0
775
+ ruamel.yaml.clib==0.2.8
776
+ jupyter_client==7.4.9
777
+ json5==0.9.25
778
+ tensorboard-data-server==0.7.2
779
+ aiosignal==1.3.1
780
+ types-python-dateutil==2.9.0.20240316
781
+ etils==1.7.0
782
+ plotly==5.22.0
783
+ regex==2024.5.15
784
+ dataproc_jupyter_plugin==0.1.79
785
+ pyOpenSSL==24.0.0
786
+ py-spy==0.3.14
787
+ dm-tree==0.1.8
788
+ ray==2.24.0
789
+ Pygments==2.18.0
790
+ rsa==4.9
791
+ bq_helper==0.4.1
wandb/run-20241127_184914-lig8s4o3/files/wandb-metadata.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-6.6.56+-x86_64-with-glibc2.35",
3
+ "python": "3.10.14",
4
+ "startedAt": "2024-11-27T18:49:14.421527Z",
5
+ "program": "kaggle.ipynb",
6
+ "email": "[email protected]",
7
+ "root": "/kaggle/working",
8
+ "host": "f5b68522d064",
9
+ "username": "root",
10
+ "executable": "/opt/conda/bin/python3.10",
11
+ "cpu_count": 2,
12
+ "cpu_count_logical": 4,
13
+ "gpu": "Tesla P100-PCIE-16GB",
14
+ "gpu_count": 1,
15
+ "disk": {
16
+ "/": {
17
+ "total": "8656922775552",
18
+ "used": "6372786524160"
19
+ }
20
+ },
21
+ "memory": {
22
+ "total": "33662345216"
23
+ },
24
+ "cpu": {
25
+ "count": 2,
26
+ "countLogical": 4
27
+ },
28
+ "gpu_nvidia": [
29
+ {
30
+ "name": "Tesla P100-PCIE-16GB",
31
+ "memoryTotal": "17179869184",
32
+ "cudaCores": 3584,
33
+ "architecture": "Pascal"
34
+ }
35
+ ],
36
+ "cudaVersion": "12.6"
37
+ }
wandb/run-20241127_184914-lig8s4o3/logs/debug-core.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2024-11-27T18:49:14.085017787Z","level":"INFO","msg":"started logging, with flags","port-filename":"/tmp/tmpz8pp5m4x/port-2090.txt","pid":2090,"debug":false,"disable-analytics":false}
2
+ {"time":"2024-11-27T18:49:14.085061409Z","level":"INFO","msg":"FeatureState","shutdownOnParentExitEnabled":false}
3
+ {"time":"2024-11-27T18:49:14.090284062Z","level":"INFO","msg":"Will exit if parent process dies.","ppid":2090}
4
+ {"time":"2024-11-27T18:49:14.090224801Z","level":"INFO","msg":"server is running","addr":{"IP":"127.0.0.1","Port":33757,"Zone":""}}
5
+ {"time":"2024-11-27T18:49:14.277241846Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"127.0.0.1:50102"}
6
+ {"time":"2024-11-27T18:49:14.4236435Z","level":"INFO","msg":"handleInformInit: received","streamId":"lig8s4o3","id":"127.0.0.1:50102"}
7
+ {"time":"2024-11-27T18:49:14.52717192Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"lig8s4o3","id":"127.0.0.1:50102"}
wandb/run-20241127_184914-lig8s4o3/logs/debug-internal.log ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2024-11-27T18:49:14.423820992Z","level":"INFO","msg":"using version","core version":"0.18.7"}
2
+ {"time":"2024-11-27T18:49:14.423845654Z","level":"INFO","msg":"created symlink","path":"/kaggle/working/wandb/run-20241127_184914-lig8s4o3/logs/debug-core.log"}
3
+ {"time":"2024-11-27T18:49:14.527132732Z","level":"INFO","msg":"created new stream","id":"lig8s4o3"}
4
+ {"time":"2024-11-27T18:49:14.527165937Z","level":"INFO","msg":"stream: started","id":"lig8s4o3"}
5
+ {"time":"2024-11-27T18:49:14.527203552Z","level":"INFO","msg":"writer: Do: started","stream_id":"lig8s4o3"}
6
+ {"time":"2024-11-27T18:49:14.527212524Z","level":"INFO","msg":"handler: started","stream_id":"lig8s4o3"}
7
+ {"time":"2024-11-27T18:49:14.527250309Z","level":"INFO","msg":"sender: started","stream_id":"lig8s4o3"}
8
+ {"time":"2024-11-27T18:49:16.008654965Z","level":"INFO","msg":"Starting system monitor"}
9
+ {"time":"2024-11-27T18:49:16.637945267Z","level":"INFO","msg":"Pausing system monitor"}
10
+ {"time":"2024-11-27T18:49:16.638015431Z","level":"INFO","msg":"Resuming system monitor"}
11
+ {"time":"2024-11-27T18:49:16.638022617Z","level":"INFO","msg":"Pausing system monitor"}
12
+ {"time":"2024-11-27T18:49:16.638027426Z","level":"INFO","msg":"Resuming system monitor"}
13
+ {"time":"2024-11-27T18:49:16.638031951Z","level":"INFO","msg":"Pausing system monitor"}
14
+ {"time":"2024-11-27T18:49:16.641816205Z","level":"INFO","msg":"Resuming system monitor"}
15
+ {"time":"2024-11-27T18:49:17.996060396Z","level":"INFO","msg":"Pausing system monitor"}
16
+ {"time":"2024-11-27T18:49:18.259742288Z","level":"INFO","msg":"Resuming system monitor"}
wandb/run-20241127_184914-lig8s4o3/logs/debug.log ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Current SDK version is 0.18.7
2
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Configure stats pid to 2090
3
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Loading settings from /root/.config/wandb/settings
4
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Loading settings from /kaggle/working/wandb/settings
5
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Loading settings from environment variables: {}
6
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Applying setup settings: {'mode': None, '_disable_service': None}
7
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Inferring run settings from compute environment: {'program': '<python with no main file>'}
8
+ 2024-11-27 18:49:14,418 INFO MainThread:2090 [wandb_setup.py:_flush():79] Applying login settings: {}
9
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:_log_setup():533] Logging user logs to /kaggle/working/wandb/run-20241127_184914-lig8s4o3/logs/debug.log
10
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:_log_setup():534] Logging internal logs to /kaggle/working/wandb/run-20241127_184914-lig8s4o3/logs/debug-internal.log
11
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:_jupyter_setup():479] configuring jupyter hooks <wandb.sdk.wandb_init._WandbInit object at 0x7f50757af550>
12
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:init():619] calling init triggers
13
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:init():626] wandb.init called with sweep_config: {}
14
+ config: {'batch_size': 4, 'learning_rate': 0.0003, 'num_epochs': 10}
15
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:init():669] starting backend
16
+ 2024-11-27 18:49:14,419 INFO MainThread:2090 [wandb_init.py:init():673] sending inform_init request
17
+ 2024-11-27 18:49:14,420 INFO MainThread:2090 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
+ 2024-11-27 18:49:14,421 INFO MainThread:2090 [wandb_init.py:init():686] backend started and connected
19
+ 2024-11-27 18:49:14,433 INFO MainThread:2090 [wandb_run.py:_label_probe_notebook():1339] probe notebook
20
+ 2024-11-27 18:49:15,672 INFO MainThread:2090 [wandb_init.py:init():781] updated telemetry
21
+ 2024-11-27 18:49:15,675 INFO MainThread:2090 [wandb_init.py:init():814] communicating run to backend with 90.0 second timeout
22
+ 2024-11-27 18:49:16,004 INFO MainThread:2090 [wandb_init.py:init():867] starting run threads in backend
23
+ 2024-11-27 18:49:16,599 INFO MainThread:2090 [wandb_run.py:_console_start():2456] atexit reg
24
+ 2024-11-27 18:49:16,599 INFO MainThread:2090 [wandb_run.py:_redirect():2305] redirect: wrap_raw
25
+ 2024-11-27 18:49:16,599 INFO MainThread:2090 [wandb_run.py:_redirect():2370] Wrapping output streams.
26
+ 2024-11-27 18:49:16,600 INFO MainThread:2090 [wandb_run.py:_redirect():2395] Redirects installed.
27
+ 2024-11-27 18:49:16,604 INFO MainThread:2090 [wandb_init.py:init():911] run started, returning control to user process
28
+ 2024-11-27 18:49:16,605 INFO MainThread:2090 [jupyter.py:save_ipynb():387] not saving jupyter notebook
29
+ 2024-11-27 18:49:16,605 INFO MainThread:2090 [wandb_init.py:_pause_backend():444] pausing backend
30
+ 2024-11-27 18:49:16,615 INFO MainThread:2090 [wandb_init.py:_resume_backend():449] resuming backend
31
+ 2024-11-27 18:49:16,617 INFO MainThread:2090 [jupyter.py:save_ipynb():387] not saving jupyter notebook
32
+ 2024-11-27 18:49:16,617 INFO MainThread:2090 [wandb_init.py:_pause_backend():444] pausing backend
33
+ 2024-11-27 18:49:16,623 INFO MainThread:2090 [wandb_init.py:_resume_backend():449] resuming backend
34
+ 2024-11-27 18:49:16,635 INFO MainThread:2090 [jupyter.py:save_ipynb():387] not saving jupyter notebook
35
+ 2024-11-27 18:49:16,635 INFO MainThread:2090 [wandb_init.py:_pause_backend():444] pausing backend
36
+ 2024-11-27 18:49:16,641 INFO MainThread:2090 [wandb_init.py:_resume_backend():449] resuming backend
37
+ 2024-11-27 18:49:17,995 INFO MainThread:2090 [jupyter.py:save_ipynb():387] not saving jupyter notebook
38
+ 2024-11-27 18:49:17,995 INFO MainThread:2090 [wandb_init.py:_pause_backend():444] pausing backend
39
+ 2024-11-27 18:49:18,259 INFO MainThread:2090 [wandb_init.py:_resume_backend():449] resuming backend
40
+ 2024-11-27 18:49:18,647 INFO MainThread:2090 [wandb_run.py:_config_callback():1387] config_cb None None {'use_timm_backbone': True, 'backbone_config': None, 'num_channels': 3, 'num_queries': 100, 'd_model': 256, 'encoder_ffn_dim': 2048, 'encoder_layers': 6, 'encoder_attention_heads': 8, 'decoder_ffn_dim': 2048, 'decoder_layers': 6, 'decoder_attention_heads': 8, 'dropout': 0.1, 'attention_dropout': 0.0, 'activation_dropout': 0.0, 'activation_function': 'relu', 'init_std': 0.02, 'init_xavier_std': 1.0, 'encoder_layerdrop': 0.0, 'decoder_layerdrop': 0.0, 'num_hidden_layers': 6, 'auxiliary_loss': False, 'position_embedding_type': 'sine', 'backbone': 'resnet50', 'use_pretrained_backbone': True, 'backbone_kwargs': {'output_stride': 16, 'out_indices': [1, 2, 3, 4], 'in_chans': 3}, 'dilation': True, 'class_cost': 1, 'bbox_cost': 5, 'giou_cost': 2, 'mask_loss_coefficient': 1, 'dice_loss_coefficient': 1, 'bbox_loss_coefficient': 5, 'giou_loss_coefficient': 2, 'eos_coefficient': 0.1, 'return_dict': True, 'output_hidden_states': False, 'output_attentions': False, 'torchscript': False, 'torch_dtype': None, 'use_bfloat16': False, 'tf_legacy_loss': False, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': True, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'architectures': ['DetrForObjectDetection'], 'finetuning_task': None, 'id2label': {0: 'object', 1: 'balloon'}, 'label2id': {'object': 0, 'balloon': 1}, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'task_specific_params': None, 'problem_type': None, '_name_or_path': 'facebook/detr-resnet-50-dc5', '_attn_implementation_autoset': True, 'transformers_version': '4.46.3', 'classifier_dropout': 0.0, 'max_position_embeddings': 1024, 'model_type': 'detr', 'scale_embedding': False, 'output_dir': '.', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.0001, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': 400, 'lr_scheduler_type': 'linear', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.0, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': './runs/Nov27_18-49-17_f5b68522d064', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 10, 'save_total_limit': 2, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': True, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': 10, 'dataloader_num_workers': 0, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': '.', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': False, 'hub_always_push': False, 'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'evaluation_strategy': 'steps', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': True, 'eval_on_start': False, 'use_liger_kernel': False, 'eval_use_gather_object': False, 'average_tokens_across_devices': False}
41
+ 2024-11-27 18:49:18,653 INFO MainThread:2090 [wandb_config.py:__setitem__():154] config set model/num_parameters = 41501895 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f507463aad0>>
42
+ 2024-11-27 18:49:18,653 INFO MainThread:2090 [wandb_run.py:_config_callback():1387] config_cb model/num_parameters 41501895 None
wandb/run-20241127_184914-lig8s4o3/run-lig8s4o3.wandb ADDED
File without changes