prithivMLmods committed 23 days ago

Commit

94b7583

verified ·

1 Parent(s): 5f4bcc6

Upload folder using huggingface_hub

Browse files

Files changed (36) hide show

checkpoint-1876/config.json +70 -0
checkpoint-1876/model.safetensors +3 -0
checkpoint-1876/optimizer.pt +3 -0
checkpoint-1876/preprocessor_config.json +29 -0
checkpoint-1876/rng_state.pth +3 -0
checkpoint-1876/scheduler.pt +3 -0
checkpoint-1876/trainer_state.json +75 -0
checkpoint-1876/training_args.bin +3 -0
checkpoint-2814/config.json +70 -0
checkpoint-2814/model.safetensors +3 -0
checkpoint-2814/optimizer.pt +3 -0
checkpoint-2814/preprocessor_config.json +29 -0
checkpoint-2814/rng_state.pth +3 -0
checkpoint-2814/scheduler.pt +3 -0
checkpoint-2814/trainer_state.json +99 -0
checkpoint-2814/training_args.bin +3 -0
checkpoint-3752/config.json +70 -0
checkpoint-3752/model.safetensors +3 -0
checkpoint-3752/optimizer.pt +3 -0
checkpoint-3752/preprocessor_config.json +29 -0
checkpoint-3752/rng_state.pth +3 -0
checkpoint-3752/scheduler.pt +3 -0
checkpoint-3752/trainer_state.json +123 -0
checkpoint-3752/training_args.bin +3 -0
checkpoint-938/config.json +70 -0
checkpoint-938/model.safetensors +3 -0
checkpoint-938/optimizer.pt +3 -0
checkpoint-938/preprocessor_config.json +29 -0
checkpoint-938/rng_state.pth +3 -0
checkpoint-938/scheduler.pt +3 -0
checkpoint-938/trainer_state.json +51 -0
checkpoint-938/training_args.bin +3 -0
config.json +70 -0
model.safetensors +3 -0
preprocessor_config.json +29 -0
training_args.bin +3 -0

checkpoint-1876/config.json ADDED Viewed

	@@ -0,0 +1,70 @@

+{
+  "architectures": [
+    "MetaClip2ForImageClassification"
+  ],
+  "dtype": "float32",
+  "id2label": {
+    "0": "airplane",
+    "1": "automobile",
+    "2": "bird",
+    "3": "cat",
+    "4": "deer",
+    "5": "dog",
+    "6": "frog",
+    "7": "horse",
+    "8": "ship",
+    "9": "truck"
+  },
+  "initializer_factor": 1.0,
+  "label2id": {
+    "airplane": 0,
+    "automobile": 1,
+    "bird": 2,
+    "cat": 3,
+    "deer": 4,
+    "dog": 5,
+    "frog": 6,
+    "horse": 7,
+    "ship": 8,
+    "truck": 9
+  },
+  "logit_scale_init_value": 2.6592,
+  "model_type": "metaclip_2",
+  "problem_type": "single_label_classification",
+  "projection_dim": 384,
+  "text_config": {
+    "attention_dropout": 0.0,
+    "dtype": "float32",
+    "eos_token_id": 2,
+    "hidden_act": "gelu",
+    "hidden_size": 384,
+    "initializer_factor": 1.0,
+    "initializer_range": 0.02,
+    "intermediate_size": 1536,
+    "layer_norm_eps": 1e-05,
+    "max_position_embeddings": 77,
+    "model_type": "metaclip_2_text_model",
+    "num_attention_heads": 6,
+    "num_hidden_layers": 12,
+    "projection_dim": 384,
+    "vocab_size": 901629
+  },
+  "transformers_version": "4.57.1",
+  "vision_config": {
+    "attention_dropout": 0.0,
+    "dtype": "float32",
+    "hidden_act": "gelu",
+    "hidden_size": 384,
+    "image_size": 224,
+    "initializer_factor": 1.0,
+    "initializer_range": 0.02,
+    "intermediate_size": 1536,
+    "layer_norm_eps": 1e-05,
+    "model_type": "metaclip_2_vision_model",
+    "num_attention_heads": 6,
+    "num_channels": 3,
+    "num_hidden_layers": 12,
+    "patch_size": 16,
+    "projection_dim": 384
+  }
+}

checkpoint-1876/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:06b29c5dd252f58b51133ed5893e0ce3794acf8ca2892fbcdb63d27d01824aa9
+size 86703248

checkpoint-1876/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2b73e8d9c5816fbb85ade28f395aa076ca26cf79d703e45097e7364d569f7d6c
+size 173522699

checkpoint-1876/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+  "crop_size": {
+    "height": 224,
+    "width": 224
+  },
+  "do_center_crop": true,
+  "do_convert_rgb": true,
+  "do_normalize": true,
+  "do_rescale": true,
+  "do_resize": true,
+  "image_mean": [
+    0.48145466,
+    0.4578275,
+    0.40821073
+  ],
+  "image_processor_type": "CLIPImageProcessor",
+  "image_std": [
+    0.26862954,
+    0.26130258,
+    0.27577711
+  ],
+  "processor_class": "CLIPProcessor",
+  "resample": 3,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 224,
+    "width": 224
+  }
+}

checkpoint-1876/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ac3be64a16bd10f2df355cd871b61f0d0e89cc9247ee2c99aa3286c961b5850f
+size 14645

checkpoint-1876/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:821339f9e61aa962297cc39e7f2385be146465c890ae7b9814d27262ff2e33b9
+size 1465

checkpoint-1876/trainer_state.json ADDED Viewed

	@@ -0,0 +1,75 @@

+{
+  "best_global_step": 1876,
+  "best_metric": 0.15963459014892578,
+  "best_model_checkpoint": "metaclip-2-image-classification/checkpoint-1876",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 1876,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.5330490405117271,
+      "grad_norm": 104.10272979736328,
+      "learning_rate": 1.7574284170718533e-05,
+      "loss": 0.8655,
+      "step": 500
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.92635,
+      "eval_loss": 0.2205629199743271,
+      "eval_model_preparation_time": 0.0039,
+      "eval_runtime": 90.292,
+      "eval_samples_per_second": 221.503,
+      "eval_steps_per_second": 27.688,
+      "step": 938
+    },
+    {
+      "epoch": 1.0660980810234542,
+      "grad_norm": 53.17558670043945,
+      "learning_rate": 1.4873041599135603e-05,
+      "loss": 0.4234,
+      "step": 1000
+    },
+    {
+      "epoch": 1.5991471215351813,
+      "grad_norm": 17.705827713012695,
+      "learning_rate": 1.2171799027552675e-05,
+      "loss": 0.3154,
+      "step": 1500
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.9459,
+      "eval_loss": 0.15963459014892578,
+      "eval_model_preparation_time": 0.0039,
+      "eval_runtime": 87.0564,
+      "eval_samples_per_second": 229.736,
+      "eval_steps_per_second": 28.717,
+      "step": 1876
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 3752,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.17019413504e+18,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-1876/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49a90bc66716cb082ec5c00af9d059cdce153b87ee7290bee045c716ff787c4e
+size 5777

checkpoint-2814/config.json ADDED Viewed

	@@ -0,0 +1,70 @@

+{
+  "architectures": [
+    "MetaClip2ForImageClassification"
+  ],
+  "dtype": "float32",
+  "id2label": {
+    "0": "airplane",
+    "1": "automobile",
+    "2": "bird",
+    "3": "cat",
+    "4": "deer",
+    "5": "dog",
+    "6": "frog",
+    "7": "horse",
+    "8": "ship",
+    "9": "truck"
+  },
+  "initializer_factor": 1.0,
+  "label2id": {
+    "airplane": 0,
+    "automobile": 1,
+    "bird": 2,
+    "cat": 3,
+    "deer": 4,
+    "dog": 5,
+    "frog": 6,
+    "horse": 7,
+    "ship": 8,
+    "truck": 9
+  },
+  "logit_scale_init_value": 2.6592,
+  "model_type": "metaclip_2",
+  "problem_type": "single_label_classification",
+  "projection_dim": 384,
+  "text_config": {
+    "attention_dropout": 0.0,
+    "dtype": "float32",
+    "eos_token_id": 2,
+    "hidden_act": "gelu",
+    "hidden_size": 384,
+    "initializer_factor": 1.0,
+    "initializer_range": 0.02,
+    "intermediate_size": 1536,
+    "layer_norm_eps": 1e-05,
+    "max_position_embeddings": 77,
+    "model_type": "metaclip_2_text_model",
+    "num_attention_heads": 6,
+    "num_hidden_layers": 12,
+    "projection_dim": 384,
+    "vocab_size": 901629
+  },
+  "transformers_version": "4.57.1",
+  "vision_config": {
+    "attention_dropout": 0.0,
+    "dtype": "float32",
+    "hidden_act": "gelu",
+    "hidden_size": 384,
+    "image_size": 224,
+    "initializer_factor": 1.0,
+    "initializer_range": 0.02,
+    "intermediate_size": 1536,
+    "layer_norm_eps": 1e-05,
+    "model_type": "metaclip_2_vision_model",
+    "num_attention_heads": 6,
+    "num_channels": 3,
+    "num_hidden_layers": 12,
+    "patch_size": 16,
+    "projection_dim": 384
+  }
+}

checkpoint-2814/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6733ace664b06b6495f14143722f5303503b062297a2906427fbcb2e35795579
+size 86703248

checkpoint-2814/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c569dbc843448df31a15a4d0df29d70fd7c9b18fda6bc5272dbbfa1a2b3027e5
+size 173522699

checkpoint-2814/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+  "crop_size": {
+    "height": 224,
+    "width": 224
+  },
+  "do_center_crop": true,
+  "do_convert_rgb": true,
+  "do_normalize": true,
+  "do_rescale": true,
+  "do_resize": true,
+  "image_mean": [
+    0.48145466,
+    0.4578275,
+    0.40821073
+  ],
+  "image_processor_type": "CLIPImageProcessor",
+  "image_std": [
+    0.26862954,
+    0.26130258,
+    0.27577711
+  ],
+  "processor_class": "CLIPProcessor",
+  "resample": 3,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 224,
+    "width": 224
+  }
+}

checkpoint-2814/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a29ae404595fc10a4b5a1063aa0986a935eb92411ef6f000cf138daa8193145e
+size 14645

checkpoint-2814/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fe60dc1e32dfc7b25fd9e07949a92d68be512c8d17eae53c27689946c0114383
+size 1465

checkpoint-2814/trainer_state.json ADDED Viewed

	@@ -0,0 +1,99 @@

+{
+  "best_global_step": 2814,
+  "best_metric": 0.1238662451505661,
+  "best_model_checkpoint": "metaclip-2-image-classification/checkpoint-2814",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 2814,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.5330490405117271,
+      "grad_norm": 104.10272979736328,
+      "learning_rate": 1.7574284170718533e-05,
+      "loss": 0.8655,
+      "step": 500
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.92635,
+      "eval_loss": 0.2205629199743271,
+      "eval_model_preparation_time": 0.0039,
+      "eval_runtime": 90.292,
+      "eval_samples_per_second": 221.503,
+      "eval_steps_per_second": 27.688,
+      "step": 938
+    },
+    {
+      "epoch": 1.0660980810234542,
+      "grad_norm": 53.17558670043945,
+      "learning_rate": 1.4873041599135603e-05,
+      "loss": 0.4234,
+      "step": 1000
+    },
+    {
+      "epoch": 1.5991471215351813,
+      "grad_norm": 17.705827713012695,
+      "learning_rate": 1.2171799027552675e-05,
+      "loss": 0.3154,
+      "step": 1500
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.9459,
+      "eval_loss": 0.15963459014892578,
+      "eval_model_preparation_time": 0.0039,
+      "eval_runtime": 87.0564,
+      "eval_samples_per_second": 229.736,
+      "eval_steps_per_second": 28.717,
+      "step": 1876
+    },
+    {
+      "epoch": 2.1321961620469083,
+      "grad_norm": 21.37250518798828,
+      "learning_rate": 9.470556455969747e-06,
+      "loss": 0.2481,
+      "step": 2000
+    },
+    {
+      "epoch": 2.6652452025586353,
+      "grad_norm": 32.63026809692383,
+      "learning_rate": 6.769313884386819e-06,
+      "loss": 0.2002,
+      "step": 2500
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.9582,
+      "eval_loss": 0.1238662451505661,
+      "eval_model_preparation_time": 0.0039,
+      "eval_runtime": 92.3095,
+      "eval_samples_per_second": 216.662,
+      "eval_steps_per_second": 27.083,
+      "step": 2814
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 3752,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.75529120256e+18,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-2814/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49a90bc66716cb082ec5c00af9d059cdce153b87ee7290bee045c716ff787c4e
+size 5777

checkpoint-3752/config.json ADDED Viewed

	@@ -0,0 +1,70 @@

+{
+  "architectures": [
+    "MetaClip2ForImageClassification"
+  ],
+  "dtype": "float32",
+  "id2label": {
+    "0": "airplane",
+    "1": "automobile",
+    "2": "bird",
+    "3": "cat",
+    "4": "deer",
+    "5": "dog",
+    "6": "frog",
+    "7": "horse",
+    "8": "ship",
+    "9": "truck"
+  },
+  "initializer_factor": 1.0,
+  "label2id": {
+    "airplane": 0,
+    "automobile": 1,
+    "bird": 2,
+    "cat": 3,
+    "deer": 4,
+    "dog": 5,
+    "frog": 6,
+    "horse": 7,
+    "ship": 8,
+    "truck": 9
+  },
+  "logit_scale_init_value": 2.6592,
+  "model_type": "metaclip_2",
+  "problem_type": "single_label_classification",
+  "projection_dim": 384,
+  "text_config": {
+    "attention_dropout": 0.0,
+    "dtype": "float32",
+    "eos_token_id": 2,
+    "hidden_act": "gelu",
+    "hidden_size": 384,
+    "initializer_factor": 1.0,
+    "initializer_range": 0.02,
+    "intermediate_size": 1536,
+    "layer_norm_eps": 1e-05,
+    "max_position_embeddings": 77,
+    "model_type": "metaclip_2_text_model",
+    "num_attention_heads": 6,
+    "num_hidden_layers": 12,
+    "projection_dim": 384,
+    "vocab_size": 901629
+  },
+  "transformers_version": "4.57.1",
+  "vision_config": {
+    "attention_dropout": 0.0,
+    "dtype": "float32",
+    "hidden_act": "gelu",
+    "hidden_size": 384,
+    "image_size": 224,
+    "initializer_factor": 1.0,
+    "initializer_range": 0.02,
+    "intermediate_size": 1536,
+    "layer_norm_eps": 1e-05,
+    "model_type": "metaclip_2_vision_model",
+    "num_attention_heads": 6,
+    "num_channels": 3,
+    "num_hidden_layers": 12,
+    "patch_size": 16,
+    "projection_dim": 384
+  }
+}

checkpoint-3752/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4d7590d179c1aad8be76d019c64b7308bc08954b64eebed7398a2907829697dd
+size 86703248

checkpoint-3752/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af42edc2144b4e24fca72977978dd6e390ea064412f9ecef8125eb94d23c9955
+size 173522699

checkpoint-3752/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+  "crop_size": {
+    "height": 224,
+    "width": 224
+  },
+  "do_center_crop": true,
+  "do_convert_rgb": true,
+  "do_normalize": true,
+  "do_rescale": true,
+  "do_resize": true,
+  "image_mean": [
+    0.48145466,
+    0.4578275,
+    0.40821073
+  ],
+  "image_processor_type": "CLIPImageProcessor",
+  "image_std": [
+    0.26862954,
+    0.26130258,
+    0.27577711
+  ],
+  "processor_class": "CLIPProcessor",
+  "resample": 3,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 224,
+    "width": 224
+  }
+}

checkpoint-3752/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:483efe6d84d7c8cbfde1761fe938811764b708d5d65656ea49f25587593bbe02
+size 14645

checkpoint-3752/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba38110e0f7eb61e76afd1da99c98c0105de9e1d2f7c221704071b570a151b3c
+size 1465

checkpoint-3752/trainer_state.json ADDED Viewed

	@@ -0,0 +1,123 @@

+{
+  "best_global_step": 3752,
+  "best_metric": 0.10899118334054947,
+  "best_model_checkpoint": "metaclip-2-image-classification/checkpoint-3752",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 3752,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.5330490405117271,
+      "grad_norm": 104.10272979736328,
+      "learning_rate": 1.7574284170718533e-05,
+      "loss": 0.8655,
+      "step": 500
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.92635,
+      "eval_loss": 0.2205629199743271,
+      "eval_model_preparation_time": 0.0039,
+      "eval_runtime": 90.292,
+      "eval_samples_per_second": 221.503,
+      "eval_steps_per_second": 27.688,
+      "step": 938
+    },
+    {
+      "epoch": 1.0660980810234542,
+      "grad_norm": 53.17558670043945,
+      "learning_rate": 1.4873041599135603e-05,
+      "loss": 0.4234,
+      "step": 1000
+    },
+    {
+      "epoch": 1.5991471215351813,
+      "grad_norm": 17.705827713012695,
+      "learning_rate": 1.2171799027552675e-05,
+      "loss": 0.3154,
+      "step": 1500
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.9459,
+      "eval_loss": 0.15963459014892578,
+      "eval_model_preparation_time": 0.0039,
+      "eval_runtime": 87.0564,
+      "eval_samples_per_second": 229.736,
+      "eval_steps_per_second": 28.717,
+      "step": 1876
+    },
+    {
+      "epoch": 2.1321961620469083,
+      "grad_norm": 21.37250518798828,
+      "learning_rate": 9.470556455969747e-06,
+      "loss": 0.2481,
+      "step": 2000
+    },
+    {
+      "epoch": 2.6652452025586353,
+      "grad_norm": 32.63026809692383,
+      "learning_rate": 6.769313884386819e-06,
+      "loss": 0.2002,
+      "step": 2500
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.9582,
+      "eval_loss": 0.1238662451505661,
+      "eval_model_preparation_time": 0.0039,
+      "eval_runtime": 92.3095,
+      "eval_samples_per_second": 216.662,
+      "eval_steps_per_second": 27.083,
+      "step": 2814
+    },
+    {
+      "epoch": 3.1982942430703627,
+      "grad_norm": 37.74256896972656,
+      "learning_rate": 4.06807131280389e-06,
+      "loss": 0.1637,
+      "step": 3000
+    },
+    {
+      "epoch": 3.7313432835820897,
+      "grad_norm": 6.652950763702393,
+      "learning_rate": 1.3668287412209618e-06,
+      "loss": 0.1253,
+      "step": 3500
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.96315,
+      "eval_loss": 0.10899118334054947,
+      "eval_model_preparation_time": 0.0039,
+      "eval_runtime": 87.3412,
+      "eval_samples_per_second": 228.987,
+      "eval_steps_per_second": 28.623,
+      "step": 3752
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 3752,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.34038827008e+18,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-3752/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49a90bc66716cb082ec5c00af9d059cdce153b87ee7290bee045c716ff787c4e
+size 5777

checkpoint-938/config.json ADDED Viewed

	@@ -0,0 +1,70 @@

+{
+  "architectures": [
+    "MetaClip2ForImageClassification"
+  ],
+  "dtype": "float32",
+  "id2label": {
+    "0": "airplane",
+    "1": "automobile",
+    "2": "bird",
+    "3": "cat",
+    "4": "deer",
+    "5": "dog",
+    "6": "frog",
+    "7": "horse",
+    "8": "ship",
+    "9": "truck"
+  },
+  "initializer_factor": 1.0,
+  "label2id": {
+    "airplane": 0,
+    "automobile": 1,
+    "bird": 2,
+    "cat": 3,
+    "deer": 4,
+    "dog": 5,
+    "frog": 6,
+    "horse": 7,
+    "ship": 8,
+    "truck": 9
+  },
+  "logit_scale_init_value": 2.6592,
+  "model_type": "metaclip_2",
+  "problem_type": "single_label_classification",
+  "projection_dim": 384,
+  "text_config": {
+    "attention_dropout": 0.0,
+    "dtype": "float32",
+    "eos_token_id": 2,
+    "hidden_act": "gelu",
+    "hidden_size": 384,
+    "initializer_factor": 1.0,
+    "initializer_range": 0.02,
+    "intermediate_size": 1536,
+    "layer_norm_eps": 1e-05,
+    "max_position_embeddings": 77,
+    "model_type": "metaclip_2_text_model",
+    "num_attention_heads": 6,
+    "num_hidden_layers": 12,
+    "projection_dim": 384,
+    "vocab_size": 901629
+  },
+  "transformers_version": "4.57.1",
+  "vision_config": {
+    "attention_dropout": 0.0,
+    "dtype": "float32",
+    "hidden_act": "gelu",
+    "hidden_size": 384,
+    "image_size": 224,
+    "initializer_factor": 1.0,
+    "initializer_range": 0.02,
+    "intermediate_size": 1536,
+    "layer_norm_eps": 1e-05,
+    "model_type": "metaclip_2_vision_model",
+    "num_attention_heads": 6,
+    "num_channels": 3,
+    "num_hidden_layers": 12,
+    "patch_size": 16,
+    "projection_dim": 384
+  }
+}

checkpoint-938/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0295970f5c5254383eea7f2873f3d585654e1367b2fd6b267f29ed9f9b3f26c4
+size 86703248

checkpoint-938/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:08e83a46af7737bff566b2f7f8b4fd87001b4bea72c17045891ca059b70fc464
+size 173522699

checkpoint-938/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+  "crop_size": {
+    "height": 224,
+    "width": 224
+  },
+  "do_center_crop": true,
+  "do_convert_rgb": true,
+  "do_normalize": true,
+  "do_rescale": true,
+  "do_resize": true,
+  "image_mean": [
+    0.48145466,
+    0.4578275,
+    0.40821073
+  ],
+  "image_processor_type": "CLIPImageProcessor",
+  "image_std": [
+    0.26862954,
+    0.26130258,
+    0.27577711
+  ],
+  "processor_class": "CLIPProcessor",
+  "resample": 3,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 224,
+    "width": 224
+  }
+}

checkpoint-938/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:081c357ef46dc87b932a2d21b2bd7241e2c976740daddae5a5457a7579ee9392
+size 14645

checkpoint-938/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f3ff0afff6239fce33f43c7b9ade60dd4c0cca24a3033a0c5718c09cb7abd681
+size 1465

checkpoint-938/trainer_state.json ADDED Viewed

	@@ -0,0 +1,51 @@

+{
+  "best_global_step": 938,
+  "best_metric": 0.2205629199743271,
+  "best_model_checkpoint": "metaclip-2-image-classification/checkpoint-938",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 938,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.5330490405117271,
+      "grad_norm": 104.10272979736328,
+      "learning_rate": 1.7574284170718533e-05,
+      "loss": 0.8655,
+      "step": 500
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.92635,
+      "eval_loss": 0.2205629199743271,
+      "eval_model_preparation_time": 0.0039,
+      "eval_runtime": 90.292,
+      "eval_samples_per_second": 221.503,
+      "eval_steps_per_second": 27.688,
+      "step": 938
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 3752,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5.8509706752e+17,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-938/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49a90bc66716cb082ec5c00af9d059cdce153b87ee7290bee045c716ff787c4e
+size 5777

config.json ADDED Viewed

	@@ -0,0 +1,70 @@

+{
+  "architectures": [
+    "MetaClip2ForImageClassification"
+  ],
+  "dtype": "float32",
+  "id2label": {
+    "0": "airplane",
+    "1": "automobile",
+    "2": "bird",
+    "3": "cat",
+    "4": "deer",
+    "5": "dog",
+    "6": "frog",
+    "7": "horse",
+    "8": "ship",
+    "9": "truck"
+  },
+  "initializer_factor": 1.0,
+  "label2id": {
+    "airplane": 0,
+    "automobile": 1,
+    "bird": 2,
+    "cat": 3,
+    "deer": 4,
+    "dog": 5,
+    "frog": 6,
+    "horse": 7,
+    "ship": 8,
+    "truck": 9
+  },
+  "logit_scale_init_value": 2.6592,
+  "model_type": "metaclip_2",
+  "problem_type": "single_label_classification",
+  "projection_dim": 384,
+  "text_config": {
+    "attention_dropout": 0.0,
+    "dtype": "float32",
+    "eos_token_id": 2,
+    "hidden_act": "gelu",
+    "hidden_size": 384,
+    "initializer_factor": 1.0,
+    "initializer_range": 0.02,
+    "intermediate_size": 1536,
+    "layer_norm_eps": 1e-05,
+    "max_position_embeddings": 77,
+    "model_type": "metaclip_2_text_model",
+    "num_attention_heads": 6,
+    "num_hidden_layers": 12,
+    "projection_dim": 384,
+    "vocab_size": 901629
+  },
+  "transformers_version": "4.57.1",
+  "vision_config": {
+    "attention_dropout": 0.0,
+    "dtype": "float32",
+    "hidden_act": "gelu",
+    "hidden_size": 384,
+    "image_size": 224,
+    "initializer_factor": 1.0,
+    "initializer_range": 0.02,
+    "intermediate_size": 1536,
+    "layer_norm_eps": 1e-05,
+    "model_type": "metaclip_2_vision_model",
+    "num_attention_heads": 6,
+    "num_channels": 3,
+    "num_hidden_layers": 12,
+    "patch_size": 16,
+    "projection_dim": 384
+  }
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4d7590d179c1aad8be76d019c64b7308bc08954b64eebed7398a2907829697dd
+size 86703248

preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+  "crop_size": {
+    "height": 224,
+    "width": 224
+  },
+  "do_center_crop": true,
+  "do_convert_rgb": true,
+  "do_normalize": true,
+  "do_rescale": true,
+  "do_resize": true,
+  "image_mean": [
+    0.48145466,
+    0.4578275,
+    0.40821073
+  ],
+  "image_processor_type": "CLIPImageProcessor",
+  "image_std": [
+    0.26862954,
+    0.26130258,
+    0.27577711
+  ],
+  "processor_class": "CLIPProcessor",
+  "resample": 3,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 224,
+    "width": 224
+  }
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49a90bc66716cb082ec5c00af9d059cdce153b87ee7290bee045c716ff787c4e
+size 5777