mlx-community
/

gemma-3n-E4B-it-4bit

@@ -8,8 +8,6 @@
         "output_hidden_states": false,
         "torchscript": false,
         "torch_dtype": "bfloat16",
-        "use_bfloat16": false,
-        "tf_legacy_loss": false,
         "pruned_heads": {},
         "tie_word_embeddings": true,
         "chunk_size_feed_forward": 0,
@@ -18,6 +16,25 @@
         "cross_attention_hidden_size": null,
         "add_cross_attention": false,
         "tie_encoder_decoder": false,
         "max_length": 20,
         "min_length": 0,
         "do_sample": false,
@@ -43,27 +60,10 @@
         "exponential_decay_length_penalty": null,
         "suppress_tokens": null,
         "begin_suppress_tokens": null,
-        "architectures": null,
-        "finetuning_task": null,
-        "id2label": {
-            "0": "LABEL_0",
-            "1": "LABEL_1"
-        },
-        "label2id": {
-            "LABEL_0": 0,
-            "LABEL_1": 1
-        },
-        "tokenizer_class": null,
-        "prefix": null,
-        "bos_token_id": null,
-        "pad_token_id": null,
-        "eos_token_id": null,
-        "sep_token_id": null,
-        "decoder_start_token_id": null,
-        "task_specific_params": null,
-        "problem_type": null,
         "_name_or_path": "",
         "model_type": "gemma3n_audio",
         "input_feat_size": 128,
         "hidden_size": 1536,
         "rms_norm_eps": 1e-06,
@@ -3940,8 +3940,6 @@
         "output_hidden_states": false,
         "torchscript": false,
         "torch_dtype": "bfloat16",
-        "use_bfloat16": false,
-        "tf_legacy_loss": false,
         "pruned_heads": {},
         "tie_word_embeddings": true,
         "chunk_size_feed_forward": 0,
@@ -3950,6 +3948,25 @@
         "cross_attention_hidden_size": null,
         "add_cross_attention": false,
         "tie_encoder_decoder": false,
         "max_length": 20,
         "min_length": 0,
         "do_sample": false,
@@ -3975,27 +3992,10 @@
         "exponential_decay_length_penalty": null,
         "suppress_tokens": null,
         "begin_suppress_tokens": null,
-        "architectures": null,
-        "finetuning_task": null,
-        "id2label": {
-            "0": "LABEL_0",
-            "1": "LABEL_1"
-        },
-        "label2id": {
-            "LABEL_0": 0,
-            "LABEL_1": 1
-        },
-        "tokenizer_class": null,
-        "prefix": null,
-        "bos_token_id": 2,
-        "pad_token_id": 0,
-        "eos_token_id": 1,
-        "sep_token_id": null,
-        "decoder_start_token_id": null,
-        "task_specific_params": null,
-        "problem_type": null,
         "_name_or_path": "",
         "model_type": "gemma3n_text",
         "vocab_size": 262400,
         "vocab_size_per_layer_input": 262144,
         "max_position_embeddings": 32768,
@@ -4142,7 +4142,7 @@
     "top_k": 50,
     "top_p": 1.0,
     "torchscript": false,
-    "transformers_version": "4.53.2",
     "typical_p": 1.0,
     "use_bfloat16": false,
     "vision_config": {
@@ -4150,8 +4150,6 @@
         "output_hidden_states": false,
         "torchscript": false,
         "torch_dtype": "bfloat16",
-        "use_bfloat16": false,
-        "tf_legacy_loss": false,
         "pruned_heads": {},
         "tie_word_embeddings": true,
         "chunk_size_feed_forward": 0,
@@ -4160,6 +4158,17 @@
         "cross_attention_hidden_size": null,
         "add_cross_attention": false,
         "tie_encoder_decoder": false,
         "max_length": 20,
         "min_length": 0,
         "do_sample": false,
@@ -4185,17 +4194,6 @@
         "exponential_decay_length_penalty": null,
         "suppress_tokens": null,
         "begin_suppress_tokens": null,
-        "architectures": null,
-        "finetuning_task": null,
-        "tokenizer_class": null,
-        "prefix": null,
-        "bos_token_id": null,
-        "pad_token_id": null,
-        "eos_token_id": null,
-        "sep_token_id": null,
-        "decoder_start_token_id": null,
-        "task_specific_params": null,
-        "problem_type": null,
         "_name_or_path": "",
         "label_names": [
             "LABEL_0",
@@ -4203,6 +4201,8 @@
         ],
         "model_type": "gemma3n_vision",
         "num_classes": 2,
         "initializer_range": 0.02,
         "do_pooling": false,
         "model_args": null,

         "output_hidden_states": false,
         "torchscript": false,
         "torch_dtype": "bfloat16",
         "pruned_heads": {},
         "tie_word_embeddings": true,
         "chunk_size_feed_forward": 0,
         "cross_attention_hidden_size": null,
         "add_cross_attention": false,
         "tie_encoder_decoder": false,
+        "architectures": null,
+        "finetuning_task": null,
+        "id2label": {
+            "0": "LABEL_0",
+            "1": "LABEL_1"
+        },
+        "label2id": {
+            "LABEL_0": 0,
+            "LABEL_1": 1
+        },
+        "task_specific_params": null,
+        "problem_type": null,
+        "tokenizer_class": null,
+        "prefix": null,
+        "bos_token_id": null,
+        "pad_token_id": null,
+        "eos_token_id": null,
+        "sep_token_id": null,
+        "decoder_start_token_id": null,
         "max_length": 20,
         "min_length": 0,
         "do_sample": false,
         "exponential_decay_length_penalty": null,
         "suppress_tokens": null,
         "begin_suppress_tokens": null,
         "_name_or_path": "",
         "model_type": "gemma3n_audio",
+        "tf_legacy_loss": false,
+        "use_bfloat16": false,
         "input_feat_size": 128,
         "hidden_size": 1536,
         "rms_norm_eps": 1e-06,
         "output_hidden_states": false,
         "torchscript": false,
         "torch_dtype": "bfloat16",
         "pruned_heads": {},
         "tie_word_embeddings": true,
         "chunk_size_feed_forward": 0,
         "cross_attention_hidden_size": null,
         "add_cross_attention": false,
         "tie_encoder_decoder": false,
+        "architectures": null,
+        "finetuning_task": null,
+        "id2label": {
+            "0": "LABEL_0",
+            "1": "LABEL_1"
+        },
+        "label2id": {
+            "LABEL_0": 0,
+            "LABEL_1": 1
+        },
+        "task_specific_params": null,
+        "problem_type": null,
+        "tokenizer_class": null,
+        "prefix": null,
+        "bos_token_id": 2,
+        "pad_token_id": 0,
+        "eos_token_id": 1,
+        "sep_token_id": null,
+        "decoder_start_token_id": null,
         "max_length": 20,
         "min_length": 0,
         "do_sample": false,
         "exponential_decay_length_penalty": null,
         "suppress_tokens": null,
         "begin_suppress_tokens": null,
         "_name_or_path": "",
         "model_type": "gemma3n_text",
+        "tf_legacy_loss": false,
+        "use_bfloat16": false,
         "vocab_size": 262400,
         "vocab_size_per_layer_input": 262144,
         "max_position_embeddings": 32768,
     "top_k": 50,
     "top_p": 1.0,
     "torchscript": false,
+    "transformers_version": "4.54.0.dev0",
     "typical_p": 1.0,
     "use_bfloat16": false,
     "vision_config": {
         "output_hidden_states": false,
         "torchscript": false,
         "torch_dtype": "bfloat16",
         "pruned_heads": {},
         "tie_word_embeddings": true,
         "chunk_size_feed_forward": 0,
         "cross_attention_hidden_size": null,
         "add_cross_attention": false,
         "tie_encoder_decoder": false,
+        "architectures": null,
+        "finetuning_task": null,
+        "task_specific_params": null,
+        "problem_type": null,
+        "tokenizer_class": null,
+        "prefix": null,
+        "bos_token_id": null,
+        "pad_token_id": null,
+        "eos_token_id": null,
+        "sep_token_id": null,
+        "decoder_start_token_id": null,
         "max_length": 20,
         "min_length": 0,
         "do_sample": false,
         "exponential_decay_length_penalty": null,
         "suppress_tokens": null,
         "begin_suppress_tokens": null,
         "_name_or_path": "",
         "label_names": [
             "LABEL_0",
         ],
         "model_type": "gemma3n_vision",
         "num_classes": 2,
+        "tf_legacy_loss": false,
+        "use_bfloat16": false,
         "initializer_range": 0.02,
         "do_pooling": false,
         "model_args": null,

model-00001-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:709e3fa64911e5a753395f0e18181471794f239baffd7dac455f4befcb326df1
-size 5364004839

 version https://git-lfs.github.com/spec/v1
+oid sha256:35481571d6ab17a60515c4378e3f3c171edb0e7fbe908e8db9d0f49f2838a544
+size 5364004911

model-00002-of-00002.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ffa02c7d3402c85b43798b966bb1a9da3b7ff1b2312909770a3321f3327d9ba9
 size 455053642

 version https://git-lfs.github.com/spec/v1
+oid sha256:62ae1980a669cca260a3a3a4a3efc4285d861b9be2df4c7da98c8ac61420d1f7
 size 455053642