Upload folder using huggingface_hub

Files changed (4) hide show

config.json CHANGED Viewed

@@ -77,7 +77,6 @@
     "vocab_size": 128
   },
   "audio_ms_per_token": 40,
-  "audio_soft_tokens_per_image": 750,
   "audio_token_id": 258881,
   "boa_token_id": 256000,
   "boi_token_id": 255999,
@@ -92,7 +91,6 @@
     "attention_bias": false,
     "attention_dropout": 0.0,
     "attention_k_eq_v": false,
-    "attention_use_bidirectional": null,
     "attn_logit_softcapping": null,
     "bos_token_id": 2,
     "dtype": "bfloat16",
@@ -224,9 +222,7 @@
       }
     },
     "use_bidirectional_attention": "vision",
-    "use_clipped_linears": true,
-    "vocab_offset": 262144,
-    "vocab_size": 128
   },
   "vision_soft_tokens_per_image": 280
 }

     "vocab_size": 128
   },
   "audio_ms_per_token": 40,
   "audio_token_id": 258881,
   "boa_token_id": 256000,
   "boi_token_id": 255999,
     "attention_bias": false,
     "attention_dropout": 0.0,
     "attention_k_eq_v": false,
     "attn_logit_softcapping": null,
     "bos_token_id": 2,
     "dtype": "bfloat16",
       }
     },
     "use_bidirectional_attention": "vision",
+    "use_clipped_linears": true
   },
   "vision_soft_tokens_per_image": 280
 }

generation_config.json CHANGED Viewed

@@ -1,6 +1,5 @@
 {
   "bos_token_id": 2,
-  "cache_implementation": "hybrid",
   "do_sample": true,
   "eos_token_id": 1,
   "pad_token_id": 0,

 {
   "bos_token_id": 2,
   "do_sample": true,
   "eos_token_id": 1,
   "pad_token_id": 0,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6e908419f2891b4cddaff87506a21aa22fce730e9dac81ef1ae59d85d412d8f6
-size 10246627534

 version https://git-lfs.github.com/spec/v1
+oid sha256:e59bd7848f7cb681a779caa038283840a47d3766171ab75fa07a5ea9a45e6c56
+size 10246628830

processor_config.json CHANGED Viewed

@@ -5,8 +5,8 @@
     "dither": 0.0,
     "feature_extractor_type": "Gemma4AudioFeatureExtractor",
     "feature_size": 128,
-    "fft_length": 1024,
-    "fft_overdrive": true,
     "frame_length": 320,
     "hop_length": 160,
     "input_scale_factor": 1.0,

     "dither": 0.0,
     "feature_extractor_type": "Gemma4AudioFeatureExtractor",
     "feature_size": 128,
+    "fft_length": 512,
+    "fft_overdrive": false,
     "frame_length": 320,
     "hop_length": 160,
     "input_scale_factor": 1.0,