Upload model trained with Unsloth

Upload model trained with Unsloth 2x faster

Files changed (2) hide show

adapter_config.json CHANGED Viewed

@@ -3,11 +3,11 @@
   "alpha_pattern": {},
   "arrow_config": null,
   "auto_mapping": {
-    "base_model_class": "DeepseekOCRForCausalLM",
-    "parent_library": "transformers_modules.unsloth.DeepSeek-OCR.b03c14faaf5aa8421bfa15ef08cec5c628b10662.modeling_deepseekocr",
     "unsloth_fixed": true
   },
-  "base_model_name_or_path": "unsloth/DeepSeek-OCR",
   "bias": "none",
   "corda_config": null,
   "ensure_weight_tying": false,
@@ -20,7 +20,7 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 32,
   "lora_bias": false,
   "lora_dropout": 0,
   "megatron_config": null,
@@ -29,18 +29,10 @@
   "peft_type": "LORA",
   "peft_version": "0.18.0",
   "qalora_group_size": 16,
-  "r": 32,
   "rank_pattern": {},
   "revision": null,
-  "target_modules": [
-    "gate_proj",
-    "v_proj",
-    "o_proj",
-    "k_proj",
-    "up_proj",
-    "down_proj",
-    "q_proj"
-  ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

   "alpha_pattern": {},
   "arrow_config": null,
   "auto_mapping": {
+    "base_model_class": "Gemma3ForConditionalGeneration",
+    "parent_library": "transformers.models.gemma3.modeling_gemma3",
     "unsloth_fixed": true
   },
+  "base_model_name_or_path": "unsloth/gemma-3-4b-pt-unsloth-bnb-4bit",
   "bias": "none",
   "corda_config": null,
   "ensure_weight_tying": false,
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
+  "lora_alpha": 16,
   "lora_bias": false,
   "lora_dropout": 0,
   "megatron_config": null,
   "peft_type": "LORA",
   "peft_version": "0.18.0",
   "qalora_group_size": 16,
+  "r": 16,
   "rank_pattern": {},
   "revision": null,
+  "target_modules": "(?:.*?(?:vision|image|visual|patch|language|text).*?(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense).*?(?:k_proj|v_proj|q_proj|out_proj|fc1|fc2|o_proj|gate_proj|up_proj|down_proj).*?)|(?:\\bmodel\\.layers\\.[\\d]{1,}\\.(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense)\\.(?:(?:k_proj|v_proj|q_proj|out_proj|fc1|fc2|o_proj|gate_proj|up_proj|down_proj)))",
   "target_parameters": null,
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cdfb63ef9c4650633532d9449c9bb47b0b37d2f342e69ba2b82d36b29379fb8d
-size 620702632

 version https://git-lfs.github.com/spec/v1
+oid sha256:148bfd3575ed5534c567f5a056ca05661f58ae0f4c04d9a66b871f29e645df11
+size 154116312