jgchaparro committed on
Commit
d3e57c3
·
verified ·
1 Parent(s): 1dff8d3

Upload model trained with Unsloth

Browse files

Upload model trained with Unsloth 2x faster

Files changed (2) hide show
  1. adapter_config.json +6 -14
  2. adapter_model.safetensors +2 -2
adapter_config.json CHANGED
@@ -3,11 +3,11 @@
3
  "alpha_pattern": {},
4
  "arrow_config": null,
5
  "auto_mapping": {
6
- "base_model_class": "DeepseekOCRForCausalLM",
7
- "parent_library": "transformers_modules.unsloth.DeepSeek-OCR.b03c14faaf5aa8421bfa15ef08cec5c628b10662.modeling_deepseekocr",
8
  "unsloth_fixed": true
9
  },
10
- "base_model_name_or_path": "unsloth/DeepSeek-OCR",
11
  "bias": "none",
12
  "corda_config": null,
13
  "ensure_weight_tying": false,
@@ -20,7 +20,7 @@
20
  "layers_pattern": null,
21
  "layers_to_transform": null,
22
  "loftq_config": {},
23
- "lora_alpha": 32,
24
  "lora_bias": false,
25
  "lora_dropout": 0,
26
  "megatron_config": null,
@@ -29,18 +29,10 @@
29
  "peft_type": "LORA",
30
  "peft_version": "0.18.0",
31
  "qalora_group_size": 16,
32
- "r": 32,
33
  "rank_pattern": {},
34
  "revision": null,
35
- "target_modules": [
36
- "gate_proj",
37
- "v_proj",
38
- "o_proj",
39
- "k_proj",
40
- "up_proj",
41
- "down_proj",
42
- "q_proj"
43
- ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
46
  "trainable_token_indices": null,
 
3
  "alpha_pattern": {},
4
  "arrow_config": null,
5
  "auto_mapping": {
6
+ "base_model_class": "Gemma3ForConditionalGeneration",
7
+ "parent_library": "transformers.models.gemma3.modeling_gemma3",
8
  "unsloth_fixed": true
9
  },
10
+ "base_model_name_or_path": "unsloth/gemma-3-4b-pt-unsloth-bnb-4bit",
11
  "bias": "none",
12
  "corda_config": null,
13
  "ensure_weight_tying": false,
 
20
  "layers_pattern": null,
21
  "layers_to_transform": null,
22
  "loftq_config": {},
23
+ "lora_alpha": 16,
24
  "lora_bias": false,
25
  "lora_dropout": 0,
26
  "megatron_config": null,
 
29
  "peft_type": "LORA",
30
  "peft_version": "0.18.0",
31
  "qalora_group_size": 16,
32
+ "r": 16,
33
  "rank_pattern": {},
34
  "revision": null,
35
+ "target_modules": "(?:.*?(?:vision|image|visual|patch|language|text).*?(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense).*?(?:k_proj|v_proj|q_proj|out_proj|fc1|fc2|o_proj|gate_proj|up_proj|down_proj).*?)|(?:\\bmodel\\.layers\\.[\\d]{1,}\\.(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense)\\.(?:(?:k_proj|v_proj|q_proj|out_proj|fc1|fc2|o_proj|gate_proj|up_proj|down_proj)))",
 
 
 
 
 
 
 
 
36
  "target_parameters": null,
37
  "task_type": "CAUSAL_LM",
38
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cdfb63ef9c4650633532d9449c9bb47b0b37d2f342e69ba2b82d36b29379fb8d
3
- size 620702632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:148bfd3575ed5534c567f5a056ca05661f58ae0f4c04d9a66b871f29e645df11
3
+ size 154116312