rimashussain committed on
Commit
f194141
·
verified ·
1 Parent(s): 96e363a

Arsenal fine-tune round 1

Browse files
Files changed (2) hide show
  1. adapter_config.json +5 -21
  2. adapter_model.safetensors +2 -2
adapter_config.json CHANGED
@@ -1,18 +1,8 @@
1
  {
2
- "alora_invocation_tokens": null,
3
  "alpha_pattern": {},
4
- "arrow_config": null,
5
- "auto_mapping": {
6
- "base_model_class": "Gemma4ForConditionalGeneration",
7
- "parent_library": "transformers.models.gemma4.modeling_gemma4",
8
- "unsloth_fixed": true
9
- },
10
- "base_model_name_or_path": "google/gemma-4-E4B-it",
11
  "bias": "none",
12
- "corda_config": null,
13
- "ensure_weight_tying": false,
14
- "eva_config": null,
15
- "exclude_modules": null,
16
  "fan_in_fan_out": false,
17
  "inference_mode": true,
18
  "init_lora_weights": true,
@@ -21,22 +11,16 @@
21
  "layers_to_transform": null,
22
  "loftq_config": {},
23
  "lora_alpha": 16,
24
- "lora_bias": false,
25
- "lora_dropout": 0,
26
  "megatron_config": null,
27
  "megatron_core": "megatron.core",
28
  "modules_to_save": null,
29
  "peft_type": "LORA",
30
- "peft_version": "0.18.1",
31
- "qalora_group_size": 16,
32
- "r": 16,
33
  "rank_pattern": {},
34
  "revision": null,
35
- "target_modules": "(?:.*?(?:vision|image|visual|patch|language|text).*?(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense).*?(?:k_proj|q_proj|v_proj|o_proj|gate_proj|up_proj|down_proj|per_layer_input_gate|per_layer_projection|linear|embedding_projection|relative_k_proj).*?)|(?:\\bmodel\\.layers\\.[\\d]{1,}\\.(?:self_attn|attention|attn|mlp|feed_forward|ffn|dense)\\.(?:(?:k_proj|q_proj|v_proj|o_proj|gate_proj|up_proj|down_proj|per_layer_input_gate|per_layer_projection|linear|embedding_projection|relative_k_proj)))",
36
- "target_parameters": null,
37
  "task_type": "CAUSAL_LM",
38
- "trainable_token_indices": null,
39
  "use_dora": false,
40
- "use_qalora": false,
41
  "use_rslora": false
42
  }
 
1
  {
 
2
  "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "google/gemma-3-4b-it",
 
 
 
 
 
5
  "bias": "none",
 
 
 
 
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
8
  "init_lora_weights": true,
 
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
  "lora_alpha": 16,
14
+ "lora_dropout": 0.05,
 
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
17
  "modules_to_save": null,
18
  "peft_type": "LORA",
19
+ "r": 8,
 
 
20
  "rank_pattern": {},
21
  "revision": null,
22
+ "target_modules": "model\\.language_model\\.layers\\.\\d+\\.self_attn\\.(q_proj|v_proj|k_proj|o_proj)",
 
23
  "task_type": "CAUSAL_LM",
 
24
  "use_dora": false,
 
25
  "use_rslora": false
26
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0663609dd1947c4941f45705ed136968babe5c8462a9cfa9fdbf32b56f3716bf
3
- size 165012392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1c1e44955730b5ebfb1224295d68118ff0d2bcd4df7968334227774742d8131
3
+ size 17865944