Ali Safaya committed on
Commit
c396b6b
·
1 Parent(s): 9251705

upgrade neurocache weights

Browse files
neurocache_adapter/adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": null,
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": false,
@@ -27,8 +27,12 @@
27
  "rank_pattern": {},
28
  "revision": null,
29
  "target_modules": [
30
- "fc2",
31
- "fc1"
 
 
 
 
32
  ],
33
  "task_type": "CAUSAL_LM",
34
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "microsoft/phi-1_5",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": false,
 
27
  "rank_pattern": {},
28
  "revision": null,
29
  "target_modules": [
30
+ "o_proj",
31
+ "dense",
32
+ "fc1",
33
+ "v_proj",
34
+ "q_proj",
35
+ "fc2"
36
  ],
37
  "task_type": "CAUSAL_LM",
38
  "use_dora": false,
neurocache_config.json CHANGED
@@ -9,10 +9,10 @@
9
  ],
10
  "auto_mapping": null,
11
  "base_model_name_or_path": "microsoft/phi-1_5",
12
- "cache_dtype": "bfloat16",
13
- "cache_size": 524288,
14
  "cache_type": "FIFO",
15
- "compression_factor": 4,
16
  "context_size": 2,
17
  "global_cache": true,
18
  "inference_mode": true,
@@ -23,5 +23,5 @@
23
  },
24
  "similarity_fn": "l2",
25
  "task_type": "CAUSAL_LM",
26
- "topk": 16
27
- }
 
9
  ],
10
  "auto_mapping": null,
11
  "base_model_name_or_path": "microsoft/phi-1_5",
12
+ "cache_dtype": "float16",
13
+ "cache_size": 262144,
14
  "cache_type": "FIFO",
15
+ "compression_factor": 8,
16
  "context_size": 2,
17
  "global_cache": true,
18
  "inference_mode": true,
 
23
  },
24
  "similarity_fn": "l2",
25
  "task_type": "CAUSAL_LM",
26
+ "topk": 8
27
+ }
neurocache_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c08bbc22b8e9b4e668cf7c5de2273afcd65c1bc54cd5173d15eb2cf82024316
3
- size 271603948
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0fd68f49caff8bd0d959814adaa7969184d1dfdf4bd1a1e9d7e88aa04fca9dc
3
+ size 429031630