Upload folder using huggingface_hub
Browse files
- README.md +5 -19
- compress_config.json +1 -1
- delta_config.json +1 -1
- deltazip-compressed.safetensors +2 -2
- tokenizer.json +2 -2
README.md
CHANGED
|
@@ -26,14 +26,7 @@ This is a compressed model using [deltazip](https://github.com/eth-easl/deltazip)
|
|
| 26 |
#### Prompt:
|
| 27 |
|
| 28 |
```
|
| 29 |
-
|
| 30 |
-
|
| 31 |
-
Cutting Knowledge Date: December 2023
|
| 32 |
-
Today Date: 04 Dec 2024
|
| 33 |
-
|
| 34 |
-
<|eot_id|><|start_header_id|>user<|end_header_id|>
|
| 35 |
-
|
| 36 |
-
Who is Alan Turing?<|eot_id|>
|
| 37 |
```
|
| 38 |
|
| 39 |
#### Output:
|
|
@@ -42,22 +35,15 @@ Who is Alan Turing?<|eot_id|>
|
|
| 42 |
<|begin_of_text|><|start_header_id|>system<|end_header_id|>
|
| 43 |
|
| 44 |
Cutting Knowledge Date: December 2023
|
| 45 |
-
Today Date:
|
| 46 |
-
|
| 47 |
-
<|eot_id|><|start_header_id|>user<|end_header_id|>
|
| 48 |
-
|
| 49 |
-
<|begin_of_text|><|start_header_id|>system<|end_header_id|>
|
| 50 |
-
|
| 51 |
-
Cutting Knowledge Date: December 2023
|
| 52 |
-
Today Date: 04 Dec 2024
|
| 53 |
|
| 54 |
<|eot_id|><|start_header_id|>user<|end_header_id|>
|
| 55 |
|
| 56 |
-
Who is Alan Turing?<|eot_id|><|
|
| 57 |
|
| 58 |
-
Alan Turing (1912-1954) was a British mathematician, computer scientist, logician, and philosopher. He is widely
|
| 59 |
|
| 60 |
-
Turing was born in London, England, and
|
| 61 |
```
|
| 62 |
|
| 63 |
## Evaluation
|
|
|
|
| 26 |
#### Prompt:
|
| 27 |
|
| 28 |
```
|
| 29 |
+
[{'role': 'user', 'content': 'Who is Alan Turing?'}]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 30 |
```
|
| 31 |
|
| 32 |
#### Output:
|
|
|
|
| 35 |
<|begin_of_text|><|start_header_id|>system<|end_header_id|>
|
| 36 |
|
| 37 |
Cutting Knowledge Date: December 2023
|
| 38 |
+
Today Date: 05 Dec 2024
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 39 |
|
| 40 |
<|eot_id|><|start_header_id|>user<|end_header_id|>
|
| 41 |
|
| 42 |
+
Who is Alan Turing?<|eot_id|><|start_header_id|>assistant<|end_header_id|>
|
| 43 |
|
| 44 |
+
Alan Turing (1912-1954) was a British mathematician, computer scientist, logician, and philosopher. He is widely regarded as one of the most influential figures in the development of computer science, artificial intelligence, and cryptography.
|
| 45 |
|
| 46 |
+
Turing was born in London, England, and studied mathematics at King's College, Cambridge. During World War II, he worked at the Government Code and Cypher School (GC&CS) at
|
| 47 |
```
|
| 48 |
|
| 49 |
## Evaluation
|
compress_config.json
CHANGED
|
@@ -4,7 +4,7 @@
|
|
| 4 |
"sparsity": 0.5,
|
| 5 |
"damp_percent": 0.01,
|
| 6 |
"desc_act": false,
|
| 7 |
-
"sym":
|
| 8 |
"true_sequential": true,
|
| 9 |
"lossless": "none",
|
| 10 |
"prunen": 2,
|
|
|
|
| 4 |
"sparsity": 0.5,
|
| 5 |
"damp_percent": 0.01,
|
| 6 |
"desc_act": false,
|
| 7 |
+
"sym": true,
|
| 8 |
"true_sequential": true,
|
| 9 |
"lossless": "none",
|
| 10 |
"prunen": 2,
|
delta_config.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"base_model": "meta-llama/Llama-3.2-3B", "compress_config": {"bits": 4, "group_size": -1, "sparsity": 0.5, "damp_percent": 0.01, "desc_act": false, "sym":
|
|
|
|
| 1 |
+
{"base_model": "meta-llama/Llama-3.2-3B", "compress_config": {"bits": 4, "group_size": -1, "sparsity": 0.5, "damp_percent": 0.01, "desc_act": false, "sym": true, "true_sequential": true, "lossless": "none", "prunen": 2, "prunem": 4, "block_size": 128}, "target_modules": ["self_attn.k_proj", "self_attn.v_proj", "self_attn.q_proj", "self_attn.o_proj", "mlp.up_proj", "mlp.gate_proj", "mlp.down_proj"]}
|
deltazip-compressed.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:703a384792cf21021a4f6d089349b07b3eb5aa458443e47c1395e9486d9b6533
|
| 3 |
+
size 2634561712
|
tokenizer.json
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b
|
| 3 |
+
size 17209920
|