okletsgg committed on
Commit
1d81654
·
verified ·
1 Parent(s): 2e6f723

Upload model_info.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. model_info.json +34 -0
model_info.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name": "MiniCPM4-0.5B-RKLLM",
3
+ "versions": [
4
+ {
5
+ "name": "GPTQ-32",
6
+ "file": "MiniCPM4-0.5B-QAT-Int4-GPTQ-format_w4a16_g32_RK3576.rkllm",
7
+ "size": "471MB",
8
+ "embedding_support": "perfect",
9
+ "description": "GPTQ量化版本,完美支持embedding输入"
10
+ },
11
+ {
12
+ "name": "Per-Channel",
13
+ "file": "Minicpm4-0.5B-QAT-Int4-perChannel_w4a16_RK3576.rkllm",
14
+ "size": "414MB",
15
+ "embedding_support": "token_only",
16
+ "description": "Per-Channel量化版本,仅推荐token输入"
17
+ },
18
+ {
19
+ "name": "FP16-Original",
20
+ "file": "MiniCPM4-0.5B-fp16-v1.2.2b1.rkllm",
21
+ "size": "996MB",
22
+ "embedding_support": "inconsistent",
23
+ "description": "原始未量化版本,embedding输入不一致"
24
+ }
25
+ ],
26
+ "test_results": {
27
+ "gptq_cosine_similarity": 1.0,
28
+ "gptq_top50_overlap": "100%",
29
+ "per_channel_issue": "generates_eos_tokens",
30
+ "original_cosine_similarity": 0.59
31
+ },
32
+ "hardware": "RK3576",
33
+ "date": "2024-01"
34
+ }