Upload folder using huggingface_hub

Browse files

Files changed (7) hide show

README.md +8 -8
comparison_graph.png +0 -0
config.json +6 -3
generation_config.json +2 -1
model.safetensors +2 -2
tokenizer.json +2 -2
tokenizer_config.json +7 -217

README.md CHANGED Viewed

@@ -12,7 +12,7 @@ pipeline_tag: text-generation
 # Qwen3-0.6B-python-safe
-> 🎯 **PYTHON-optimized** | 📦 **Safe** pruning | ⚡ **1% weights pruned**
 This model is a **conservatively pruned** version of [Qwen/Qwen3-0.6B](https://huggingface.co/Qwen/Qwen3-0.6B), specialized for **PYTHON** tasks using activation-aware weight pruning (Wanda-style).
@@ -20,7 +20,7 @@ This model is a **conservatively pruned** version of [Qwen/Qwen3-0.6B](https://h
 - **Specialization**: Optimized for Python tasks
 - **Pruning Method**: Wanda-style (|W| × |activation|) importance scoring
-- **Size Reduction**: 1% weights pruned
 - **Use Case**: High accuracy retention, ideal for production use
 ## 📊 Performance Comparison
@@ -30,13 +30,13 @@ This model is a **conservatively pruned** version of [Qwen/Qwen3-0.6B](https://h
 | **Python** | 30.0% | 30.0% ⭐ | → |
 | Html | 0.0% | 0.0% | → |
 | Trivia | 90.0% | 90.0% | → |
-| Math | 96.7% | 93.3% | ↓ 3.3% |
 | Reasoning | 36.7% | 36.7% | → |
-| Medical | 83.3% | 86.7% | ↑ 3.3% |
-| Linux | 93.3% | 93.3% | → |
-| Writing | 53.3% | 56.7% | ↑ 3.3% |
-**Average**: 60.4% → 60.8% (+0.4%)
 **Python Retention**: 100.0% of original performance
@@ -64,7 +64,7 @@ print(tokenizer.decode(outputs[0], skip_special_tokens=True))
 | Specialization | Python |
 | Prune Mode | Safe |
 | Pruning Method | Activation-based weight pruning (Wanda) |
-| Weight Reduction | 1% weights pruned |
 ## 🔗 Related Models

 # Qwen3-0.6B-python-safe
+> 🎯 **PYTHON-optimized** | 📦 **Safe** pruning | ⚡ **2% weights pruned**
 This model is a **conservatively pruned** version of [Qwen/Qwen3-0.6B](https://huggingface.co/Qwen/Qwen3-0.6B), specialized for **PYTHON** tasks using activation-aware weight pruning (Wanda-style).
 - **Specialization**: Optimized for Python tasks
 - **Pruning Method**: Wanda-style (|W| × |activation|) importance scoring
+- **Size Reduction**: 2% weights pruned
 - **Use Case**: High accuracy retention, ideal for production use
 ## 📊 Performance Comparison
 | **Python** | 30.0% | 30.0% ⭐ | → |
 | Html | 0.0% | 0.0% | → |
 | Trivia | 90.0% | 90.0% | → |
+| Math | 96.7% | 96.7% | → |
 | Reasoning | 36.7% | 36.7% | → |
+| Medical | 83.3% | 83.3% | → |
+| Linux | 93.3% | 90.0% | ↓ 3.3% |
+| Writing | 53.3% | 53.3% | → |
+**Average**: 60.4% → 60.0% (-0.4%)
 **Python Retention**: 100.0% of original performance
 | Specialization | Python |
 | Prune Mode | Safe |
 | Pruning Method | Activation-based weight pruning (Wanda) |
+| Weight Reduction | 2% weights pruned |
 ## 🔗 Related Models

comparison_graph.png CHANGED Viewed

config.json CHANGED Viewed

@@ -48,12 +48,15 @@
   "num_attention_heads": 16,
   "num_hidden_layers": 28,
   "num_key_value_heads": 8,
   "rms_norm_eps": 1e-06,
-  "rope_scaling": null,
-  "rope_theta": 1000000,
   "sliding_window": null,
   "tie_word_embeddings": true,
-  "transformers_version": "4.57.6",
   "use_cache": true,
   "use_sliding_window": false,
   "vocab_size": 151936

   "num_attention_heads": 16,
   "num_hidden_layers": 28,
   "num_key_value_heads": 8,
+  "pad_token_id": null,
   "rms_norm_eps": 1e-06,
+  "rope_parameters": {
+    "rope_theta": 1000000,
+    "rope_type": "default"
+  },
   "sliding_window": null,
   "tie_word_embeddings": true,
+  "transformers_version": "5.0.0",
   "use_cache": true,
   "use_sliding_window": false,
   "vocab_size": 151936

generation_config.json CHANGED Viewed

@@ -1,9 +1,10 @@
 {
   "bos_token_id": 151643,
   "eos_token_id": [
     151645,
     151643
   ],
   "pad_token_id": 151643,
-  "transformers_version": "4.57.6"
 }

 {
   "bos_token_id": 151643,
+  "do_sample": false,
   "eos_token_id": [
     151645,
     151643
   ],
   "pad_token_id": 151643,
+  "transformers_version": "5.0.0"
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d4e986e264eec11cb280bcab9c4592f081d35918421e069483071c316a5b6b20
-size 1192134784

 version https://git-lfs.github.com/spec/v1
+oid sha256:4850d9e7783a1ad308c0a8eafcbc093a2666f5403f153835a9a8d5ad668eb2a9
+size 1503300016

tokenizer.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dab3ef598a088c1ffec65f944ad95060dd22f3de49a128a0e30dcd20364f22ef
-size 11422921

 version https://git-lfs.github.com/spec/v1
+oid sha256:fea4f89c198c65a418ebfd87d7480db83fe21f31c7f56cd2ecea1110b1dff53e
+size 11422917

tokenizer_config.json CHANGED Viewed

@@ -1,217 +1,11 @@
 {
-  "add_bos_token": false,
   "add_prefix_space": false,
-  "added_tokens_decoder": {
-    "151643": {
-      "content": "<|endoftext|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151644": {
-      "content": "<|im_start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151645": {
-      "content": "<|im_end|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151646": {
-      "content": "<|object_ref_start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151647": {
-      "content": "<|object_ref_end|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151648": {
-      "content": "<|box_start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151649": {
-      "content": "<|box_end|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151650": {
-      "content": "<|quad_start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151651": {
-      "content": "<|quad_end|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151652": {
-      "content": "<|vision_start|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151653": {
-      "content": "<|vision_end|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151654": {
-      "content": "<|vision_pad|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151655": {
-      "content": "<|image_pad|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151656": {
-      "content": "<|video_pad|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "151657": {
-      "content": "<tool_call>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151658": {
-      "content": "</tool_call>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151659": {
-      "content": "<|fim_prefix|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151660": {
-      "content": "<|fim_middle|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151661": {
-      "content": "<|fim_suffix|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151662": {
-      "content": "<|fim_pad|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151663": {
-      "content": "<|repo_name|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151664": {
-      "content": "<|file_sep|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151665": {
-      "content": "<tool_response>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151666": {
-      "content": "</tool_response>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151667": {
-      "content": "<think>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "151668": {
-      "content": "</think>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    }
-  },
-  "additional_special_tokens": [
     "<|im_start|>",
     "<|im_end|>",
     "<|object_ref_start|>",
@@ -226,11 +20,7 @@
     "<|image_pad|>",
     "<|video_pad|>"
   ],
-  "bos_token": null,
-  "clean_up_tokenization_spaces": false,
-  "eos_token": "<|im_end|>",
-  "errors": "replace",
-  "extra_special_tokens": {},
   "model_max_length": 131072,
   "pad_token": "<|endoftext|>",
   "split_special_tokens": false,

 {
   "add_prefix_space": false,
+  "backend": "tokenizers",
+  "bos_token": null,
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|im_end|>",
+  "errors": "replace",
+  "extra_special_tokens": [
     "<|im_start|>",
     "<|im_end|>",
     "<|object_ref_start|>",
     "<|image_pad|>",
     "<|video_pad|>"
   ],
+  "is_local": false,
   "model_max_length": 131072,
   "pad_token": "<|endoftext|>",
   "split_special_tokens": false,