07de90711906c8a0e5350b297b1288ccf59e2b2f602eeef2f7a7cd840c4ce73f
Browse files
- config.json +1 -1
- plots.png +0 -0
- smash_config.json +1 -1
config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "/tmp/
|
| 3 |
"architectures": [
|
| 4 |
"LlamaForCausalLM"
|
| 5 |
],
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "/tmp/tmpe70gy4hp",
|
| 3 |
"architectures": [
|
| 4 |
"LlamaForCausalLM"
|
| 5 |
],
|
plots.png
CHANGED
|
|
smash_config.json
CHANGED
|
@@ -8,7 +8,7 @@
|
|
| 8 |
"compilers": "None",
|
| 9 |
"task": "text_text_generation",
|
| 10 |
"device": "cuda",
|
| 11 |
-
"cache_dir": "/ceph/hdd/staff/charpent/.cache/
|
| 12 |
"batch_size": 1,
|
| 13 |
"model_name": "deepseek-ai/deepseek-coder-1.3b-instruct",
|
| 14 |
"pruning_ratio": 0.0,
|
|
|
|
| 8 |
"compilers": "None",
|
| 9 |
"task": "text_text_generation",
|
| 10 |
"device": "cuda",
|
| 11 |
+
"cache_dir": "/ceph/hdd/staff/charpent/.cache/modelswwxyp9hy",
|
| 12 |
"batch_size": 1,
|
| 13 |
"model_name": "deepseek-ai/deepseek-coder-1.3b-instruct",
|
| 14 |
"pruning_ratio": 0.0,
|