a23b28e87c78bf67e98c42e062c47e81605553c10ea3b54943fb1d265201b2b1
Browse files- config.json +1 -1
- plots.png +0 -0
- smash_config.json +1 -1
config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "/tmp/
|
| 3 |
"architectures": [
|
| 4 |
"LlamaForCausalLM"
|
| 5 |
],
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "/tmp/tmp5wtl9eyu",
|
| 3 |
"architectures": [
|
| 4 |
"LlamaForCausalLM"
|
| 5 |
],
|
plots.png
CHANGED
|
|
smash_config.json
CHANGED
|
@@ -8,7 +8,7 @@
|
|
| 8 |
"compilers": "None",
|
| 9 |
"task": "text_text_generation",
|
| 10 |
"device": "cuda",
|
| 11 |
-
"cache_dir": "/ceph/hdd/staff/charpent/.cache/
|
| 12 |
"batch_size": 1,
|
| 13 |
"model_name": "deepseek-ai/deepseek-coder-1.3b-base",
|
| 14 |
"pruning_ratio": 0.0,
|
|
|
|
| 8 |
"compilers": "None",
|
| 9 |
"task": "text_text_generation",
|
| 10 |
"device": "cuda",
|
| 11 |
+
"cache_dir": "/ceph/hdd/staff/charpent/.cache/models_mz80ni7",
|
| 12 |
"batch_size": 1,
|
| 13 |
"model_name": "deepseek-ai/deepseek-coder-1.3b-base",
|
| 14 |
"pruning_ratio": 0.0,
|