Upload folder using huggingface_hub

Files changed (10) hide show

layer_2/k_128/trainer_0/ae.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:606bb3fd1f5583f4dda6a2b605a6e463837e7f29d2349aec1b23023f5fc38da8
+size 118091993

layer_2/k_128/trainer_0/config.json ADDED Viewed

+{
+    "trainer": {
+        "trainer_class": "TopKTrainer",
+        "dict_class": "AutoEncoderTopK",
+        "lr": 1e-05,
+        "steps": 10000,
+        "auxk_alpha": 0.03125,
+        "warmup_steps": 500,
+        "decay_start": null,
+        "threshold_beta": 0.999,
+        "threshold_start_step": 1000,
+        "seed": null,
+        "activation_dim": 480,
+        "dict_size": 30720,
+        "k": 128,
+        "device": "cuda",
+        "layer": 2,
+        "lm_name": "yangheng/PlantRNA-FM",
+        "wandb_name": "plantrnafm-layer-2-k-128_trainer_0",
+        "submodule_name": null
+    },
+    "buffer": {
+        "d_submodule": 480,
+        "io": "out",
+        "n_ctxs": 100,
+        "ctx_len": 128,
+        "refresh_batch_size": 64,
+        "out_batch_size": 1024,
+        "device": "cuda"
+    }
+}

layer_2/k_256/trainer_0/ae.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:32237c44bf01cde70658bc7a89ecb0a6335ba3192ba67fd87874baa4cc3eb955
+size 118091993

layer_2/k_256/trainer_0/config.json ADDED Viewed

+{
+    "trainer": {
+        "trainer_class": "TopKTrainer",
+        "dict_class": "AutoEncoderTopK",
+        "lr": 1e-05,
+        "steps": 10000,
+        "auxk_alpha": 0.03125,
+        "warmup_steps": 500,
+        "decay_start": null,
+        "threshold_beta": 0.999,
+        "threshold_start_step": 1000,
+        "seed": null,
+        "activation_dim": 480,
+        "dict_size": 30720,
+        "k": 256,
+        "device": "cuda",
+        "layer": 2,
+        "lm_name": "yangheng/PlantRNA-FM",
+        "wandb_name": "plantrnafm-layer-2-k-256_trainer_0",
+        "submodule_name": null
+    },
+    "buffer": {
+        "d_submodule": 480,
+        "io": "out",
+        "n_ctxs": 100,
+        "ctx_len": 128,
+        "refresh_batch_size": 64,
+        "out_batch_size": 1024,
+        "device": "cuda"
+    }
+}

layer_2/k_32/trainer_0/ae.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e0dfb1b820cf8fad633445faa388ba84ebd1f025ae6e42f72b30d73885a186df
+size 118091993

layer_2/k_32/trainer_0/config.json ADDED Viewed

+{
+    "trainer": {
+        "trainer_class": "TopKTrainer",
+        "dict_class": "AutoEncoderTopK",
+        "lr": 1e-05,
+        "steps": 10000,
+        "auxk_alpha": 0.03125,
+        "warmup_steps": 500,
+        "decay_start": null,
+        "threshold_beta": 0.999,
+        "threshold_start_step": 1000,
+        "seed": null,
+        "activation_dim": 480,
+        "dict_size": 30720,
+        "k": 32,
+        "device": "cuda",
+        "layer": 2,
+        "lm_name": "yangheng/PlantRNA-FM",
+        "wandb_name": "plantrnafm-layer-2-k-32_trainer_0",
+        "submodule_name": null
+    },
+    "buffer": {
+        "d_submodule": 480,
+        "io": "out",
+        "n_ctxs": 100,
+        "ctx_len": 128,
+        "refresh_batch_size": 64,
+        "out_batch_size": 1024,
+        "device": "cuda"
+    }
+}

layer_2/k_512/trainer_0/ae.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:69ae55d82cc9f07a0ddb209eb598444dada29e2091b7840a8dc97ddedecbef8e
+size 118091993

layer_2/k_512/trainer_0/config.json ADDED Viewed

+{
+    "trainer": {
+        "trainer_class": "TopKTrainer",
+        "dict_class": "AutoEncoderTopK",
+        "lr": 1e-05,
+        "steps": 10000,
+        "auxk_alpha": 0.03125,
+        "warmup_steps": 500,
+        "decay_start": null,
+        "threshold_beta": 0.999,
+        "threshold_start_step": 1000,
+        "seed": null,
+        "activation_dim": 480,
+        "dict_size": 30720,
+        "k": 512,
+        "device": "cuda",
+        "layer": 2,
+        "lm_name": "yangheng/PlantRNA-FM",
+        "wandb_name": "plantrnafm-layer-2-k-512_trainer_0",
+        "submodule_name": null
+    },
+    "buffer": {
+        "d_submodule": 480,
+        "io": "out",
+        "n_ctxs": 100,
+        "ctx_len": 128,
+        "refresh_batch_size": 64,
+        "out_batch_size": 1024,
+        "device": "cuda"
+    }
+}

layer_2/k_64/trainer_0/ae.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e23245d31fe1f7d11fcfb998a0d974c5527053184b42846522c1e6151fb07976
+size 118091993

layer_2/k_64/trainer_0/config.json ADDED Viewed

+{
+    "trainer": {
+        "trainer_class": "TopKTrainer",
+        "dict_class": "AutoEncoderTopK",
+        "lr": 1e-05,
+        "steps": 10000,
+        "auxk_alpha": 0.03125,
+        "warmup_steps": 500,
+        "decay_start": null,
+        "threshold_beta": 0.999,
+        "threshold_start_step": 1000,
+        "seed": null,
+        "activation_dim": 480,
+        "dict_size": 30720,
+        "k": 64,
+        "device": "cuda",
+        "layer": 2,
+        "lm_name": "yangheng/PlantRNA-FM",
+        "wandb_name": "plantrnafm-layer-2-k-64_trainer_0",
+        "submodule_name": null
+    },
+    "buffer": {
+        "d_submodule": 480,
+        "io": "out",
+        "n_ctxs": 100,
+        "ctx_len": 128,
+        "refresh_batch_size": 64,
+        "out_batch_size": 1024,
+        "device": "cuda"
+    }
+}