diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f9a2955f6f21606fab6351bae7803abd139a26a4 --- /dev/null +++ b/config.json @@ -0,0 +1 @@ +{"sae": {"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false}, "batch_size": 32, "grad_acc_steps": 1, "micro_acc_steps": 1, "lr": null, "lr_warmup_steps": 1000, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["layers.0", "layers.1", "layers.2", "layers.3", "layers.4", "layers.5", "layers.6", "layers.7", "layers.8", "layers.9", "layers.10", "layers.11", "layers.12", "layers.13", "layers.14", "layers.15", "layers.16", "layers.17", "layers.18", "layers.19", "layers.20", "layers.21", "layers.22", "layers.23", "layers.24", "layers.25", "layers.26", "layers.27"], "layers": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27], "layer_stride": 1, "distribute_modules": false, "save_every": 1000, "log_to_wandb": true, "run_name": null, "wandb_log_frequency": 1, "model": "Qwen/Qwen2.5-Coder-1.5B-Instruct", "dataset": "nguyentruong-ins/codeforces_cpp_cleaned_scaled_class", "split": "train", "ctx_len": 2048, "hf_token": null, "load_in_8bit": false, "max_examples": null, "resume": false, "seed": 42, "data_preprocessing_num_proc": 24} \ No newline at end of file diff --git a/layers.0/cfg.json b/layers.0/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.0/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.0/sae.safetensors b/layers.0/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..144a3e1fe9a3b130208e8518bd7583b49c2a65d3 --- /dev/null +++ b/layers.0/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39880181f031fbc68a510345d568802e9fd5caaff0b546e2ba2e4fa7e9f6d01 +size 151050568 diff --git a/layers.1/cfg.json b/layers.1/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.1/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.1/sae.safetensors b/layers.1/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eba6a3cf0abedeb0dc84f47f634aa5d65b9ff50f --- /dev/null +++ b/layers.1/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6656820213ca89a620e217deac9ee3c7230b5188c454d9e40fff0e66fe8e0dad +size 151050568 diff --git a/layers.10/cfg.json b/layers.10/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.10/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.10/sae.safetensors b/layers.10/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..608ce492279c25205d304457b5b5278539e2bdb1 --- /dev/null +++ b/layers.10/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f60f22a8cf94b80cb82ccd275aa422f9af36d36771e8a340ff6a723228976b8 +size 151050568 diff --git a/layers.11/cfg.json b/layers.11/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.11/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.11/sae.safetensors b/layers.11/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4814d1d437c25959d7c1baff6771405f96e6de2d --- /dev/null +++ b/layers.11/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37e706849914760e9a000d03b3afb104140f8cf909f66397ed9e46ab73db1ce0 +size 151050568 diff --git a/layers.12/cfg.json b/layers.12/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.12/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.12/sae.safetensors b/layers.12/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7bd1627276aaa3b8f53fd043d4d274d520df104b --- /dev/null +++ b/layers.12/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bacb8f558bfcbe18437cbfd1d6220cec83beb456c06d69c295058e010c6c32a +size 151050568 diff --git a/layers.13/cfg.json b/layers.13/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.13/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.13/sae.safetensors b/layers.13/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5926aff31eba0af70d9dc7405afb631fa49e3093 --- /dev/null +++ b/layers.13/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9a72de125ffca731f29f54436ff27aa5d78a019fb86c316ef395e1b3d2429e +size 151050568 diff --git a/layers.14/cfg.json b/layers.14/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.14/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.14/sae.safetensors b/layers.14/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4be599a9aca5ead07e8ae237366cee6d9d76bcea --- /dev/null +++ b/layers.14/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:653b5b0758420b429aab15c44d205b984fe9b192907f176fa75b615558d91759 +size 151050568 diff --git a/layers.15/cfg.json b/layers.15/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.15/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.15/sae.safetensors b/layers.15/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bdc89203abf68d7b036a2d22f1f1216d05c67c43 --- /dev/null +++ b/layers.15/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db2e3e39deaecc67ade3d7d022a15840e907fa17f95baa20407d46449fe9c5a +size 151050568 diff --git a/layers.16/cfg.json b/layers.16/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.16/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.16/sae.safetensors b/layers.16/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..820f4c33e42cbc3f582422fa271cb8c739d456dd --- /dev/null +++ b/layers.16/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:026a09ed2be59d8add071b7e1afed28e394868cd3546e6d32d1e89856e731297 +size 151050568 diff --git a/layers.17/cfg.json b/layers.17/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.17/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.17/sae.safetensors b/layers.17/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4cc8f0c52bf6fcce910f366c2088a39abc06366b --- /dev/null +++ b/layers.17/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2b688a9c19feb02ecac969dc5bebfd4a19531d8c28235bc58c79d7c26e29833 +size 151050568 diff --git a/layers.18/cfg.json b/layers.18/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.18/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.18/sae.safetensors b/layers.18/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a5857177468d194c0212d019ceaab3ba5b037f84 --- /dev/null +++ b/layers.18/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cad28c3f09f6b5f7cd0ab9092c0191eafaded76e96c980e3e2b588b57e8def2 +size 151050568 diff --git a/layers.19/cfg.json b/layers.19/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.19/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.19/sae.safetensors b/layers.19/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37d95f59f5e84f1489064e3974ca93013834e2f5 --- /dev/null +++ b/layers.19/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb692927b7b0822c72a03a9c77f91ffd7a6d2dbc51bfd083a9782eeb57eac310 +size 151050568 diff --git a/layers.2/cfg.json b/layers.2/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.2/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.2/sae.safetensors b/layers.2/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5b9b34aea0eb2fe06ec91c09d855be0be83229cc --- /dev/null +++ b/layers.2/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66d2e06b0b875d104083abe36e2c1639a4aa0106594d0bbff8920011333050f4 +size 151050568 diff --git a/layers.20/cfg.json b/layers.20/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.20/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.20/sae.safetensors b/layers.20/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..38a36dac78daeaa141c1eb864009089e68dbb5eb --- /dev/null +++ b/layers.20/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fa58103ed27c842bb7705231eebb996e3fb79ebc383905de5fb8c49bd92cd39 +size 151050568 diff --git a/layers.21/cfg.json b/layers.21/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.21/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.21/sae.safetensors b/layers.21/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..553d7a92338455bb65da5ed60b374207e91d8ce6 --- /dev/null +++ b/layers.21/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb4bd9cfc846a7a4a79acf3c04ce755d09a4c27fca15d1554b50a5cccd111d9 +size 151050568 diff --git a/layers.22/cfg.json b/layers.22/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.22/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.22/sae.safetensors b/layers.22/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6c2bb9f73a6dce370f34a2c53fba6d3733d35c82 --- /dev/null +++ b/layers.22/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077bfc58ca19cf2ba2093b035a0b88c0dc0233e0b347a5661a51ccafea87a206 +size 151050568 diff --git a/layers.23/cfg.json b/layers.23/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.23/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.23/sae.safetensors b/layers.23/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c49e83a9d4d28d566e7cf8acbc3b44e9e82c0fb7 --- /dev/null +++ b/layers.23/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b36d801dc9c800583283b44e98771781e852f0f07b84526c914bc9fa18ff7ed +size 151050568 diff --git a/layers.24/cfg.json b/layers.24/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.24/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.24/sae.safetensors b/layers.24/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..112818b4866b3268a53d9f762e1cb2f9e3b64b6e --- /dev/null +++ b/layers.24/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ef7e75d4d1b28cf67df09363f8dc4bcb06b02784ef6d2d27759d9f78754b2de +size 151050568 diff --git a/layers.25/cfg.json b/layers.25/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.25/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.25/sae.safetensors b/layers.25/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d815515fd9e736958104a26d56ae5009595dc7a --- /dev/null +++ b/layers.25/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6bbf1d2dd0a5026d97c4173fdc26153203a2e64cb89b2764c8fcc70016ee991 +size 151050568 diff --git a/layers.26/cfg.json b/layers.26/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.26/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.26/sae.safetensors b/layers.26/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6fafa58672d882b7e28fc7cb16dfd7861258ad94 --- /dev/null +++ b/layers.26/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28ca88aa0f30f1c078af14b6f90f777331f7d8a1d65fa23cea5d459673465f6a +size 151050568 diff --git a/layers.27/cfg.json b/layers.27/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.27/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.27/sae.safetensors b/layers.27/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b687a7a505b281acd59b3d23af5be3d51e60e4da --- /dev/null +++ b/layers.27/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d19ff41f7177623c15386af09827b877e179ff964e9df409c06525b44f8be2 +size 151050568 diff --git a/layers.3/cfg.json b/layers.3/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.3/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.3/sae.safetensors b/layers.3/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1fb83367ccadc16dfea61c769787275a678afe55 --- /dev/null +++ b/layers.3/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc5f8230f650287b6d9347b2691b3589756a62d123c6efba8aea51bfff1cdd39 +size 151050568 diff --git a/layers.4/cfg.json b/layers.4/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.4/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.4/sae.safetensors b/layers.4/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b91ae0eff918a8b37a52e3cd9d441471c8151c17 --- /dev/null +++ b/layers.4/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8937fcac0971021d239e08041ae55e92fde123a6a1dedb8fdcddeed03ce92376 +size 151050568 diff --git a/layers.5/cfg.json b/layers.5/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.5/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.5/sae.safetensors b/layers.5/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..047f213122390f57983b840dfcb174b8c7e3266c --- /dev/null +++ b/layers.5/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2255a6ec48dbb9481394659a11d3c642ce63cafb0f5bb674c435b0e31a2068a0 +size 151050568 diff --git a/layers.6/cfg.json b/layers.6/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.6/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.6/sae.safetensors b/layers.6/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f9effb5cff3b56fbcacdb51c862b37a7b18c16b4 --- /dev/null +++ b/layers.6/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19e3ca656028f54e08cc13223cf7a17d55d088a832d5c55f77d62baceb6008dc +size 151050568 diff --git a/layers.7/cfg.json b/layers.7/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.7/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.7/sae.safetensors b/layers.7/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7deee1765b7aa1549b202d52bfca1b33f9ca667f --- /dev/null +++ b/layers.7/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9d958d29062795f00468105b396717ef446de9bbb9b0d16457b917a47079440 +size 151050568 diff --git a/layers.8/cfg.json b/layers.8/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.8/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.8/sae.safetensors b/layers.8/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ee006f99df11efc9a276483e78e5d339afa1e8ce --- /dev/null +++ b/layers.8/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9be63cb6dd77589bf45382ae6d472216ed7815ab0aa5a6920e1d01d312d1a7b8 +size 151050568 diff --git a/layers.9/cfg.json b/layers.9/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc49f1b73a3a5514c7540038266ba638ef7ae7b --- /dev/null +++ b/layers.9/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 8, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 1536} \ No newline at end of file diff --git a/layers.9/sae.safetensors b/layers.9/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aa77a04fde12a3dad7e6c93d81a63e8436450da6 --- /dev/null +++ b/layers.9/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b09277371bf20fb128445ba65e4c9fbaf0fb86a1e77d22e63bb705726b1beba +size 151050568 diff --git a/lr_scheduler.pt b/lr_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b4200b4d10356d7982d1af568e9365839908fe --- /dev/null +++ b/lr_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dde87a8e3079ed147bca886c8df4d981d9e856d8379bc3ba3ffabbd9efc72b5 +size 1588 diff --git a/optimizer.pt b/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..083adb511ca3394f7f74382e49631c16f6c76774 --- /dev/null +++ b/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba37caa0fcb08aed1bb72e666d7521c77eb411f793016575a69f5a15a8b80237 +size 8458912622 diff --git a/state.pt b/state.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd797dad05b8f80bd245c74d2df142f4bb58f73d --- /dev/null +++ b/state.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52397a1f0dcc23325c48d45aada6966ba0c95149cd29fcb8e05ce17d97a7f126 +size 2759106