diff --git a/latents/layers.0.mlp/0_26213.safetensors b/latents/layers.0.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..99cad67e9fedf11815e3ffe48c0b92c3e4c9d13d --- /dev/null +++ b/latents/layers.0.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e350b6d5b35a952529413c6f4c91d16adec385c69b7886f0183fdc6583a1d3 +size 107301648 diff --git a/latents/layers.0.mlp/104857_131071.safetensors b/latents/layers.0.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f7edb20070c33fe2c2558f45a1cffdd1ac79daed --- /dev/null +++ b/latents/layers.0.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f2309f75a68953cff0068a56434c4cee5f083f0d077455ca06241a408f37a2e +size 109044384 diff --git a/latents/layers.0.mlp/26214_52427.safetensors b/latents/layers.0.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3879c977a434399c7b9c849a525c1fcac4f0f3b1 --- /dev/null +++ b/latents/layers.0.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5bbbca72561872b97d3bf86ab4eae465d766e8523fadbf242008060b466d863 +size 106639112 diff --git a/latents/layers.0.mlp/52428_78642.safetensors b/latents/layers.0.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8bd93284c4f1e4e9635dc39a12a8c8bc1d707cf1 --- /dev/null +++ b/latents/layers.0.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ba79d34a60eb29c52e5122315d4fc7549cda57bba493f2e968aaf6f4ad3d8f +size 106279024 diff --git a/latents/layers.0.mlp/78643_104856.safetensors b/latents/layers.0.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c0363f073dacd1e497366b710ea5c2f3607b09d --- /dev/null +++ b/latents/layers.0.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c2df0bea2e9e79c262f62d516a84e4cd2a752d8048b99f6b4662f620196396e +size 109546792 diff --git a/latents/layers.0.mlp/config.json b/latents/layers.0.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.0.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.1.mlp/0_26213.safetensors b/latents/layers.1.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0af9a47f49200b54324aaef874e9b0613df3a53d --- /dev/null +++ b/latents/layers.1.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:221f8753bee310bce9f0c5a6917f6264c5eb0ce86b1d8f4c5c0d683e1dc09be4 +size 110911176 diff --git a/latents/layers.1.mlp/104857_131071.safetensors b/latents/layers.1.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bf8a0a583cc04bd0a8e34c3e1a44e94016069401 --- /dev/null +++ b/latents/layers.1.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35e55d621fec46ba7525d92b852b8f6f830dfc659ba4ad2c91bf43cfcc185f84 +size 110977304 diff --git a/latents/layers.1.mlp/26214_52427.safetensors b/latents/layers.1.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bc66df6a18b4700e3afb0c11865bc229b1ccc2cf --- /dev/null +++ b/latents/layers.1.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9893fa5fba58f05ce62561a340bbb3d21a35fb96e590113911d97e58c2d5851 +size 108050288 diff --git a/latents/layers.1.mlp/52428_78642.safetensors b/latents/layers.1.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..228525bed46c15af221de57e7cfea8ab450b1654 --- /dev/null +++ b/latents/layers.1.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d928f8b03d620695844295e4e0bd8be4d95434ae6a2c3df8b6f8452cb41a895e +size 108531216 diff --git a/latents/layers.1.mlp/78643_104856.safetensors b/latents/layers.1.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2e0dee0fe8dd8e776be76120650e81fc3b0a0b1 --- /dev/null +++ b/latents/layers.1.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49e1e233c867b7b73c019049cb928da88d697c4ce25e1884dde556e0a8258d94 +size 112747432 diff --git a/latents/layers.1.mlp/config.json b/latents/layers.1.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.1.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.10.mlp/0_26213.safetensors b/latents/layers.10.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f4f867e30ad222b42ea5d7f71054f869225517ec --- /dev/null +++ b/latents/layers.10.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a85161acb075a57480de2eda37b185cd488d2512b5f2e6f901a0addb6911858 +size 108743648 diff --git a/latents/layers.10.mlp/104857_131071.safetensors b/latents/layers.10.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d227ae263dd0e5c594e838e8b8834f4493a14af9 --- /dev/null +++ b/latents/layers.10.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82632ab91e08815a503ba97c3e19bc37f18ff07d67140f75810910faf31af76b +size 108942520 diff --git a/latents/layers.10.mlp/26214_52427.safetensors b/latents/layers.10.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..99360e802578efed573c60c0045e43f65f8de610 --- /dev/null +++ b/latents/layers.10.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:807ee3e54dc671ea4a6d558b2ce3e6b95db0d70fb112b3cce0a816f29781e233 +size 105453944 diff --git a/latents/layers.10.mlp/52428_78642.safetensors b/latents/layers.10.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..357dc3361b7923ac21984c8d8d136fb99e051deb --- /dev/null +++ b/latents/layers.10.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7bf09049c805443e7f8524186954edde69c4d9d6d8160b8ac65d92711ef1466 +size 107282560 diff --git a/latents/layers.10.mlp/78643_104856.safetensors b/latents/layers.10.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ca8e939dc308b3d086a584286f2d44dfeff28691 --- /dev/null +++ b/latents/layers.10.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5aa210d214a55cb3ed996be637bc6276f2513625a618baf05f4f60f397400c5 +size 110569584 diff --git a/latents/layers.10.mlp/config.json b/latents/layers.10.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.10.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.11.mlp/0_26213.safetensors b/latents/layers.11.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..754bcfdb711720a4157d40d5eeeaf2a474ea446e --- /dev/null +++ b/latents/layers.11.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:691412dfd6f2292d95a912ed27d9e9a5a30ac98e3c02213919e87b7f7424b806 +size 109423056 diff --git a/latents/layers.11.mlp/104857_131071.safetensors b/latents/layers.11.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..965e1fd15c8bd18cb99f1a925e3de67c280741e5 --- /dev/null +++ b/latents/layers.11.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:403257c9860b2cfaf4e0899bb129166872c9bbafd8749a04c6d7a42f34047db7 +size 108716384 diff --git a/latents/layers.11.mlp/26214_52427.safetensors b/latents/layers.11.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..af2859e598b4f1bbe07a1ea2e0851fae24df4435 --- /dev/null +++ b/latents/layers.11.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04121c34b2d2e976cbf9bccfb12609724233499f108b6f3575dbdf1b1fb974f0 +size 111913584 diff --git a/latents/layers.11.mlp/52428_78642.safetensors b/latents/layers.11.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a518fd25dd1907ef348e0d7b9222b7b0e4ffaf56 --- /dev/null +++ b/latents/layers.11.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cd3b5ae3c8f94541288133c2d968a7d9dd5316edc4885427b32a131bfdd6c51 +size 107561560 diff --git a/latents/layers.11.mlp/78643_104856.safetensors b/latents/layers.11.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5cb6813d8ff90165e43b2d525117639cf8d62940 --- /dev/null +++ b/latents/layers.11.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99e2c71bd43171ff1cdd6c8817e4aae374454d4e4a12063145a87ef981f404a6 +size 111203144 diff --git a/latents/layers.11.mlp/config.json b/latents/layers.11.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.11.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.12.mlp/0_26213.safetensors b/latents/layers.12.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6237d705fe1d93dd80a5e5d9d97af9339973b20f --- /dev/null +++ b/latents/layers.12.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6a171abaec5cfe84683925e24595df65578e4249b3d837c282e4569459c9600 +size 113396176 diff --git a/latents/layers.12.mlp/104857_131071.safetensors b/latents/layers.12.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..acb89224b0cc75262f9ab842eed14472edfb85e3 --- /dev/null +++ b/latents/layers.12.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:840a30760acfd7ffe7a9a9ad9aeb42988094c029b26b28e66558d9f3d575c2d8 +size 111557120 diff --git a/latents/layers.12.mlp/26214_52427.safetensors b/latents/layers.12.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d5af11a09d80bccb23807dbc91721728d4cc3570 --- /dev/null +++ b/latents/layers.12.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b3b115160769b434966613265b751487fce7bb71d89049fed98634094244bd +size 109583184 diff --git a/latents/layers.12.mlp/52428_78642.safetensors b/latents/layers.12.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..35f1fda2d2677a2fbf46cc4e9c12d08d2be88a68 --- /dev/null +++ b/latents/layers.12.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdb11c06810538aaf4a0448d868b1d2dda55f59383f1d1477ab967652427375b +size 105529168 diff --git a/latents/layers.12.mlp/78643_104856.safetensors b/latents/layers.12.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..859510f8a920e50b9033e10c8c7335e17f2b06eb --- /dev/null +++ b/latents/layers.12.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b8f589e76ff9c8a1c41875816b958539077ea6c5d61b7246d6b428a4a03b8b7 +size 111475304 diff --git a/latents/layers.12.mlp/config.json b/latents/layers.12.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.12.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.13.mlp/0_26213.safetensors b/latents/layers.13.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..40b9fcbfef001aac06de11c4e85726c2f5574258 --- /dev/null +++ b/latents/layers.13.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f25bfe4fc2ffbccdaecad2287d1857450473130e64e96fd7002639da3e01e72 +size 109446144 diff --git a/latents/layers.13.mlp/104857_131071.safetensors b/latents/layers.13.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1825bdc74dfcf8780ef28e87b435bbc0afeac59b --- /dev/null +++ b/latents/layers.13.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:791e3c8beee6e7728f8e34af8f6ba0c835751ceb2c78726c7b6bc5b3ab467e0e +size 113120168 diff --git a/latents/layers.13.mlp/26214_52427.safetensors b/latents/layers.13.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc0fda6175a057064758d2438d708bf7301f51e8 --- /dev/null +++ b/latents/layers.13.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:206f2383604780a04552141c13b0fa9847e43d1ed87b0829c167d126eaf6f014 +size 111368760 diff --git a/latents/layers.13.mlp/52428_78642.safetensors b/latents/layers.13.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a3ff677af0de2fbfb84a9658f8836bad9c8a6fe8 --- /dev/null +++ b/latents/layers.13.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:994e20c8ef7b5c7156e174d47b5bc62af876ada5d0019b7f468fa22b47648cc7 +size 109394832 diff --git a/latents/layers.13.mlp/78643_104856.safetensors b/latents/layers.13.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5eea74a0ea800a8d21f69740cf9f3d22291805a4 --- /dev/null +++ b/latents/layers.13.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87d95b92212690aabb2b3f4215fb4ab1251b15f50558de95ac898739d4782e12 +size 108328608 diff --git a/latents/layers.13.mlp/config.json b/latents/layers.13.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.13.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.14.mlp/0_26213.safetensors b/latents/layers.14.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a4cf03abf6723f2d49fcfd4e71b51c70d30d46fb --- /dev/null +++ b/latents/layers.14.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ec55459c552fd2e1a560dddfa79da3011134a55f6db231891773e3cdd5c455 +size 110147648 diff --git a/latents/layers.14.mlp/104857_131071.safetensors b/latents/layers.14.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b65ac1771e0197d1bcd238361a3f10e2e7265d54 --- /dev/null +++ b/latents/layers.14.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e1cda53fcd60b0e19b7db820aa4e3753d9a31871da13877ffa500475bd1dc5a +size 110410840 diff --git a/latents/layers.14.mlp/26214_52427.safetensors b/latents/layers.14.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d7e1d9fc6523d18b0ec9077eeee213b3be6c51bd --- /dev/null +++ b/latents/layers.14.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20f1aa0125ba961b41da465eaf6141bc44cb958259dedd353d822c1f3bd59279 +size 109638624 diff --git a/latents/layers.14.mlp/52428_78642.safetensors b/latents/layers.14.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ee674dae39879cc4b29b8e04fa8034dcd24f4975 --- /dev/null +++ b/latents/layers.14.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6492dfbfb4556df153bdcb51d842be618006b6f75a0e87633d3639a65f2785f1 +size 107932232 diff --git a/latents/layers.14.mlp/78643_104856.safetensors b/latents/layers.14.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6ae83436e2386a97c6152f97494f90a3da9d3cf9 --- /dev/null +++ b/latents/layers.14.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cbf762318d8ec012e292bedcd066d57afd4c683916c1434fba0eae61c4cbb62 +size 111437792 diff --git a/latents/layers.14.mlp/config.json b/latents/layers.14.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.14.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.15.mlp/0_26213.safetensors b/latents/layers.15.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..af3b356f1c6f76b06183fd105d15fedaf94f5ddc --- /dev/null +++ b/latents/layers.15.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e7f36353cfed3f360bb643577ce9e9271350b764b96292bce6d970fc79360e0 +size 55112120 diff --git a/latents/layers.15.mlp/104857_131071.safetensors b/latents/layers.15.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..867bea77d2e42525cbf910b936532bcee8bd8f10 --- /dev/null +++ b/latents/layers.15.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3755221bb8c87a46eb7fd293451909e34f6c8055fc942c4dee2916de8b57d8a5 +size 60528432 diff --git a/latents/layers.15.mlp/26214_52427.safetensors b/latents/layers.15.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c2c09920cbfeac9567355ba82583c6048844cc13 --- /dev/null +++ b/latents/layers.15.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7348126ab3747610fe5da829fdf76f3e200f0aa7fd8adee9de98b204195cf471 +size 58377008 diff --git a/latents/layers.15.mlp/52428_78642.safetensors b/latents/layers.15.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8c18091d9626e27b6563546c16aeb7fadc569ce7 --- /dev/null +++ b/latents/layers.15.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f74e63e65c50b234f9c84d3f721c6561ae59d6f05265b1e56c215f4038bbbc60 +size 56487664 diff --git a/latents/layers.15.mlp/78643_104856.safetensors b/latents/layers.15.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..274daa39952317f814d6f0a44c4a1cb020166c0a --- /dev/null +++ b/latents/layers.15.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea3f96cfd7f210e552c3999f1477d6bf06ab3f819a8691d2d5353431353362f4 +size 56942152 diff --git a/latents/layers.15.mlp/config.json b/latents/layers.15.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.15.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.2.mlp/0_26213.safetensors b/latents/layers.2.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7dd828534d4de13c9c287d139cdfbd7a2ea9d7cf --- /dev/null +++ b/latents/layers.2.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fef26c4f23e6db3c02badac2029e63aae267a7d6713f65d20322756d7a057594 +size 107833368 diff --git a/latents/layers.2.mlp/104857_131071.safetensors b/latents/layers.2.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fde4a46efa313c400faee8d5947dd6dd5e18ca49 --- /dev/null +++ b/latents/layers.2.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed6b15b4aab58855b241794492434ee17f0a1d192787a42488c495b69026512b +size 112214288 diff --git a/latents/layers.2.mlp/26214_52427.safetensors b/latents/layers.2.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a7f136402bd03c2b04d07811b89950a73729016f --- /dev/null +++ b/latents/layers.2.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5916b15ecb8de19e7640c8d390dae0de9155bdaedd43ed9da95aeed17673ef4a +size 109290856 diff --git a/latents/layers.2.mlp/52428_78642.safetensors b/latents/layers.2.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fca5fba767e84ecd16cc77b2535eab8639af3843 --- /dev/null +++ b/latents/layers.2.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0303b2a72b12df317a749bc52c57e62f50d98a68503c21785cead369018ccb8 +size 107846704 diff --git a/latents/layers.2.mlp/78643_104856.safetensors b/latents/layers.2.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..84e3291a3aa93c5edaef938b9f394de862c2f9dc --- /dev/null +++ b/latents/layers.2.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa0f0bd32b63032831be45b8586518f06f8de21ab8afbd8016cc0b6d9b72bbd4 +size 114489792 diff --git a/latents/layers.2.mlp/config.json b/latents/layers.2.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.2.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.3.mlp/0_26213.safetensors b/latents/layers.3.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5df6a498b6480b757c1e0c49538f0cfcb4e76776 --- /dev/null +++ b/latents/layers.3.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a25a6e4b0735229b78dc96bda8ec651ee34ff349cb00ad2f2a1c46f7683c6d3 +size 108315168 diff --git a/latents/layers.3.mlp/104857_131071.safetensors b/latents/layers.3.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e0506d16c379f7e8cd6947d73f05e0263e5ebc98 --- /dev/null +++ b/latents/layers.3.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e78551f139a87e58a145908b4fb99c5eb3d442194a92ad71dea9af226badfa1 +size 108118656 diff --git a/latents/layers.3.mlp/26214_52427.safetensors b/latents/layers.3.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cb30a8affe43330559e379ef46c4321e1c442822 --- /dev/null +++ b/latents/layers.3.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4915df7e86b6d003b7ef802ff599ca06a96bd09701ae86516a386eeee3031a4 +size 105770928 diff --git a/latents/layers.3.mlp/52428_78642.safetensors b/latents/layers.3.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d16a79410fcbb126c98625b348c2d60150b0035 --- /dev/null +++ b/latents/layers.3.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:159c8af3d2d04f33650bc4fa4c60f361b05ff9ebb870d2eb7ddbeb6c0833d77b +size 112412440 diff --git a/latents/layers.3.mlp/78643_104856.safetensors b/latents/layers.3.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2b2445a31693b8d35be8c036d38eaef85627d63b --- /dev/null +++ b/latents/layers.3.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32d9edbc1335d708c82183d048361a13cae2eb51f38639b4fbebc19382642d72 +size 104999448 diff --git a/latents/layers.3.mlp/config.json b/latents/layers.3.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.3.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.4.mlp/0_26213.safetensors b/latents/layers.4.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ae4d237ecdb722775ab75678653f984916042e1d --- /dev/null +++ b/latents/layers.4.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33d6dd63cfd18c83ab7055016cd9d039a5b1ce553665b1096381cd87af55ed02 +size 111537280 diff --git a/latents/layers.4.mlp/104857_131071.safetensors b/latents/layers.4.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..93fc4f65ce0f59c204b0925821073783409205bc --- /dev/null +++ b/latents/layers.4.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2183042332e1e459bb20af6e0906f79780a950e998491e601dca999ba2b8d3ca +size 108898008 diff --git a/latents/layers.4.mlp/26214_52427.safetensors b/latents/layers.4.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f47d7e7d87914795535db9fbd5ede8ab024a56bb --- /dev/null +++ b/latents/layers.4.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e9403eb94f29221ccc65b64ac079f8757e6176430070499b1fe2913d07bcb34 +size 110143376 diff --git a/latents/layers.4.mlp/52428_78642.safetensors b/latents/layers.4.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a7f6c2189bc3d4a75d4e3436a61937a532ed81cc --- /dev/null +++ b/latents/layers.4.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cef11caad2879f13ed36b4c2d1bf436eec4603864df6c6bb94673883894a5af4 +size 109389192 diff --git a/latents/layers.4.mlp/78643_104856.safetensors b/latents/layers.4.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0203de864ad78cd89336f89c0438c21657d8fdcd --- /dev/null +++ b/latents/layers.4.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b49f1d88cb622a1016f897d4db6bd20a24c6f9ba64f3034f4d7e8450247d42 +size 110287488 diff --git a/latents/layers.4.mlp/config.json b/latents/layers.4.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.4.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.5.mlp/0_26213.safetensors b/latents/layers.5.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9922f38d68ce5f6e19f1367ec7c32925d5da19c9 --- /dev/null +++ b/latents/layers.5.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794495a846e12b320bc8d3f63173a053827a6ac3c10b0603a4391fe11eb45014 +size 98003456 diff --git a/latents/layers.5.mlp/104857_131071.safetensors b/latents/layers.5.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3ca2cd0c896a4706e63075af46f6e7704ecc29e1 --- /dev/null +++ b/latents/layers.5.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6135f2328b01947b3f6ddd51444149ae1da1d5eb722969f7a9c6597de6ffaa53 +size 96742064 diff --git a/latents/layers.5.mlp/26214_52427.safetensors b/latents/layers.5.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4130a0ee66cae4e3302495471344e8e2e73b3927 --- /dev/null +++ b/latents/layers.5.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95becd39d590801f1dfc1d74c2c7026224c310e66c4ac5782adfb3c2f198d2d0 +size 96754760 diff --git a/latents/layers.5.mlp/52428_78642.safetensors b/latents/layers.5.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6ddaf945b4a7a6f1791f036b7cd9fe2131a12051 --- /dev/null +++ b/latents/layers.5.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a12a796060f7c006f6404466c884ecf6bae4116e19afb7c24ded08098d3877b +size 96973448 diff --git a/latents/layers.5.mlp/78643_104856.safetensors b/latents/layers.5.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..22d6c22afeb502e5acb4d5bab496c23bde10bff3 --- /dev/null +++ b/latents/layers.5.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df77a500a80674f6d3d2a5a6a4bfd461529182c2cf87f095c110961e9a252ff8 +size 98470688 diff --git a/latents/layers.5.mlp/config.json b/latents/layers.5.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.5.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.6.mlp/0_26213.safetensors b/latents/layers.6.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5bee9ce8acc33699000576cd4f935d44aaaf7926 --- /dev/null +++ b/latents/layers.6.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ec69d6bc1250f74da4d130192897379c00cb5940726b24f53040555ca0e90ad +size 97041432 diff --git a/latents/layers.6.mlp/104857_131071.safetensors b/latents/layers.6.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1768945609345447b8c3f8f3221ad06880a48d42 --- /dev/null +++ b/latents/layers.6.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eab2a4f336490d71ca26f78a3e49faf4406870ac2003d5ae23e87a60b08773c7 +size 94274296 diff --git a/latents/layers.6.mlp/26214_52427.safetensors b/latents/layers.6.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e970b6b23cb2b80db16501c06592fe2b22b8c8ed --- /dev/null +++ b/latents/layers.6.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d94e5b6ce554b61f073c5776db0bb6212510bba239d0b8570f851e40584902e +size 96426328 diff --git a/latents/layers.6.mlp/52428_78642.safetensors b/latents/layers.6.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be0e1fbed4c17152ac8b0522f959ce5a46840785 --- /dev/null +++ b/latents/layers.6.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e6298c5390a217a9b0d60d137f0fb40e50749a50002f9e6880a32ed16cf477 +size 94133432 diff --git a/latents/layers.6.mlp/78643_104856.safetensors b/latents/layers.6.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cb3545de2a856fb1e7a9b0d0b3b0e7922c052d0a --- /dev/null +++ b/latents/layers.6.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb40fae3f7ece6a05b1360b12c2e8f7b6f6fa3c1a90a94a9986357b8ea4a3bcd +size 96685280 diff --git a/latents/layers.6.mlp/config.json b/latents/layers.6.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.6.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.7.mlp/0_26213.safetensors b/latents/layers.7.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd74b1a6b7b4e0f02501302b1940d41ba923c9ba --- /dev/null +++ b/latents/layers.7.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f81071320eb87371ba604950932a9d5fc2e25ffacbacac22063c0c24a4138ca +size 93064928 diff --git a/latents/layers.7.mlp/104857_131071.safetensors b/latents/layers.7.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d6ed7a3fb676b5b1720a86c4f7862441a52d4acb --- /dev/null +++ b/latents/layers.7.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd4a63280e8404c5bbc7e14fab0e0efe89f178c4a7ff93d240f89f9c699f136 +size 93101312 diff --git a/latents/layers.7.mlp/26214_52427.safetensors b/latents/layers.7.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..93ca3c7427ea95ca51594bb3e2bb0f9e8d9ebb91 --- /dev/null +++ b/latents/layers.7.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00f17cbecc6bd76d74dc44e107d5649347d2a6e6be132e48969dbf44551c49df +size 93927576 diff --git a/latents/layers.7.mlp/52428_78642.safetensors b/latents/layers.7.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..237a3c3a7f7e6943d5fb86ea18f48d9969eacde4 --- /dev/null +++ b/latents/layers.7.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1ddef3f8ee010e932fa74853147bb564cf9ef07ec73310b2f525c946be3283 +size 93917536 diff --git a/latents/layers.7.mlp/78643_104856.safetensors b/latents/layers.7.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69c2711dbe2d5a9d5192486653f336d7481dbdfd --- /dev/null +++ b/latents/layers.7.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2bc3f9ad9d6b414802c0f928ec604e20326932ff51beb461694dc51e2aec3f9 +size 93327592 diff --git a/latents/layers.7.mlp/config.json b/latents/layers.7.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.7.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.8.mlp/0_26213.safetensors b/latents/layers.8.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc64de51479c818c644b2b80cdff72c979501e81 --- /dev/null +++ b/latents/layers.8.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06cfee68d89c111f0dbc4475e7c8e285c35a47e155fe66829684064e981ad8f5 +size 91053584 diff --git a/latents/layers.8.mlp/104857_131071.safetensors b/latents/layers.8.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..424eb00f9304b23755a9c2cc8e79594f37e55a98 --- /dev/null +++ b/latents/layers.8.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e5ea83c00be981c740a73ba30158aa98aa4a86e98c34b8f7aa5f31e7444f43c +size 92521512 diff --git a/latents/layers.8.mlp/26214_52427.safetensors b/latents/layers.8.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..420fdeb03bdd3eeb83effcc9712aaa3db4ceb743 --- /dev/null +++ b/latents/layers.8.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5705b060a732d03d1f4a49a1e5a0acdeffca781bab4c8f05fd9b3148cf35e0f0 +size 89627872 diff --git a/latents/layers.8.mlp/52428_78642.safetensors b/latents/layers.8.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2fdd2d395154041ac6d4eae9dc802ea1785f9d6c --- /dev/null +++ b/latents/layers.8.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3bd9f367963265f8b0e52cc7bbb8c806eb44c8ef5a63ece34d4ea1cde4266d6 +size 88033136 diff --git a/latents/layers.8.mlp/78643_104856.safetensors b/latents/layers.8.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f4fefd0d178664c3b51fac423113514be5b8bcc5 --- /dev/null +++ b/latents/layers.8.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68eaebace6115488ec1e0779a78bb7ee018e388b1e625b70861d7f6c4791d8a5 +size 90214560 diff --git a/latents/layers.8.mlp/config.json b/latents/layers.8.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.8.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/latents/layers.9.mlp/0_26213.safetensors b/latents/layers.9.mlp/0_26213.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03f35ef9852a484a17b1ee3441231adae8eaf9d3 --- /dev/null +++ b/latents/layers.9.mlp/0_26213.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e95fb284783335debf2e9cd80dbde7c7990a0075c9efc8555a9ec91fefff66 +size 107126408 diff --git a/latents/layers.9.mlp/104857_131071.safetensors b/latents/layers.9.mlp/104857_131071.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ba6a2f11d82ab42a8b95b97d6269535dfb649198 --- /dev/null +++ b/latents/layers.9.mlp/104857_131071.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8095437b26e04b66aa12cdc61441a5d68791794751c7c12acf83ed7ba5c5e785 +size 105898224 diff --git a/latents/layers.9.mlp/26214_52427.safetensors b/latents/layers.9.mlp/26214_52427.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7de1f1c39f26eaefd40bf1736e2a8675678f3b9a --- /dev/null +++ b/latents/layers.9.mlp/26214_52427.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:568dc9b6f1b2aaeef36c3f4eef99468202b61e9e02db38b437adb090f0f8d14b +size 103692608 diff --git a/latents/layers.9.mlp/52428_78642.safetensors b/latents/layers.9.mlp/52428_78642.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4187e1047658eaa20e5c8e4e13ca603e874fa748 --- /dev/null +++ b/latents/layers.9.mlp/52428_78642.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:798a85526270c5edb5d50ba3907cfeb841c403a8b45e3f84a263bc14d74f46d5 +size 106887800 diff --git a/latents/layers.9.mlp/78643_104856.safetensors b/latents/layers.9.mlp/78643_104856.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c49e21d8939a429defe51b1abc3a05db995315bd --- /dev/null +++ b/latents/layers.9.mlp/78643_104856.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67b299692963cea4ac08d5cff315a3ac16a696bc49b09db85a41f6dd1cf8d22f +size 104064216 diff --git a/latents/layers.9.mlp/config.json b/latents/layers.9.mlp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..e15d0eb1fb235ccc57b1d72c5aaa2f72eced9fa2 --- /dev/null +++ b/latents/layers.9.mlp/config.json @@ -0,0 +1,11 @@ +{ + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5, + "model_name": "meta-llama/Llama-3.2-1B" +} \ No newline at end of file diff --git a/run_config.json b/run_config.json new file mode 100644 index 0000000000000000000000000000000000000000..f650a3f7db363d6a11e9d8bbe217ff888ae1145d --- /dev/null +++ b/run_config.json @@ -0,0 +1,71 @@ +{ + "cache_cfg": { + "dataset_repo": "EleutherAI/fineweb-edu-dedup-10b", + "dataset_split": "train", + "dataset_name": "", + "dataset_column": "text", + "batch_size": 16, + "cache_ctx_len": 256, + "n_tokens": 1000000, + "n_splits": 5 + }, + "constructor_cfg": { + "faiss_embedding_model": "sentence-transformers/all-MiniLM-L6-v2", + "faiss_embedding_cache_dir": ".embedding_cache", + "faiss_embedding_cache_enabled": true, + "example_ctx_len": 32, + "min_examples": 200, + "n_non_activating": 50, + "center_examples": true, + "non_activating_source": "random", + "neighbours_type": "co-occurrence" + }, + "sampler_cfg": { + "n_examples_train": 40, + "n_examples_test": 50, + "n_quantiles": 10, + "train_type": "quantiles", + "test_type": "quantiles", + "ratio_top": 0.2 + }, + "model": "meta-llama/Llama-3.2-1B", + "sparse_model": "nev/Llama-3.2-1B-mntss-skip-transcoder", + "hookpoints": [ + "layers.0.mlp", + "layers.1.mlp", + "layers.2.mlp", + "layers.3.mlp", + "layers.4.mlp", + "layers.5.mlp", + "layers.6.mlp", + "layers.7.mlp", + "layers.8.mlp", + "layers.9.mlp", + "layers.10.mlp", + "layers.11.mlp", + "layers.12.mlp", + "layers.13.mlp", + "layers.14.mlp", + "layers.15.mlp" + ], + "explainer_model": "hugging-quants/Meta-Llama-3.1-70B-Instruct-AWQ-INT4", + "explainer_model_max_len": 5120, + "explainer_provider": "offline", + "explainer": "default", + "scorers": [ + "fuzz", + "detection" + ], + "name": "transcoder-llama-131k-mntss-1m", + "max_latents": null, + "filter_bos": false, + "log_probs": false, + "load_in_8bit": false, + "hf_token": null, + "pipeline_num_proc": 48, + "num_gpus": 1, + "seed": 22, + "verbose": true, + "num_examples_per_scorer_prompt": 5, + "overwrite": [] +} \ No newline at end of file