{"payload":{"pageCount":5,"repositories":[{"type":"Public","name":"w2s","owner":"EleutherAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":7,"forksCount":0,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,23,6,9,8,3,10],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-18T22:32:05.979Z"}},{"type":"Public","name":"lm-evaluation-harness","owner":"EleutherAI","isFork":false,"description":"A framework for few-shot evaluation of language models.","allTopics":["transformer","language-model","evaluation-framework"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":68,"issueCount":210,"starsCount":5599,"forksCount":1483,"license":"MIT License","participation":[98,82,77,118,51,24,82,153,84,71,64,43,71,60,9,40,22,40,8,53,18,36,67,102,33,42,27,5,9,16,15,12,13,13,6,19,15,16,10,10,5,5,0,4,5,14,10,2,12,9,11,10],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-18T18:35:00.876Z"}},{"type":"Public","name":"gpt-neox","owner":"EleutherAI","isFork":false,"description":"An implementation of model parallel autoregressive transformers on GPUs, based on the Megatron and DeepSpeed libraries","allTopics":["transformers","language-model","gpt-3","deepspeed-library"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":23,"issueCount":55,"starsCount":6669,"forksCount":970,"license":"Apache License 2.0","participation":[10,0,9,1,1,1,1,2,0,2,0,0,10,8,9,1,0,2,0,7,3,1,1,3,1,0,19,1,4,3,1,3,3,1,0,7,7,8,2,1,7,0,0,0,2,5,1,1,5,0,5,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-17T22:29:24.603Z"}},{"type":"Public","name":"elk","owner":"EleutherAI","isFork":false,"description":"Keeping language models honest by directly eliciting knowledge encoded in their activations.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":10,"issueCount":13,"starsCount":172,"forksCount":32,"license":"MIT License","participation":[3,4,3,2,12,27,3,9,0,7,3,1,0,1,0,0,0,1,3,4,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-17T17:37:48.670Z"}},{"type":"Public","name":"cupbearer","owner":"EleutherAI","isFork":true,"description":"A library for mechanistic anomaly detection","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":4,"license":"MIT License","participation":[17,42,17,2,2,5,14,5,13,7,5,0,2,7,2,0,0,12,9,10,5,16,21,14,1,5,0,0,0,6,5,3,0,8,30,3,35,12,0,3,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-17T02:47:50.122Z"}},{"type":"Public","name":"website","owner":"EleutherAI","isFork":false,"description":"New website for EleutherAI based on Hugo static site generator","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":2,"issueCount":0,"starsCount":4,"forksCount":6,"license":null,"participation":[2,0,3,0,0,8,0,0,0,2,0,0,0,12,0,0,9,8,9,2,1,10,3,11,11,9,21,0,0,0,0,0,2,0,0,0,8,0,0,7,18,0,19,2,0,0,0,0,18,0,0,14],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-15T03:52:41.968Z"}},{"type":"Public","name":"semantic-memorization","owner":"EleutherAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":5,"issueCount":0,"starsCount":34,"forksCount":3,"license":null,"participation":[1,9,2,0,3,3,0,0,2,6,4,29,15,2,0,0,4,1,0,6,0,0,1,0,0,5,2,1,0,3,29,0,3,5,0,5,1,0,4,3,0,1,0,1,0,1,0,0,0,2,3,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-14T00:29:12.702Z"}},{"type":"Public","name":"sae","owner":"EleutherAI","isFork":false,"description":"Sparse autoencoders","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":80,"forksCount":5,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,4,1,10,5],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-13T23:06:43.275Z"}},{"type":"Public","name":"aria","owner":"EleutherAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":37,"forksCount":6,"license":"Apache License 2.0","participation":[1,0,0,1,1,1,3,13,2,0,0,0,0,0,5,6,8,3,1,8,6,0,1,3,5,9,1,0,0,0,3,10,1,2,0,4,0,2,2,0,0,0,0,1,0,0,0,1,0,0,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-13T17:02:44.519Z"}},{"type":"Public","name":"tokengrams","owner":"EleutherAI","isFork":false,"description":"Efficiently computing &amp; storing token n-grams from large corpora","allTopics":[],"primaryLanguage":{"name":"Rust","color":"#dea584"},"pullRequestCount":0,"issueCount":1,"starsCount":7,"forksCount":1,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,5,4,0,0,0,1,0,0,0,0,0,9,3,24,0,0,0,0,0,0,0,0,0,2],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-13T06:57:49.852Z"}},{"type":"Public","name":"features-across-time","owner":"EleutherAI","isFork":false,"description":"Understanding how features learned by neural networks evolve throughout training","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":26,"forksCount":1,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-07T04:45:50.297Z"}},{"type":"Public","name":"aria-amt","owner":"EleutherAI","isFork":false,"description":"Efficient and robust implementation of seq-to-seq automatic piano transcription.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":12,"forksCount":5,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-04T16:17:13.457Z"}},{"type":"Public","name":"rnngineering","owner":"EleutherAI","isFork":false,"description":"Engineering the state of RNN language models (Mamba, RWKV, etc.)","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":31,"forksCount":2,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-25T16:13:46.749Z"}},{"type":"Public","name":"cookbook","owner":"EleutherAI","isFork":false,"description":"Deep learning for dummies. All the practical details and useful utilities that go into working with real models.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":6,"starsCount":204,"forksCount":13,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,13,4,5,0,0,3,0,1,5,1,0,3,0,0,0,0,0,1,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-24T06:59:44.529Z"}},{"type":"Public","name":"bayesian-adam","owner":"EleutherAI","isFork":false,"description":"Exactly what it says on the tin","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-24T05:26:48.375Z"}},{"type":"Public","name":"elk-generalization","owner":"EleutherAI","isFork":false,"description":"Investigating the generalization behavior of LM probes trained to predict truth labels: (1) from one annotator to another, and (2) from easy questions to hard","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":22,"forksCount":4,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,2,1,3,5,7,13,15,10,33,12,8,10,4,8,0,0,18,8,9,7,31,5,7,1,0,8,4,1,4,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-23T23:25:42.706Z"}},{"type":"Public","name":"tuned-lens","owner":"EleutherAI","isFork":true,"description":"Tools for understanding how transformer predictions are built layer-by-layer","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":37,"license":"MIT License","participation":[0,0,1,2,0,0,0,0,0,0,7,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,3,0,0,0,0,0,0,0,1,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-23T20:10:19.155Z"}},{"type":"Public","name":"concept-erasure","owner":"EleutherAI","isFork":false,"description":"Erasing concepts from neural representations with provable guarantees","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":2,"starsCount":196,"forksCount":15,"license":"MIT License","participation":[4,1,1,0,0,5,0,0,3,5,1,1,0,7,0,6,1,0,0,0,0,0,0,0,0,0,0,0,0,3,4,3,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,2,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-23T05:15:19.958Z"}},{"type":"Public","name":"SAELens","owner":"EleutherAI","isFork":true,"description":"Training Sparse Autoencoders on Language Models","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":60,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-22T19:41:40.681Z"}},{"type":"Public","name":"pythia","owner":"EleutherAI","isFork":false,"description":"The hub for EleutherAI's work on interpretability and learning dynamics","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":2,"issueCount":18,"starsCount":2102,"forksCount":153,"license":"Apache License 2.0","participation":[0,2,0,0,1,0,0,0,0,0,0,0,0,0,0,11,0,0,1,18,17,1,0,0,0,0,0,2,0,0,0,0,1,0,0,1,0,0,2,0,0,0,1,0,1,1,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-22T01:45:07.678Z"}},{"type":"Public","name":"weak-to-strong","owner":"EleutherAI","isFork":true,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":2,"starsCount":6,"forksCount":294,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-10T17:59:25.843Z"}},{"type":"Public","name":"variance-across-time","owner":"EleutherAI","isFork":false,"description":"Studying the variance in neural net predictions across training time","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":3,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-24T07:12:33.410Z"}},{"type":"Public","name":"DeeperSpeed","owner":"EleutherAI","isFork":true,"description":"DeepSpeed is a deep learning optimization library that makes distributed training easy, efficient, and effective.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":159,"forksCount":3928,"license":"Apache License 2.0","participation":[25,13,20,15,24,20,7,14,13,22,16,20,15,16,8,32,9,14,11,20,24,12,5,0,0,0,0,0,0,0,1,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-22T07:31:01.226Z"}},{"type":"Public","name":"improved-t5","owner":"EleutherAI","isFork":false,"description":"Experiments for efforts to train a new and improved t5","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":75,"forksCount":5,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-15T05:51:48.509Z"}},{"type":"Public","name":"CAA","owner":"EleutherAI","isFork":true,"description":"Steering Llama 2 with Contrastive Activation Addition","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":22,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-28T21:51:28.715Z"}},{"type":"Public","name":"math-lm","owner":"EleutherAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":9,"starsCount":998,"forksCount":75,"license":"MIT License","participation":[4,16,11,5,0,2,0,0,0,0,0,0,2,0,17,13,29,14,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-12T05:10:40.751Z"}},{"type":"Public","name":"pd-books","owner":"EleutherAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":1,"issueCount":0,"starsCount":1,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-07T20:44:37.188Z"}},{"type":"Public","name":"RWKV-LM","owner":"EleutherAI","isFork":true,"description":"RWKV is an RNN with transformer-level LLM performance. It can be directly trained like a GPT (parallelizable). So it's combining the best of RNN and transformer - great performance, fast inference, saves VRAM, fast training, \"infinite\" ctx_len, and free sentence embedding.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":815,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-21T10:01:35.441Z"}},{"type":"Public","name":"minetest","owner":"EleutherAI","isFork":true,"description":"Minetest is an open source voxel game engine with easy modding and game creation","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":5,"issueCount":16,"starsCount":59,"forksCount":1963,"license":"Other","participation":[0,0,4,9,8,3,2,0,1,10,10,5,1,0,1,0,0,0,0,0,0,2,0,5,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-19T22:53:24.144Z"}},{"type":"Public","name":"conceptual-constraints","owner":"EleutherAI","isFork":false,"description":"Applying LEACE to models during training","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-17T01:46:51.746Z"}}],"repositoryCount":138,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}