{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":742986742,"defaultBranch":"main","name":"fsdp_qlora","ownerLogin":"AnswerDotAI","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2024-01-14T00:34:42.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/156509747?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1715439319.0","currentOid":""},"activityList":{"items":[{"before":"cec4386685702a9f6f36fbb04a3a9a370f0981eb","after":"05ed9f2a60f96a0795cb082bceab70a9b19fd213","ref":"refs/heads/main","pushedAt":"2024-06-13T20:11:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"warner-benjamin","name":"Benjamin Warner","path":"/warner-benjamin","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/51142400?s=80&v=4"},"commit":{"message":"don't print the batch idx every step","shortMessageHtmlLink":"don't print the batch idx every step"}},{"before":"ed431272fd95b8ff57b5b12aff0f0cbdbd29cf96","after":"cec4386685702a9f6f36fbb04a3a9a370f0981eb","ref":"refs/heads/main","pushedAt":"2024-06-11T03:37:26.000Z","pushType":"pr_merge","commitsCount":18,"pusher":{"login":"austinvhuang","name":"Austin Huang","path":"/austinvhuang","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20875313?s=80&v=4"},"commit":{"message":"Merge pull request #67 from jeromeku/profiling\n\n[FEATURE] Profiling Improvements","shortMessageHtmlLink":"Merge pull request #67 from jeromeku/profiling"}},{"before":"f2585b59092f33e8464deca7411c938fa49ee886","after":"1666c7991c422c3e1bb38c3d345a1c8fac8a46c7","ref":"refs/heads/qwen","pushedAt":"2024-06-10T16:15:07.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"dharma-2 eval","shortMessageHtmlLink":"dharma-2 eval"}},{"before":"62d3ef6453ad4cac705056a87850459631c71b47","after":"f2585b59092f33e8464deca7411c938fa49ee886","ref":"refs/heads/qwen","pushedAt":"2024-06-10T10:34:25.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"hqq plus plus training","shortMessageHtmlLink":"hqq plus plus training"}},{"before":"1a9fddfb660b85e46bdf18c3fcf0d599628c9c6c","after":"ed431272fd95b8ff57b5b12aff0f0cbdbd29cf96","ref":"refs/heads/main","pushedAt":"2024-05-20T21:11:20.000Z","pushType":"pr_merge","commitsCount":5,"pusher":{"login":"austinvhuang","name":"Austin Huang","path":"/austinvhuang","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20875313?s=80&v=4"},"commit":{"message":"Merge pull request #66 from AnswerDotAI/avh_dev\n\nAdd profiling to train.py","shortMessageHtmlLink":"Merge pull request #66 from AnswerDotAI/avh_dev"}},{"before":"cc9e45a833fcbdd5b4bc9ebdeb5086b25b49bb7b","after":"fdc3c7e19ca64c0eebdf2a9128a1a47dec1426e9","ref":"refs/heads/avh_dev","pushedAt":"2024-05-20T21:10:27.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"austinvhuang","name":"Austin Huang","path":"/austinvhuang","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20875313?s=80&v=4"},"commit":{"message":"add comment to profile.sh","shortMessageHtmlLink":"add comment to profile.sh"}},{"before":"bc91ebe544b167d891fc761e3dd73b519ce102f2","after":"cc9e45a833fcbdd5b4bc9ebdeb5086b25b49bb7b","ref":"refs/heads/avh_dev","pushedAt":"2024-05-20T20:51:09.000Z","pushType":"push","commitsCount":6,"pusher":{"login":"austinvhuang","name":"Austin Huang","path":"/austinvhuang","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20875313?s=80&v=4"},"commit":{"message":"Since fsdp_qlora doesnt use argparse, change Param -> str and bool_arg -> bool per https://github.com/AnswerDotAI/fsdp_qlora/pull/66#discussion_r1592876114 also move descriptions to a docstring","shortMessageHtmlLink":"Since fsdp_qlora doesnt use argparse, change Param -> str and bool_ar…"}},{"before":"afc51cafc34f7ed6bc06e2130a56545d97b554e7","after":null,"ref":"refs/heads/medusa","pushedAt":"2024-05-11T14:55:19.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"griff4692","name":"Griffin Adams","path":"/griff4692","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/12277915?s=80&v=4"}},{"before":"a3016d66acd06391f211f93cb4f40ff1a2090dbd","after":"afc51cafc34f7ed6bc06e2130a56545d97b554e7","ref":"refs/heads/medusa","pushedAt":"2024-05-11T14:41:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"griff4692","name":"Griffin Adams","path":"/griff4692","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/12277915?s=80&v=4"},"commit":{"message":"Add in token accuracies.","shortMessageHtmlLink":"Add in token accuracies."}},{"before":"7f1e00d9f37c7a1b85a56c4652ee680cedffbd43","after":"a3016d66acd06391f211f93cb4f40ff1a2090dbd","ref":"refs/heads/medusa","pushedAt":"2024-05-10T19:01:21.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"griff4692","name":"Griffin Adams","path":"/griff4692","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/12277915?s=80&v=4"},"commit":{"message":"Update wrapping policy.","shortMessageHtmlLink":"Update wrapping policy."}},{"before":null,"after":"7f1e00d9f37c7a1b85a56c4652ee680cedffbd43","ref":"refs/heads/medusa","pushedAt":"2024-05-09T17:24:40.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"griff4692","name":"Griffin Adams","path":"/griff4692","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/12277915?s=80&v=4"},"commit":{"message":"Naive implementation of Medusa.","shortMessageHtmlLink":"Naive implementation of Medusa."}},{"before":"0f10515908832a95656f4414a3c276b7b3e064fd","after":"62d3ef6453ad4cac705056a87850459631c71b47","ref":"refs/heads/qwen","pushedAt":"2024-05-09T09:19:29.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"instruct zero, few, full results","shortMessageHtmlLink":"instruct zero, few, full results"}},{"before":"23fafdfb4af403d0808038adafbfd74de265d33a","after":"1a9fddfb660b85e46bdf18c3fcf0d599628c9c6c","ref":"refs/heads/main","pushedAt":"2024-05-08T23:42:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"warner-benjamin","name":"Benjamin Warner","path":"/warner-benjamin","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/51142400?s=80&v=4"},"commit":{"message":"set_num_threads wifh CPU offload and add fused Adam support","shortMessageHtmlLink":"set_num_threads wifh CPU offload and add fused Adam support"}},{"before":"48c3d584386e015804487f1f47265cb1e9c31830","after":"0f10515908832a95656f4414a3c276b7b3e064fd","ref":"refs/heads/qwen","pushedAt":"2024-05-08T14:31:59.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"hqq axis=1 training checked","shortMessageHtmlLink":"hqq axis=1 training checked"}},{"before":"72741d61ac9ab7f9f9d1a5c758fb8a5e5232a5a8","after":"48c3d584386e015804487f1f47265cb1e9c31830","ref":"refs/heads/qwen","pushedAt":"2024-05-08T12:28:21.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"fix model weight prep for lora","shortMessageHtmlLink":"fix model weight prep for lora"}},{"before":"2ea3859c8f1ab66f9d5fd1b2be60c61824ede207","after":"72741d61ac9ab7f9f9d1a5c758fb8a5e5232a5a8","ref":"refs/heads/qwen","pushedAt":"2024-05-08T11:58:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"fix custom lora+","shortMessageHtmlLink":"fix custom lora+"}},{"before":"8812e0b8add51d82f35993bcc3fb78095694987e","after":"2ea3859c8f1ab66f9d5fd1b2be60c61824ede207","ref":"refs/heads/qwen","pushedAt":"2024-05-08T08:25:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"minor fixes and loftq model weights prep","shortMessageHtmlLink":"minor fixes and loftq model weights prep"}},{"before":"2335454eefbae41346b958d55bdbdfb4aa4874cb","after":"8812e0b8add51d82f35993bcc3fb78095694987e","ref":"refs/heads/qwen","pushedAt":"2024-05-07T14:37:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"kick off lora+ and loftq exps orca math","shortMessageHtmlLink":"kick off lora+ and loftq exps orca math"}},{"before":"ff6c1628aca7046ef36ac5235410e80fb5f29397","after":"2335454eefbae41346b958d55bdbdfb4aa4874cb","ref":"refs/heads/qwen","pushedAt":"2024-05-07T08:29:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"save loftq weights","shortMessageHtmlLink":"save loftq weights"}},{"before":"f7055c9bb67f8b8bd2c5071b46cfab33d87dd4a4","after":"23fafdfb4af403d0808038adafbfd74de265d33a","ref":"refs/heads/main","pushedAt":"2024-05-06T22:12:24.000Z","pushType":"pr_merge","commitsCount":3,"pusher":{"login":"johnowhitaker","name":"Jonathan Whitaker","path":"/johnowhitaker","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/6575163?s=80&v=4"},"commit":{"message":"Merge pull request #65 from AnswerDotAI/benchmark_post\n\nCreate benchmarks_03_2024.md","shortMessageHtmlLink":"Merge pull request #65 from AnswerDotAI/benchmark_post"}},{"before":null,"after":"bc91ebe544b167d891fc761e3dd73b519ce102f2","ref":"refs/heads/avh_dev","pushedAt":"2024-05-06T20:18:41.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"austinvhuang","name":"Austin Huang","path":"/austinvhuang","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20875313?s=80&v=4"},"commit":{"message":"Add profiling capabilities to train.py. Add profile_output argument, update fsdp_main() to write per-thread profiling outputs, make train.py usable as an import, add profile.sh as an example profiling invocation, remove HQQ commit pin message in README since to_empty() method was removed from HQQLinear","shortMessageHtmlLink":"Add profiling capabilities to train.py. Add profile_output argument, …"}},{"before":"45cb175277015e13bdebe034226e0e5f234330d5","after":"ff6c1628aca7046ef36ac5235410e80fb5f29397","ref":"refs/heads/qwen","pushedAt":"2024-05-06T16:24:09.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"loftq init","shortMessageHtmlLink":"loftq init"}},{"before":"a704afa7e2725cdecf8e91de6787f363d16eae1f","after":"45cb175277015e13bdebe034226e0e5f234330d5","ref":"refs/heads/qwen","pushedAt":"2024-05-06T11:13:06.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"lora+","shortMessageHtmlLink":"lora+"}},{"before":"4cd69234f84de9f4f4933904b8824ab9f2c2a004","after":"e877dda5026dfd964cccdb92a4532da587cbdae0","ref":"refs/heads/benchmark_post","pushedAt":"2024-05-04T03:59:54.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"johnowhitaker","name":"Jonathan Whitaker","path":"/johnowhitaker","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/6575163?s=80&v=4"},"commit":{"message":"Add authors","shortMessageHtmlLink":"Add authors"}},{"before":"f7055c9bb67f8b8bd2c5071b46cfab33d87dd4a4","after":"4cd69234f84de9f4f4933904b8824ab9f2c2a004","ref":"refs/heads/benchmark_post","pushedAt":"2024-05-04T03:52:22.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"johnowhitaker","name":"Jonathan Whitaker","path":"/johnowhitaker","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/6575163?s=80&v=4"},"commit":{"message":"Create benchmarks_03_2024.md","shortMessageHtmlLink":"Create benchmarks_03_2024.md"}},{"before":null,"after":"f7055c9bb67f8b8bd2c5071b46cfab33d87dd4a4","ref":"refs/heads/benchmark_post","pushedAt":"2024-05-04T03:44:11.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"johnowhitaker","name":"Jonathan Whitaker","path":"/johnowhitaker","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/6575163?s=80&v=4"},"commit":{"message":"Merge pull request #64 from UmerHA/main\n\nAdd n_bits param to pass to hqq","shortMessageHtmlLink":"Merge pull request #64 from UmerHA/main"}},{"before":"58bdd90d0fbbcf1a006d1d67851c840dec84f880","after":"a704afa7e2725cdecf8e91de6787f363d16eae1f","ref":"refs/heads/qwen","pushedAt":"2024-05-02T18:46:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"add orca math instruct","shortMessageHtmlLink":"add orca math instruct"}},{"before":"bc8854115a5d81b672be8de4b9b82435bc689eee","after":"58bdd90d0fbbcf1a006d1d67851c840dec84f880","ref":"refs/heads/qwen","pushedAt":"2024-05-02T12:19:01.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"orca math eval nb","shortMessageHtmlLink":"orca math eval nb"}},{"before":"4bdf8791429adffb3211c067d5f25aa321e2ec95","after":"bc8854115a5d81b672be8de4b9b82435bc689eee","ref":"refs/heads/qwen","pushedAt":"2024-05-02T11:55:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"fix lora merge and reorg","shortMessageHtmlLink":"fix lora merge and reorg"}},{"before":"abc205553c74cd07d5094e5fa8f3df69499d3b9c","after":"4bdf8791429adffb3211c067d5f25aa321e2ec95","ref":"refs/heads/qwen","pushedAt":"2024-05-02T10:54:24.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KeremTurgutlu","name":"Kerem Turgutlu","path":"/KeremTurgutlu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19826777?s=80&v=4"},"commit":{"message":"weight prep for inference","shortMessageHtmlLink":"weight prep for inference"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEZNANLgA","startCursor":null,"endCursor":null}},"title":"Activity · AnswerDotAI/fsdp_qlora"}