{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":792037482,"defaultBranch":"main","name":"training","ownerLogin":"instructlab","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2024-04-25T21:16:44.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/160199024?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1727096754.0","currentOid":""},"activityList":{"items":[{"before":"a99717baff50a5c9c21a08fbcb19ac78cd6559ff","after":null,"ref":"refs/heads/dependabot/github_actions/pypa/gh-action-pypi-publish-1.10.1","pushedAt":"2024-09-23T13:05:54.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"dependabot[bot]","name":null,"path":"/apps/dependabot","primaryAvatarUrl":"https://avatars.githubusercontent.com/in/29110?s=80&v=4"}},{"before":null,"after":"4636ee09f3f331991e449ebbd1a36c89a1462ff0","ref":"refs/heads/dependabot/github_actions/pypa/gh-action-pypi-publish-1.10.2","pushedAt":"2024-09-23T13:05:49.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"dependabot[bot]","name":null,"path":"/apps/dependabot","primaryAvatarUrl":"https://avatars.githubusercontent.com/in/29110?s=80&v=4"},"commit":{"message":"Bump pypa/gh-action-pypi-publish from 1.9.0 to 1.10.2\n\nBumps [pypa/gh-action-pypi-publish](https://github.com/pypa/gh-action-pypi-publish) from 1.9.0 to 1.10.2.\n- [Release notes](https://github.com/pypa/gh-action-pypi-publish/releases)\n- [Commits](https://github.com/pypa/gh-action-pypi-publish/compare/ec4db0b4ddc65acdf4bff5fa45ac92d78b56bdf0...897895f1e160c830e369f9779632ebc134688e1b)\n\n---\nupdated-dependencies:\n- dependency-name: pypa/gh-action-pypi-publish\n dependency-type: direct:production\n update-type: version-update:semver-minor\n...\n\nSigned-off-by: dependabot[bot] ","shortMessageHtmlLink":"Bump pypa/gh-action-pypi-publish from 1.9.0 to 
1.10.2"}},{"before":null,"after":"3e9b6401a5284cb1e0bedfe1434516a615d2f2ee","ref":"refs/heads/kx/moe","pushedAt":"2024-09-20T22:47:26.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"xukai92","name":"Kai Xu","path":"/xukai92","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/5985769?s=80&v=4"},"commit":{"message":"feat: different modular training for MoEs\n\nSigned-off-by: Kai Xu ","shortMessageHtmlLink":"feat: different modular training for MoEs"}},{"before":"e54fceeebe81152463cee959f8c7bcc24d5f0f98","after":"48a61a1ccab844c0c842c2d5abcb01ab0a7bd688","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-20T17:21:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Maxusmusti","name":"Mustafa Eyceoz","path":"/Maxusmusti","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10506868?s=80&v=4"},"commit":{"message":"Fix lora ckpt saving\n\nSigned-off-by: Mustafa Eyceoz ","shortMessageHtmlLink":"Fix lora ckpt saving"}},{"before":"eaf290e9006a3bb6bef98fcbeb8d0a85b7db5c15","after":"e54fceeebe81152463cee959f8c7bcc24d5f0f98","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-20T16:47:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Maxusmusti","name":"Mustafa Eyceoz","path":"/Maxusmusti","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10506868?s=80&v=4"},"commit":{"message":"Connect new lora save patch\n\nSigned-off-by: Mustafa Eyceoz ","shortMessageHtmlLink":"Connect new lora save patch"}},{"before":"6b6f062e6ed0d5b31ecae95d43bff737f743a117","after":"eaf290e9006a3bb6bef98fcbeb8d0a85b7db5c15","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-20T16:36:32.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Maxusmusti","name":"Mustafa Eyceoz","path":"/Maxusmusti","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10506868?s=80&v=4"},"commit":{"message":"Adding lora/qlora saving pt2\n\nSigned-off-by: Mustafa Eyceoz ","shortMessageHtmlLink":"Adding 
lora/qlora saving pt2"}},{"before":null,"after":"60b1344fc5ec5a70a623c9ae65d403769a646040","ref":"refs/heads/jkunstle-gaudi-debugging","pushedAt":"2024-09-20T16:29:35.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"JamesKunstle","name":"James Kunstle","path":"/JamesKunstle","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/52969093?s=80&v=4"},"commit":{"message":"tmp modifications to get loop working on Gaudi cards\n\nSigned-off-by: devcloud ","shortMessageHtmlLink":"tmp modifications to get loop working on Gaudi cards"}},{"before":"e20231de5b68be5b4482ec55a6c23a7f1e5a48d9","after":"6b6f062e6ed0d5b31ecae95d43bff737f743a117","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-19T15:33:23.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Maxusmusti","name":"Mustafa Eyceoz","path":"/Maxusmusti","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10506868?s=80&v=4"},"commit":{"message":"Re-add save per epoch\n\nSigned-off-by: Mustafa Eyceoz ","shortMessageHtmlLink":"Re-add save per epoch"}},{"before":"76f6ee75804c6defc5aaaff870ea44ad375f2f8a","after":"4f9a859ed5c04418d7097a813fb015269a8b08e0","ref":"refs/heads/ap/mixtral","pushedAt":"2024-09-19T14:20:05.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"aldopareja","name":"Aldo Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"stage 2, stage 3 doesn't save like that","shortMessageHtmlLink":"stage 2, stage 3 doesn't save like that"}},{"before":"092f14e83361887ef98ace19521d64e14f5e41fd","after":"e20231de5b68be5b4482ec55a6c23a7f1e5a48d9","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-19T14:08:08.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Maxusmusti","name":"Mustafa Eyceoz","path":"/Maxusmusti","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10506868?s=80&v=4"},"commit":{"message":"Add lora ckpt saving (first 
pass)\n\nSigned-off-by: Mustafa Eyceoz ","shortMessageHtmlLink":"Add lora ckpt saving (first pass)"}},{"before":"ac10ee711304632d126b05186617090fd7ce2a8a","after":"092f14e83361887ef98ace19521d64e14f5e41fd","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-18T21:12:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Maxusmusti","name":"Mustafa Eyceoz","path":"/Maxusmusti","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10506868?s=80&v=4"},"commit":{"message":"Move sharding strategy to fsdp options\n\nSigned-off-by: Mustafa Eyceoz ","shortMessageHtmlLink":"Move sharding strategy to fsdp options"}},{"before":"2178f63ddb128bc09100140a08b40f9d64f9a5b8","after":"ac10ee711304632d126b05186617090fd7ce2a8a","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-18T21:07:09.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Maxusmusti","name":"Mustafa Eyceoz","path":"/Maxusmusti","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10506868?s=80&v=4"},"commit":{"message":"Added cpu offloading for fsdp\n\nSigned-off-by: Mustafa Eyceoz ","shortMessageHtmlLink":"Added cpu offloading for fsdp"}},{"before":"0b4d5161238b86009c6a48da87430401684e47bf","after":"2178f63ddb128bc09100140a08b40f9d64f9a5b8","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-18T20:51:07.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"RobotSail","name":"Oleg","path":"/RobotSail","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/97077423?s=80&v=4"},"commit":{"message":"bug fixes\n\nSigned-off-by: Oleg S <97077423+RobotSail@users.noreply.github.com>","shortMessageHtmlLink":"bug fixes"}},{"before":"e19411f78f193adaa966916e1059f3d031dd963f","after":"76f6ee75804c6defc5aaaff870ea44ad375f2f8a","ref":"refs/heads/ap/mixtral","pushedAt":"2024-09-18T20:49:04.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"aldopareja","name":"Aldo 
Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"not doing cpu offloading because of versions problems","shortMessageHtmlLink":"not doing cpu offloading because of versions problems"}},{"before":"3e9b6401a5284cb1e0bedfe1434516a615d2f2ee","after":"e19411f78f193adaa966916e1059f3d031dd963f","ref":"refs/heads/ap/mixtral","pushedAt":"2024-09-18T20:20:36.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"aldopareja","name":"Aldo Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"stage 3 training","shortMessageHtmlLink":"stage 3 training"}},{"before":"560c2ec0a25f971f92fc71ca8ddfcb65c3f113ab","after":"0b4d5161238b86009c6a48da87430401684e47bf","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-18T19:11:22.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"aldopareja","name":"Aldo Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"fixing linting errors\n\nSigned-off-by: aldo pareja-cardona ","shortMessageHtmlLink":"fixing linting errors"}},{"before":"ee3780817fc5a9ea730fd8fe8ece0858fe5f2164","after":"560c2ec0a25f971f92fc71ca8ddfcb65c3f113ab","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-18T19:09:50.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"aldopareja","name":"Aldo Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"fixing linting errors","shortMessageHtmlLink":"fixing linting errors"}},{"before":"99ae37fd26d4eaddd4da20cd9a18c4874caf0d25","after":"ee3780817fc5a9ea730fd8fe8ece0858fe5f2164","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-18T18:49:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"aldopareja","name":"Aldo 
Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"aligning with the latest","shortMessageHtmlLink":"aligning with the latest"}},{"before":null,"after":"99ae37fd26d4eaddd4da20cd9a18c4874caf0d25","ref":"refs/heads/ap/accelerate-fsdp-tmp2","pushedAt":"2024-09-18T18:44:31.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"aldopareja","name":"Aldo Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"fixed a merge conflict","shortMessageHtmlLink":"fixed a merge conflict"}},{"before":"c27f19099dadddd11c0adb700b2852ff4361e506","after":"6196694b851ea27997e6ffcb7625d7180f31a795","ref":"refs/heads/ap/accelerate-fsdp","pushedAt":"2024-09-18T17:30:04.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Maxusmusti","name":"Mustafa Eyceoz","path":"/Maxusmusti","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10506868?s=80&v=4"},"commit":{"message":"Cleanup pt2 and connect fsdp offloading","shortMessageHtmlLink":"Cleanup pt2 and connect fsdp offloading"}},{"before":"91f143700c19ded574941508aa4f90c6233411a0","after":"c27f19099dadddd11c0adb700b2852ff4361e506","ref":"refs/heads/ap/accelerate-fsdp","pushedAt":"2024-09-18T15:10:53.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RobotSail","name":"Oleg","path":"/RobotSail","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/97077423?s=80&v=4"},"commit":{"message":"bug fixes\n\nSigned-off-by: Oleg S <97077423+RobotSail@users.noreply.github.com>","shortMessageHtmlLink":"bug fixes"}},{"before":"c7ee974aa7160caca8a582fad466ddedc5018e6f","after":"91f143700c19ded574941508aa4f90c6233411a0","ref":"refs/heads/ap/accelerate-fsdp","pushedAt":"2024-09-18T14:03:25.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Maxusmusti","name":"Mustafa 
Eyceoz","path":"/Maxusmusti","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10506868?s=80&v=4"},"commit":{"message":"Cleanup pt1\n\nSigned-off-by: Mustafa Eyceoz ","shortMessageHtmlLink":"Cleanup pt1"}},{"before":"573f598649b791a1e97db823817f3fa52ca41654","after":"c7ee974aa7160caca8a582fad466ddedc5018e6f","ref":"refs/heads/ap/accelerate-fsdp","pushedAt":"2024-09-18T13:53:22.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RobotSail","name":"Oleg","path":"/RobotSail","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/97077423?s=80&v=4"},"commit":{"message":"update init.py\n\nSigned-off-by: Oleg S <97077423+RobotSail@users.noreply.github.com>","shortMessageHtmlLink":"update init.py"}},{"before":"767b225237b28ff9e16e77429e1a477188565da8","after":"573f598649b791a1e97db823817f3fa52ca41654","ref":"refs/heads/ap/accelerate-fsdp","pushedAt":"2024-09-18T13:51:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"RobotSail","name":"Oleg","path":"/RobotSail","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/97077423?s=80&v=4"},"commit":{"message":"update: rename arguments and add config options in trainingargs\n\nThis commit updates sharding_framework to now be distributed_training_framework.\nAlso added is the ability to specify the distributed_training_framework\nin the TrainingArgs object in addition to the sharding strategy and a\nplaceholder for the FSDPOptions object.\n\nSigned-off-by: Oleg S <97077423+RobotSail@users.noreply.github.com>","shortMessageHtmlLink":"update: rename arguments and add config options in trainingargs"}},{"before":"e1d7a6e0ad6795af44300a4c5b5f226a1b80e317","after":"767b225237b28ff9e16e77429e1a477188565da8","ref":"refs/heads/ap/accelerate-fsdp","pushedAt":"2024-09-18T13:11:14.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"aldopareja","name":"Aldo Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"removed 
weight decay from the fsdp optimizer","shortMessageHtmlLink":"removed weight decay from the fsdp optimizer"}},{"before":"5e7db2ca8a21e91802f28d3189361800df85fec0","after":"e1d7a6e0ad6795af44300a4c5b5f226a1b80e317","ref":"refs/heads/ap/accelerate-fsdp","pushedAt":"2024-09-18T02:59:31.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"aldopareja","name":"Aldo Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"fsdp needs a different optimizer workflow","shortMessageHtmlLink":"fsdp needs a different optimizer workflow"}},{"before":"9b737218114893a71f94fea56e00e47ce4b08a95","after":"5e7db2ca8a21e91802f28d3189361800df85fec0","ref":"refs/heads/ap/accelerate-fsdp","pushedAt":"2024-09-18T02:28:35.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"aldopareja","name":"Aldo Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"added samples seen to the logging","shortMessageHtmlLink":"added samples seen to the logging"}},{"before":"4ae4984e7656a38032d6bd329e0f918432295687","after":"9b737218114893a71f94fea56e00e47ce4b08a95","ref":"refs/heads/ap/accelerate-fsdp","pushedAt":"2024-09-18T02:07:43.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"aldopareja","name":"Aldo Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"fixed typo on batch size logging","shortMessageHtmlLink":"fixed typo on batch size logging"}},{"before":"498cb143fcfee04e6aead48bae1078d584119ea6","after":"4ae4984e7656a38032d6bd329e0f918432295687","ref":"refs/heads/ap/accelerate-fsdp","pushedAt":"2024-09-18T01:39:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"aldopareja","name":"Aldo Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"black 
formatting","shortMessageHtmlLink":"black formatting"}},{"before":"df05d4f8242778de0c9cb8e8d80834937ca102e5","after":"498cb143fcfee04e6aead48bae1078d584119ea6","ref":"refs/heads/ap/accelerate-fsdp","pushedAt":"2024-09-18T01:37:56.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"aldopareja","name":"Aldo Pareja","path":"/aldopareja","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/7622817?s=80&v=4"},"commit":{"message":"made deepspeed the default","shortMessageHtmlLink":"made deepspeed the default"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"Y3Vyc29yOnYyOpK7MjAyNC0wOS0yM1QxMzowNTo1NC4wMDAwMDBazwAAAAS9-8Tv","startCursor":"Y3Vyc29yOnYyOpK7MjAyNC0wOS0yM1QxMzowNTo1NC4wMDAwMDBazwAAAAS9-8Tv","endCursor":"Y3Vyc29yOnYyOpK7MjAyNC0wOS0xOFQwMTozNzo1Ni4wMDAwMDBazwAAAAS5IqxT"}},"title":"Activity · instructlab/training"}