{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":683009618,"defaultBranch":"main","name":"alignment-handbook","ownerLogin":"huggingface","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-08-25T11:35:34.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/25720743?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1716538305.0","currentOid":""},"activityList":{"items":[{"before":"0e7c1ff69ae1378f6704ba0fb048c87f93945530","after":"33e9d644cf9325b6b4a6eba4a01815d4f85bf2ba","ref":"refs/heads/orpo-report","pushedAt":"2024-05-25T20:15:27.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Fix config","shortMessageHtmlLink":"Fix config"}},{"before":"648f25085131902c29fc52586a804e31444f0e2e","after":"0e7c1ff69ae1378f6704ba0fb048c87f93945530","ref":"refs/heads/orpo-report","pushedAt":"2024-05-25T19:52:42.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Fix configs","shortMessageHtmlLink":"Fix configs"}},{"before":"f4a4f7fd0624aadda43f4b66f031905d49d7c71a","after":"648f25085131902c29fc52586a804e31444f0e2e","ref":"refs/heads/orpo-report","pushedAt":"2024-05-25T19:42:20.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Add base and instruct configs","shortMessageHtmlLink":"Add base and instruct configs"}},{"before":"3ee6d1e17dbe39c0a906e8901761852ddd1785c4","after":"f4a4f7fd0624aadda43f4b66f031905d49d7c71a","ref":"refs/heads/orpo-report","pushedAt":"2024-05-25T18:23:50.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Remove warmup","shortMessageHtmlLink":"Remove warmup"}},{"before":"94aacea14d59de4f28ed2a7bd4c800b461375477","after":"3ee6d1e17dbe39c0a906e8901761852ddd1785c4","ref":"refs/heads/orpo-report","pushedAt":"2024-05-25T09:32:23.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Fix optimizer","shortMessageHtmlLink":"Fix optimizer"}},{"before":"525143185c0e7a67eec1280aa989cad7d84ef41a","after":"94aacea14d59de4f28ed2a7bd4c800b461375477","ref":"refs/heads/orpo-report","pushedAt":"2024-05-25T08:53:43.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Reduce bs","shortMessageHtmlLink":"Reduce bs"}},{"before":"988d8c6b8df3281f8a5fb2aff3e79628f571d7b7","after":"525143185c0e7a67eec1280aa989cad7d84ef41a","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T21:42:57.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Fix template","shortMessageHtmlLink":"Fix template"}},{"before":"3c2e5f194c48023c2312364fb52e2d8f7bfab3da","after":"988d8c6b8df3281f8a5fb2aff3e79628f571d7b7","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T21:02:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Fix proc","shortMessageHtmlLink":"Fix proc"}},{"before":"52c619567066b231fb9414c0361eeac06e223964","after":"3c2e5f194c48023c2312364fb52e2d8f7bfab3da","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T12:48:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"alvarobartt","name":"Alvaro Bartolome","path":"/alvarobartt","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/36760800?s=80&v=4"},"commit":{"message":"Set `hub_private_repo: true`","shortMessageHtmlLink":"Set hub_private_repo: true"}},{"before":"5309188f175f3981bdf7effa848f6a993b2cdddc","after":"52c619567066b231fb9414c0361eeac06e223964","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T12:42:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"alvarobartt","name":"Alvaro Bartolome","path":"/alvarobartt","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/36760800?s=80&v=4"},"commit":{"message":"Update `chat_template` for Mistral 7B Instruct v0.3\n\nThe default one at https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.3/raw/main/tokenizer_config.json expects user-assistant turns, while here we need to feed user-assistant-...-user and then only assistant, meaning that the default format is not suitable for ORPO fine-tuning and needs to be updated","shortMessageHtmlLink":"Update chat_template for Mistral 7B Instruct v0.3"}},{"before":"b52ac13767e139ee254a0dcb6c0be8c7663031a2","after":"5309188f175f3981bdf7effa848f6a993b2cdddc","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T12:21:11.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"alvarobartt","name":"Alvaro Bartolome","path":"/alvarobartt","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/36760800?s=80&v=4"},"commit":{"message":"Update grad acc and per device bs","shortMessageHtmlLink":"Update grad acc and per device bs"}},{"before":"278607ef9cf04206f8b392c0381341d9e5ae80b2","after":"b52ac13767e139ee254a0dcb6c0be8c7663031a2","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T11:53:50.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Add requeue","shortMessageHtmlLink":"Add requeue"}},{"before":"257fb7f98927e003fc78112bcbebcd547dfb03bc","after":"278607ef9cf04206f8b392c0381341d9e5ae80b2","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T11:47:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Tune max lenght","shortMessageHtmlLink":"Tune max lenght"}},{"before":"e60abc4a90ed76b546fe7763733d35d435d407f0","after":"257fb7f98927e003fc78112bcbebcd547dfb03bc","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T11:45:01.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Fix models and remove filter","shortMessageHtmlLink":"Fix models and remove filter"}},{"before":"0914bd7170774a27f1e84e51d3ac40d4160ec274","after":"e60abc4a90ed76b546fe7763733d35d435d407f0","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T10:08:43.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Fix configs","shortMessageHtmlLink":"Fix configs"}},{"before":"94baa4e0374e4d9551c142a59a7956cfdbc137c5","after":"0914bd7170774a27f1e84e51d3ac40d4160ec274","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T09:41:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"alvarobartt","name":"Alvaro Bartolome","path":"/alvarobartt","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/36760800?s=80&v=4"},"commit":{"message":"Add `save_ckpt.py` script\n\nIdeally to be removed later on before merging.","shortMessageHtmlLink":"Add save_ckpt.py script"}},{"before":"df02a0db180e9f6fc1ca9bf34a3443102e67b082","after":"94baa4e0374e4d9551c142a59a7956cfdbc137c5","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T09:08:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Fix repo id","shortMessageHtmlLink":"Fix repo id"}},{"before":"addcf7055c3a53626e629136f830f4fbbcdfa82c","after":"df02a0db180e9f6fc1ca9bf34a3443102e67b082","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T08:38:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Tweak","shortMessageHtmlLink":"Tweak"}},{"before":"9f5fdaa6ab868e8cf97253cc5d95a91d4ac30b2a","after":"addcf7055c3a53626e629136f830f4fbbcdfa82c","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T08:31:41.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Add recipes","shortMessageHtmlLink":"Add recipes"}},{"before":"f857922a75d953db05b348675426a7fbd53b5050","after":"9f5fdaa6ab868e8cf97253cc5d95a91d4ac30b2a","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T08:28:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Add recipe","shortMessageHtmlLink":"Add recipe"}},{"before":"606d2e954fd17999af40e6fb4f712055ca11b2f0","after":"f857922a75d953db05b348675426a7fbd53b5050","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T08:20:33.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Bump deps","shortMessageHtmlLink":"Bump deps"}},{"before":null,"after":"606d2e954fd17999af40e6fb4f712055ca11b2f0","ref":"refs/heads/orpo-report","pushedAt":"2024-05-24T08:11:45.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Add fsdp+qlora support (#160)","shortMessageHtmlLink":"Add fsdp+qlora support (#160)"}},{"before":"5a86b3c70848f16f0e1dc0e149cb3c2b38ed1bc9","after":"2ad9d3641e43a367b494bc0b9041c06371ffc216","ref":"refs/heads/orpo-expts","pushedAt":"2024-05-10T18:12:04.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"foo","shortMessageHtmlLink":"foo"}},{"before":"5f43108a54c1fb792e9bb2d008ba2304e249ccc2","after":"5a86b3c70848f16f0e1dc0e149cb3c2b38ed1bc9","ref":"refs/heads/orpo-expts","pushedAt":"2024-05-09T05:46:51.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Add mixtral","shortMessageHtmlLink":"Add mixtral"}},{"before":"84f8c92820a526fab3c4777cc364cf35518de6d8","after":"606d2e954fd17999af40e6fb4f712055ca11b2f0","ref":"refs/heads/main","pushedAt":"2024-05-08T13:08:14.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Add fsdp+qlora support (#160)","shortMessageHtmlLink":"Add fsdp+qlora support (#160)"}},{"before":"ec6f4c4c794eeb5595f19f9921082c452ed26eb4","after":"5f43108a54c1fb792e9bb2d008ba2304e249ccc2","ref":"refs/heads/orpo-expts","pushedAt":"2024-05-08T12:31:01.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Add llama3","shortMessageHtmlLink":"Add llama3"}},{"before":"3eef5bc7329e653111a421d336ab8ecd4575723c","after":"ec6f4c4c794eeb5595f19f9921082c452ed26eb4","ref":"refs/heads/orpo-expts","pushedAt":"2024-05-08T12:23:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Add configs","shortMessageHtmlLink":"Add configs"}},{"before":"b63c6d3358ca6b5d7631d876ad33996f92533d22","after":"3eef5bc7329e653111a421d336ab8ecd4575723c","ref":"refs/heads/orpo-expts","pushedAt":"2024-05-07T08:49:04.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Add configs","shortMessageHtmlLink":"Add configs"}},{"before":"cf1975a7cb7173e970bd53ad15c31156350c6f3d","after":"84f8c92820a526fab3c4777cc364cf35518de6d8","ref":"refs/heads/main","pushedAt":"2024-04-25T08:36:22.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Update README.md (#152)\n\nIf use 2.3.6, there will be an error\r\n\r\nImportError: /root/miniconda3/envs/handbook/lib/python3.10/site-packages/flash_attn_2_cuda.cpython-310-x86_64-linux-gnu.so: undefined symbol: _ZN2at4_ops9_pad_enum4callERKNS_6TensorEN3c108ArrayRefINS5_6SymIntEEElNS5_8optionalIdEE\r\n\r\nIf we use the newest flash_attn version, there will be no trouble!","shortMessageHtmlLink":"Update README.md (#152)"}},{"before":"70769f9e9ba41c7f08ba6c4ff3725441b68b7ca3","after":"cf1975a7cb7173e970bd53ad15c31156350c6f3d","ref":"refs/heads/main","pushedAt":"2024-04-25T08:35:45.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"lewtun","name":null,"path":"/lewtun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/26859204?s=80&v=4"},"commit":{"message":"Add ORPO within `README.md` files (#154)\n\n* Add `ORPO` within `scripts/README.md`\r\n\r\n* Fix typo in `ModelArguments.base_model_revision`\r\n\r\n* Add `ORPO` within `README.md`\r\n\r\n* Add Zephyr 141B in \"News\" section","shortMessageHtmlLink":"Add ORPO within README.md files (#154)"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEU9w2wgA","startCursor":null,"endCursor":null}},"title":"Activity ยท huggingface/alignment-handbook"}