{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":708424003,"defaultBranch":"main","name":"Multi-Objective-Reinforcement-Learning-from-AI-Feedback","ownerLogin":"carolius","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-10-22T14:24:23.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/35470278?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1697984664.2489522","currentOid":""},"activityList":{"items":[{"before":"5803d2ba6e85bd1a17997a001ab443d4b9ecf2a2","after":"9b6eaa16b9f607019f099dd969af9486f6166cfe","ref":"refs/heads/main","pushedAt":"2024-06-12T14:06:50.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"updated readme","shortMessageHtmlLink":"updated readme"}},{"before":"095b38eec037732f6bec6c11081711e287277bdc","after":"5803d2ba6e85bd1a17997a001ab443d4b9ecf2a2","ref":"refs/heads/main","pushedAt":"2024-06-08T19:39:42.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"clean up","shortMessageHtmlLink":"clean up"}},{"before":"997feebd18ce30b0efc5f26ea9398c66110d771f","after":"095b38eec037732f6bec6c11081711e287277bdc","ref":"refs/heads/main","pushedAt":"2024-06-08T19:35:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"added bernoulli-nash","shortMessageHtmlLink":"added 
bernoulli-nash"}},{"before":"84c3afbbfb4073a08005d5fa41a62432adc8e103","after":"997feebd18ce30b0efc5f26ea9398c66110d771f","ref":"refs/heads/main","pushedAt":"2024-06-08T13:25:53.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"fixed images","shortMessageHtmlLink":"fixed images"}},{"before":"66f9528fbbb0bb4ee99245daf3dc8934fcde6443","after":"84c3afbbfb4073a08005d5fa41a62432adc8e103","ref":"refs/heads/main","pushedAt":"2024-06-08T13:24:03.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"added plots","shortMessageHtmlLink":"added plots"}},{"before":"2e9c93c9267b6420a73a5e7f8ce430b61c6b9bff","after":"66f9528fbbb0bb4ee99245daf3dc8934fcde6443","ref":"refs/heads/main","pushedAt":"2024-06-08T13:23:32.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"updated README","shortMessageHtmlLink":"updated README"}},{"before":"850f4b77af005b52f62d9a082e87e551f3723199","after":"2e9c93c9267b6420a73a5e7f8ce430b61c6b9bff","ref":"refs/heads/main","pushedAt":"2024-05-06T13:51:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"changed to custom version of TRLX and various PPO bugfixes","shortMessageHtmlLink":"changed to custom version of TRLX and various PPO 
bugfixes"}},{"before":"0f3455a0d078940f4da26f3b2a6d5a36cf7974cd","after":"850f4b77af005b52f62d9a082e87e551f3723199","ref":"refs/heads/main","pushedAt":"2024-04-29T19:17:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"added PPO scripts","shortMessageHtmlLink":"added PPO scripts"}},{"before":"515f8392a58e5ed32064ee6f26ec53d5a5cd7114","after":"0f3455a0d078940f4da26f3b2a6d5a36cf7974cd","ref":"refs/heads/main","pushedAt":"2024-04-29T18:11:07.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"updated readme","shortMessageHtmlLink":"updated readme"}},{"before":"7e4eddb65b50958e52392bb1ad599b690798925a","after":"515f8392a58e5ed32064ee6f26ec53d5a5cd7114","ref":"refs/heads/main","pushedAt":"2024-04-29T14:27:43.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"added the principles for the 14 principle experiment","shortMessageHtmlLink":"added the principles for the 14 principle experiment"}},{"before":"f8bef440dbe0ec9235ce33f9a1424fede50bb126","after":"7e4eddb65b50958e52392bb1ad599b690798925a","ref":"refs/heads/main","pushedAt":"2024-04-26T07:24:48.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"changed principle format","shortMessageHtmlLink":"changed principle 
format"}},{"before":"4b4b046e98ce49703c44b8434cdfc72b87909bda","after":"f8bef440dbe0ec9235ce33f9a1424fede50bb126","ref":"refs/heads/main","pushedAt":"2024-04-26T07:22:26.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"updated requirements","shortMessageHtmlLink":"updated requirements"}},{"before":"23300560668489d1e632ec1b9c18fd7b9733faee","after":"4b4b046e98ce49703c44b8434cdfc72b87909bda","ref":"refs/heads/main","pushedAt":"2024-04-26T07:21:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"8xA100 FSDP config","shortMessageHtmlLink":"8xA100 FSDP config"}},{"before":"cf2670e602aa3433de1fd1f782d881bbf6f997ab","after":"23300560668489d1e632ec1b9c18fd7b9733faee","ref":"refs/heads/main","pushedAt":"2024-04-21T10:19:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"updated description","shortMessageHtmlLink":"updated description"}},{"before":"0a34d40aac42375614240a1553224a396c7154ce","after":"cf2670e602aa3433de1fd1f782d881bbf6f997ab","ref":"refs/heads/main","pushedAt":"2024-04-20T15:16:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"added more results","shortMessageHtmlLink":"added more 
results"}},{"before":"5fa5498f8d63592ec88d44bf41def9552df07883","after":"0a34d40aac42375614240a1553224a396c7154ce","ref":"refs/heads/main","pushedAt":"2024-04-03T10:19:23.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"fixes","shortMessageHtmlLink":"fixes"}},{"before":"fa43141923f7800c75a6c320eb8a0e1f512558c7","after":"5fa5498f8d63592ec88d44bf41def9552df07883","ref":"refs/heads/main","pushedAt":"2024-04-03T10:18:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"misc scripts to investigate data","shortMessageHtmlLink":"misc scripts to investigate data"}},{"before":"cf6eb88e119b82c63a323c11402321b88326e35a","after":"fa43141923f7800c75a6c320eb8a0e1f512558c7","ref":"refs/heads/main","pushedAt":"2024-04-03T10:18:22.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"changed to fewer principles","shortMessageHtmlLink":"changed to fewer principles"}},{"before":"80ba879d4185db78a8b1482cdca6e4019dff71d1","after":"cf6eb88e119b82c63a323c11402321b88326e35a","ref":"refs/heads/main","pushedAt":"2024-04-03T10:16:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"changed prompt format","shortMessageHtmlLink":"changed prompt 
format"}},{"before":"7dc17dd316ff34e71d7b9bc02c240b663ca795de","after":"80ba879d4185db78a8b1482cdca6e4019dff71d1","ref":"refs/heads/main","pushedAt":"2024-03-28T09:26:26.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"switched to TRLX","shortMessageHtmlLink":"switched to TRLX"}},{"before":"9daeb02d0512508de34306c97482a4384e54635b","after":"7dc17dd316ff34e71d7b9bc02c240b663ca795de","ref":"refs/heads/main","pushedAt":"2024-03-24T15:11:47.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"added PPO training for SO Constitutional AI baseline","shortMessageHtmlLink":"added PPO training for SO Constitutional AI baseline"}},{"before":"10560a6e6e16349da7e298f829ee7aa6ef75c60f","after":"9daeb02d0512508de34306c97482a4384e54635b","ref":"refs/heads/main","pushedAt":"2024-03-24T15:10:59.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"updated pm hhh benchmark","shortMessageHtmlLink":"updated pm hhh benchmark"}},{"before":"f98f58c582c49418e557a27534b399b6f267e45d","after":"10560a6e6e16349da7e298f829ee7aa6ef75c60f","ref":"refs/heads/main","pushedAt":"2024-03-24T15:10:26.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"fixed gemini feedback","shortMessageHtmlLink":"fixed gemini 
feedback"}},{"before":"502fc131e836886ee12ddf2f0e36ac4e365c0085","after":"f98f58c582c49418e557a27534b399b6f267e45d","ref":"refs/heads/main","pushedAt":"2024-03-21T11:11:24.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"added PM hhh-alignment benchmark","shortMessageHtmlLink":"added PM hhh-alignment benchmark"}},{"before":"fdd663fdd1efe936a6d410ac6ace731aab1d7ac1","after":"502fc131e836886ee12ddf2f0e36ac4e365c0085","ref":"refs/heads/main","pushedAt":"2024-03-20T12:12:33.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"clean up","shortMessageHtmlLink":"clean up"}},{"before":"de0a70bbfa2b1c6104e3f18cbd630600931e3788","after":"fdd663fdd1efe936a6d410ac6ace731aab1d7ac1","ref":"refs/heads/main","pushedAt":"2024-03-20T12:08:24.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"added gemini feedback model support","shortMessageHtmlLink":"added gemini feedback model support"}},{"before":"1a9d55922902f52d17f7eb1499684b6e5cdb426f","after":"de0a70bbfa2b1c6104e3f18cbd630600931e3788","ref":"refs/heads/main","pushedAt":"2024-03-04T13:28:22.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"Now sends feedback api requests in parallel (much faster)","shortMessageHtmlLink":"Now sends feedback api requests in parallel (much 
faster)"}},{"before":"52dc3b12a560008602caf44bf13b20879b4105df","after":"1a9d55922902f52d17f7eb1499684b6e5cdb426f","ref":"refs/heads/main","pushedAt":"2024-02-23T10:34:03.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"updated readme","shortMessageHtmlLink":"updated readme"}},{"before":"3705e3e1ef0fbba9ce9d6b42ba38a91c82f60b20","after":"52dc3b12a560008602caf44bf13b20879b4105df","ref":"refs/heads/main","pushedAt":"2024-02-23T10:31:09.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"reduced duplicate code","shortMessageHtmlLink":"reduced duplicate code"}},{"before":"e9b5d3b9ed4d5db0b4c36d1d19d28c60776211da","after":"3705e3e1ef0fbba9ce9d6b42ba38a91c82f60b20","ref":"refs/heads/main","pushedAt":"2024-02-21T19:31:31.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"carolius","name":"Marcus Williams","path":"/carolius","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/35470278?s=80&v=4"},"commit":{"message":"added more PM training scripts","shortMessageHtmlLink":"added more PM training scripts"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEY2SHOQA","startCursor":null,"endCursor":null}},"title":"Activity · carolius/Multi-Objective-Reinforcement-Learning-from-AI-Feedback"}