{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":743870569,"defaultBranch":"develop","name":"InternEvo","ownerLogin":"InternLM","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2024-01-16T06:57:08.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/135356492?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1718188311.0","currentOid":""},"activityList":{"items":[{"before":"95064fd784bf64d168d20f741183f475021fe2a2","after":"f147c01a39819bd07a81f031204706e188fe61f1","ref":"refs/heads/internevo-huggingface","pushedAt":"2024-06-21T09:40:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"zigzagcai","name":"Season","path":"/zigzagcai","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/8370601?s=80&v=4"},"commit":{"message":"update config","shortMessageHtmlLink":"update config"}},{"before":"34c11d88b8636e494b918758bfae6a8b056c7585","after":"95064fd784bf64d168d20f741183f475021fe2a2","ref":"refs/heads/internevo-huggingface","pushedAt":"2024-06-21T09:20:29.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"zigzagcai","name":"Season","path":"/zigzagcai","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/8370601?s=80&v=4"},"commit":{"message":"update metric record for hf","shortMessageHtmlLink":"update metric record for hf"}},{"before":"ff2b94e2672aebd4f90b34506d224601460ad98b","after":"34c11d88b8636e494b918758bfae6a8b056c7585","ref":"refs/heads/internevo-huggingface","pushedAt":"2024-06-21T08:40:00.000Z","pushType":"push","commitsCount":6,"pusher":{"login":"zigzagcai","name":"Season","path":"/zigzagcai","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/8370601?s=80&v=4"},"commit":{"message":"Merge remote-tracking branch 'origin/develop' into internevo-huggingface","shortMessageHtmlLink":"Merge remote-tracking branch 'origin/develop' into internevo-huggingface"}},{"before":"42fbdf7668cd769c2f8c799b76ccbc2c2855487e","after":"ff2b94e2672aebd4f90b34506d224601460ad98b","ref":"refs/heads/internevo-huggingface","pushedAt":"2024-06-20T13:43:56.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"zigzagcai","name":"Season","path":"/zigzagcai","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/8370601?s=80&v=4"},"commit":{"message":"add support for streaming huggingface dataloader","shortMessageHtmlLink":"add support for streaming huggingface dataloader"}},{"before":"3afaf150fd2cd63154f3f7339476724f80e44649","after":"42fbdf7668cd769c2f8c799b76ccbc2c2855487e","ref":"refs/heads/internevo-huggingface","pushedAt":"2024-06-20T13:06:44.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"sallyjunjun","name":null,"path":"/sallyjunjun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/72725839?s=80&v=4"},"commit":{"message":"fix load actual dataset error","shortMessageHtmlLink":"fix load actual dataset error"}},{"before":"f566c679b8a190cf4b5db11fa48584e11e9d3dcd","after":"c7649331088841a2daebea7bd85d36749397dcc8","ref":"refs/heads/feat/loong-train","pushedAt":"2024-06-20T10:06:03.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"huangting4201","name":null,"path":"/huangting4201","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20810277?s=80&v=4"},"commit":{"message":"fix(pipeline.py): fix mfu","shortMessageHtmlLink":"fix(pipeline.py): fix mfu"}},{"before":"652baca0a2231307a38568be0c51b0083eaeccdc","after":"f566c679b8a190cf4b5db11fa48584e11e9d3dcd","ref":"refs/heads/feat/loong-train","pushedAt":"2024-06-20T06:50:47.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"huangting4201","name":null,"path":"/huangting4201","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20810277?s=80&v=4"},"commit":{"message":"fix(isp.py): remove sync and barrier","shortMessageHtmlLink":"fix(isp.py): remove sync and barrier"}},{"before":"acddf161bf252317b23da2a48372f17b83cafb29","after":"652baca0a2231307a38568be0c51b0083eaeccdc","ref":"refs/heads/feat/loong-train","pushedAt":"2024-06-20T04:18:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"huangting4201","name":null,"path":"/huangting4201","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20810277?s=80&v=4"},"commit":{"message":"fix(train/pipeline.py): remove redundant print","shortMessageHtmlLink":"fix(train/pipeline.py): remove redundant print"}},{"before":"ae1e6b117de7c50f8be5033dbe85b4fef8037f15","after":"acddf161bf252317b23da2a48372f17b83cafb29","ref":"refs/heads/feat/loong-train","pushedAt":"2024-06-20T04:07:21.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"huangting4201","name":null,"path":"/huangting4201","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20810277?s=80&v=4"},"commit":{"message":"feat(zigzag_ring_flash_attn_with_sliding_window.py): kv and dkv use diff process group to optimize p2p comm overlap","shortMessageHtmlLink":"feat(zigzag_ring_flash_attn_with_sliding_window.py): kv and dkv use d…"}},{"before":"04db9f66504ba95a74178ce2ce203f2011fcea86","after":"a61d391df96c5f5c243cdea32a5044b70d6fe33e","ref":"refs/heads/develop","pushedAt":"2024-06-19T14:09:33.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"gaoyang07","name":"Yang Gao","path":"/gaoyang07","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/32762712?s=80&v=4"},"commit":{"message":"feat(data): load meta files with shared memory (#255)","shortMessageHtmlLink":"feat(data): load meta files with shared memory (#255)"}},{"before":"2ac3dcf8671e330baf7e5bd3195fef485c979545","after":"04db9f66504ba95a74178ce2ce203f2011fcea86","ref":"refs/heads/develop","pushedAt":"2024-06-19T05:49:13.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"sunpengsdu","name":"Sun Peng","path":"/sunpengsdu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/6859848?s=80&v=4"},"commit":{"message":"Feat (optimizer): add new optimizer for spliting zero tensor (#237)","shortMessageHtmlLink":"Feat (optimizer): add new optimizer for spliting zero tensor (#237)"}},{"before":"a35c7a56cd304f463f2aea20cd2747137011c9ec","after":"ae1e6b117de7c50f8be5033dbe85b4fef8037f15","ref":"refs/heads/feat/loong-train","pushedAt":"2024-06-17T12:22:47.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"huangting4201","name":null,"path":"/huangting4201","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20810277?s=80&v=4"},"commit":{"message":"test(*): add backward timing (#252)","shortMessageHtmlLink":"test(*): add backward timing (#252)"}},{"before":"3a01d1a73da07491a47d9339d44221ee54a10366","after":"3afaf150fd2cd63154f3f7339476724f80e44649","ref":"refs/heads/internevo-huggingface","pushedAt":"2024-06-13T03:42:49.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"sallyjunjun","name":null,"path":"/sallyjunjun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/72725839?s=80&v=4"},"commit":{"message":"adapt huggingface\n1. currently can run with no parallel and use unpacked dummy dataset\nTODO:\n1. use parallel strategy\n2. load dataset\n3. load pretrained model\n4. finally, find a way to modify our code, and tell which part should be adapted in modeling file from huggingface","shortMessageHtmlLink":"adapt huggingface"}},{"before":"cf764787833918f650d7638e2953ccc9bcd916bd","after":"3a01d1a73da07491a47d9339d44221ee54a10366","ref":"refs/heads/internevo-huggingface","pushedAt":"2024-06-13T03:40:46.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"sallyjunjun","name":null,"path":"/sallyjunjun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/72725839?s=80&v=4"},"commit":{"message":"adapt huggingface\n1. currently can run with no parallel and use unpacked dummy dataset\nTODO:\n1. use parallel strategy\n2. load dataset\n3. load pretrained model\n4. finally, find a way to modify our code, and tell which part should be adapted in modeling file from huggingface","shortMessageHtmlLink":"adapt huggingface"}},{"before":"1b72e9739985ff0c8458671d78ff1a50a788f19c","after":"cf764787833918f650d7638e2953ccc9bcd916bd","ref":"refs/heads/internevo-huggingface","pushedAt":"2024-06-13T03:38:30.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"sallyjunjun","name":null,"path":"/sallyjunjun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/72725839?s=80&v=4"},"commit":{"message":"adapt huggingface\n1. currently can run with no parallel and use unpacked dummy dataset\nTODO:\n1. use parallel strategy\n2. load dataset\n3. load pretrained model\n4. finally, find a way to modify our code, and tell which part should be adapted in modeling file from huggingface","shortMessageHtmlLink":"adapt huggingface"}},{"before":"58a52e3cb32d59b35b2ef8f02aa5cc22e2cabed7","after":null,"ref":"refs/heads/fix/reward_linear","pushedAt":"2024-06-12T10:31:51.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"KimmiShi","name":"KimmiShi","path":"/KimmiShi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/13433751?s=80&v=4"}},{"before":"eaef99e3c99fb5ab4f8ec56deccb9fc28514c946","after":"2ac3dcf8671e330baf7e5bd3195fef485c979545","ref":"refs/heads/develop","pushedAt":"2024-06-12T10:00:24.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"sunpengsdu","name":"Sun Peng","path":"/sunpengsdu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/6859848?s=80&v=4"},"commit":{"message":"fix: RewardModelLinear bcast process_group (#249)\n\nCo-authored-by: shidongxing ","shortMessageHtmlLink":"fix: RewardModelLinear bcast process_group (#249)"}},{"before":null,"after":"58a52e3cb32d59b35b2ef8f02aa5cc22e2cabed7","ref":"refs/heads/fix/reward_linear","pushedAt":"2024-06-12T09:16:50.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"KimmiShi","name":"KimmiShi","path":"/KimmiShi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/13433751?s=80&v=4"},"commit":{"message":"fix RewardModelLinear bcast","shortMessageHtmlLink":"fix RewardModelLinear bcast"}},{"before":"7035d400f2a55362e50e968dc6ff3a58d2ac6a14","after":"a35c7a56cd304f463f2aea20cd2747137011c9ec","ref":"refs/heads/feat/loong-train","pushedAt":"2024-06-12T07:01:33.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"huangting4201","name":null,"path":"/huangting4201","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20810277?s=80&v=4"},"commit":{"message":"fix(zigzag_ring_flash_attn_with_sliding_window.py): fix inter window backward pp overlap","shortMessageHtmlLink":"fix(zigzag_ring_flash_attn_with_sliding_window.py): fix inter window …"}},{"before":"e96450abdfab27c6da7188a5f1dd998dec8d6fe9","after":"eaef99e3c99fb5ab4f8ec56deccb9fc28514c946","ref":"refs/heads/develop","pushedAt":"2024-06-11T05:23:58.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"gaoyang07","name":"Yang Gao","path":"/gaoyang07","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/32762712?s=80&v=4"},"commit":{"message":"feat(inference): support generation using trainer (#230)","shortMessageHtmlLink":"feat(inference): support generation using trainer (#230)"}},{"before":"6d659939e03bfa7552e308c5848bf60293aa87fe","after":"b2f433d414db3cf1261907d86daa9ddfaecc1968","ref":"refs/heads/feat/marl","pushedAt":"2024-06-11T03:57:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KimmiShi","name":"KimmiShi","path":"/KimmiShi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/13433751?s=80&v=4"},"commit":{"message":"fix testcase","shortMessageHtmlLink":"fix testcase"}},{"before":"7fc8c81b03449ceb27f711bb973d152675fa012a","after":"d30306380948b1a34c4d9befd6eadccd85e94add","ref":"refs/heads/feat/fmoe_tutel_exp","pushedAt":"2024-06-07T10:47:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"KimmiShi","name":"KimmiShi","path":"/KimmiShi","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/13433751?s=80&v=4"},"commit":{"message":"update moe","shortMessageHtmlLink":"update moe"}},{"before":"72db800659881edba918661bc8eb57fb63074e11","after":"7035d400f2a55362e50e968dc6ff3a58d2ac6a14","ref":"refs/heads/feat/loong-train","pushedAt":"2024-06-07T08:48:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"huangting4201","name":null,"path":"/huangting4201","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20810277?s=80&v=4"},"commit":{"message":"fix(pipeline.py): fix tgs print","shortMessageHtmlLink":"fix(pipeline.py): fix tgs print"}},{"before":null,"after":"036b567481ab5f5a0bba57bea797a201180b4f78","ref":"refs/heads/feat/add_tutel_all2all","pushedAt":"2024-06-07T02:41:41.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"SolenoidWGT","name":"Guoteng","path":"/SolenoidWGT","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/32697156?s=80&v=4"},"commit":{"message":"feat(all2all): add single & tutel all2all","shortMessageHtmlLink":"feat(all2all): add single & tutel all2all"}},{"before":"2380a22938971fa31285178a1d24f75e89780b17","after":"1b72e9739985ff0c8458671d78ff1a50a788f19c","ref":"refs/heads/internevo-huggingface","pushedAt":"2024-06-06T08:02:11.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"sallyjunjun","name":null,"path":"/sallyjunjun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/72725839?s=80&v=4"},"commit":{"message":"adapt huggingface\n1. currently can run with no parallel and use unpacked dummy dataset\nTODO:\n1. use parallel strategy\n2. load dataset\n3. load pretrained model\n4. finally, find a way to modify our code, and tell which part should be adapted in modeling file from huggingface","shortMessageHtmlLink":"adapt huggingface"}},{"before":"c5fe7de0fccfce12263d6946136c1ebc69994200","after":"2380a22938971fa31285178a1d24f75e89780b17","ref":"refs/heads/internevo-huggingface","pushedAt":"2024-06-06T07:59:52.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"sallyjunjun","name":null,"path":"/sallyjunjun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/72725839?s=80&v=4"},"commit":{"message":"adapt huggingface\n1. currently can run with no parallel and use unpacked dummy dataset\nTODO:\n1. use parallel strategy\n2. load dataset\n3. load pretrained model\n4. finally, find a way to modify our code, and tell which part should be adapted in modeling file from huggingface","shortMessageHtmlLink":"adapt huggingface"}},{"before":"6b5cb1c43d146945e9b95073c0000c932acfcfb1","after":"c5fe7de0fccfce12263d6946136c1ebc69994200","ref":"refs/heads/internevo-huggingface","pushedAt":"2024-06-06T07:58:44.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"sallyjunjun","name":null,"path":"/sallyjunjun","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/72725839?s=80&v=4"},"commit":{"message":"adapt huggingface\n1. currently can run with no parallel and use unpacked dataset\nTODO:\n1. use parallel strategy\n2. load dataset\n3. load pretrained model\n4. finally, find a way to modify our code, and tell which part should be adapted in modeling file from huggingface","shortMessageHtmlLink":"adapt huggingface"}},{"before":"84cee4c59cfd4645e688cd3e249917b20f3b1076","after":"72db800659881edba918661bc8eb57fb63074e11","ref":"refs/heads/feat/loong-train","pushedAt":"2024-06-06T06:52:55.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"huangting4201","name":null,"path":"/huangting4201","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20810277?s=80&v=4"},"commit":{"message":"test(*):add seq and e2e modifications (#247)","shortMessageHtmlLink":"test(*):add seq and e2e modifications (#247)"}},{"before":"d19b0056e416bc069caf966d7be7c7393f607f41","after":"84cee4c59cfd4645e688cd3e249917b20f3b1076","ref":"refs/heads/feat/loong-train","pushedAt":"2024-06-06T02:41:20.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"huangting4201","name":null,"path":"/huangting4201","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20810277?s=80&v=4"},"commit":{"message":"Feat/support sliding window attn selective checkpoint (#246)","shortMessageHtmlLink":"Feat/support sliding window attn selective checkpoint (#246)"}},{"before":"e6b28318297c10771acf4f8b7fb301acd70ee37f","after":"03a8b6e431b9b4517d9b08c0e1b246f71414c92f","ref":"refs/heads/feat/support-sliding-window-attn-selective-checkpoint","pushedAt":"2024-06-06T02:39:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"huangting4201","name":null,"path":"/huangting4201","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/20810277?s=80&v=4"},"commit":{"message":"feat(configs/7B_internlm2.py): update config file","shortMessageHtmlLink":"feat(configs/7B_internlm2.py): update config file"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEa24NSwA","startCursor":null,"endCursor":null}},"title":"Activity · InternLM/InternEvo"}