{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":707542304,"defaultBranch":"main","name":"Megatron-LLM","ownerLogin":"xingyaoww","currentUserCanPush":false,"isFork":true,"isEmpty":false,"createdAt":"2023-10-20T06:09:02.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/38853559?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1708358580.0","currentOid":""},"activityList":{"items":[{"before":"b0f85a7c7cc4ea16795bfe38a188483701839091","after":"1cc35e6c19e7e0bc3c7da2e220ad5724c00006d0","ref":"refs/heads/mmistral","pushedAt":"2024-05-22T06:50:04.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"only chat token only if not pretrain","shortMessageHtmlLink":"only chat token only if not pretrain"}},{"before":"48c5fc7ef968cc290ac7fc9dfeb19b18e35d03cb","after":"b0f85a7c7cc4ea16795bfe38a188483701839091","ref":"refs/heads/mmistral","pushedAt":"2024-04-16T04:37:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"add error handling for images","shortMessageHtmlLink":"add error handling for images"}},{"before":"ad30492a4be06546a7cb4c7533851c39af317896","after":"48c5fc7ef968cc290ac7fc9dfeb19b18e35d03cb","ref":"refs/heads/mmistral","pushedAt":"2024-04-16T04:16:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"fix chat template issue","shortMessageHtmlLink":"fix chat template issue"}},{"before":"0b6c4e3f8724dce016ca78ed83c31ee18b1ca73e","after":"ad30492a4be06546a7cb4c7533851c39af317896","ref":"refs/heads/mmistral","pushedAt":"2024-04-09T09:35:55.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"print path for mmap","shortMessageHtmlLink":"print path for mmap"}},{"before":"8081c7932315489b99acdcae8c0b1e88083c27ea","after":"0b6c4e3f8724dce016ca78ed83c31ee18b1ca73e","ref":"refs/heads/mmistral","pushedAt":"2024-03-22T09:22:14.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"remove extra prints","shortMessageHtmlLink":"remove extra prints"}},{"before":"4fae7aaa8a5e5d68cc7112cfd401b37b849f7695","after":"8081c7932315489b99acdcae8c0b1e88083c27ea","ref":"refs/heads/mmistral","pushedAt":"2024-03-03T06:30:43.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"fix loss_mask shift mis-match","shortMessageHtmlLink":"fix loss_mask shift mis-match"}},{"before":"24535fbbd1d02a281c06eff3c72a77b2aa2badd3","after":"4fae7aaa8a5e5d68cc7112cfd401b37b849f7695","ref":"refs/heads/mmistral","pushedAt":"2024-03-02T19:26:58.000Z","pushType":"push","commitsCount":4,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"fix setting consumed_test_samples","shortMessageHtmlLink":"fix setting consumed_test_samples"}},{"before":"2abb46112928204f951db42f9f82282d206de189","after":"24535fbbd1d02a281c06eff3c72a77b2aa2badd3","ref":"refs/heads/mmistral","pushedAt":"2024-03-02T08:30:09.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"print the first batch for visualization","shortMessageHtmlLink":"print the first batch for visualization"}},{"before":"b2529cb8e3b6704de46161fdca7bb9c62ccf3185","after":"3def3bd198d619fa06c1c6762a6e888c75a75782","ref":"refs/heads/mixtral","pushedAt":"2024-03-01T13:02:24.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"(wip) attempt to make mixtral working BUT need expert parallel to make this effecienct","shortMessageHtmlLink":"(wip) attempt to make mixtral working BUT need expert parallel to mak…"}},{"before":"7ea862ff85563c2703fec0f1a422971371ded2c3","after":"2abb46112928204f951db42f9f82282d206de189","ref":"refs/heads/mmistral","pushedAt":"2024-02-28T19:12:19.000Z","pushType":"push","commitsCount":4,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"add consumed_test_samples to support per eval_step testing","shortMessageHtmlLink":"add consumed_test_samples to support per eval_step testing"}},{"before":"5dede6d9c1dc51105d71c3004573dcb3f13fe1bb","after":"7ea862ff85563c2703fec0f1a422971371ded2c3","ref":"refs/heads/mmistral","pushedAt":"2024-02-26T10:15:35.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"handle edge case for conversations format","shortMessageHtmlLink":"handle edge case for conversations format"}},{"before":"31f2dea78c29d9e7a5490717a68e0bd1e6c5ee1f","after":"5dede6d9c1dc51105d71c3004573dcb3f13fe1bb","ref":"refs/heads/mmistral","pushedAt":"2024-02-25T16:31:19.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"change everything to float16 for patches","shortMessageHtmlLink":"change everything to float16 for patches"}},{"before":"5e14e1769b0b27f4ccd7dfa78f1a6bcbfc8615fb","after":"31f2dea78c29d9e7a5490717a68e0bd1e6c5ee1f","ref":"refs/heads/mmistral","pushedAt":"2024-02-25T14:56:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"add n_images stats;\nallow packing algorithm to keep long truncated docs;","shortMessageHtmlLink":"add n_images stats;"}},{"before":"b1d01cce1a64518516dca49d597e980c099605c5","after":"5e14e1769b0b27f4ccd7dfa78f1a6bcbfc8615fb","ref":"refs/heads/mmistral","pushedAt":"2024-02-25T14:27:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"fix n_image_tokens bug","shortMessageHtmlLink":"fix n_image_tokens bug"}},{"before":"31f442442136c0fabb67e50f39701884e59c8519","after":"b1d01cce1a64518516dca49d597e980c099605c5","ref":"refs/heads/mmistral","pushedAt":"2024-02-25T14:19:48.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"support a new format of data","shortMessageHtmlLink":"support a new format of data"}},{"before":"ef9ce0cb5c871f8e4ed75b83247a151a5f9265df","after":"31f442442136c0fabb67e50f39701884e59c8519","ref":"refs/heads/mmistral","pushedAt":"2024-02-25T11:55:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"support loading and saving index dataset in lz4 for disk space","shortMessageHtmlLink":"support loading and saving index dataset in lz4 for disk space"}},{"before":"77584d55a833d677139d3863ab1b677b0da7c0ef","after":"ef9ce0cb5c871f8e4ed75b83247a151a5f9265df","ref":"refs/heads/mmistral","pushedAt":"2024-02-24T16:02:17.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"support disable mp to speed up","shortMessageHtmlLink":"support disable mp to speed up"}},{"before":"cc49a7503aa6fd8065c7372748701544d846e082","after":"77584d55a833d677139d3863ab1b677b0da7c0ef","ref":"refs/heads/mmistral","pushedAt":"2024-02-24T08:17:44.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"add implementation that can work for multimodal instruction","shortMessageHtmlLink":"add implementation that can work for multimodal instruction"}},{"before":"6209c5a9b71360134be17122f4b7b7c86d98d569","after":"cc49a7503aa6fd8065c7372748701544d846e082","ref":"refs/heads/mmistral","pushedAt":"2024-02-23T09:18:04.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"support a different format of data","shortMessageHtmlLink":"support a different format of data"}},{"before":"b2e2649c0366fcf5696f948293055b8f665373dd","after":"6209c5a9b71360134be17122f4b7b7c86d98d569","ref":"refs/heads/mmistral","pushedAt":"2024-02-22T14:54:52.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"add preliminary implementation for multimodal mistral","shortMessageHtmlLink":"add preliminary implementation for multimodal mistral"}},{"before":"1addc8fc8ee485df31c8eec85b692f88bdf05afa","after":"b2e2649c0366fcf5696f948293055b8f665373dd","ref":"refs/heads/mmistral","pushedAt":"2024-02-22T14:09:20.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"fix padded vocab size for multimodal mistral","shortMessageHtmlLink":"fix padded vocab size for multimodal mistral"}},{"before":"c60dbeda7d20b52af02744ff9ce976dbc3d4846a","after":"1addc8fc8ee485df31c8eec85b692f88bdf05afa","ref":"refs/heads/mmistral","pushedAt":"2024-02-22T09:23:08.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"support adding row_sep","shortMessageHtmlLink":"support adding row_sep"}},{"before":"bca8a57f4411337825fd0e0f059ed7a0df0f3d98","after":"c60dbeda7d20b52af02744ff9ce976dbc3d4846a","ref":"refs/heads/mmistral","pushedAt":"2024-02-22T03:56:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"print # of documents at the end","shortMessageHtmlLink":"print # of documents at the end"}},{"before":"5532fb07a1a47fb652a4881ebcc6bc5199eb5c49","after":"bca8a57f4411337825fd0e0f059ed7a0df0f3d98","ref":"refs/heads/mmistral","pushedAt":"2024-02-22T02:17:03.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"fix typo","shortMessageHtmlLink":"fix typo"}},{"before":"1ea87c59b47b6da416b9d554d3d2f2801788895c","after":"5532fb07a1a47fb652a4881ebcc6bc5199eb5c49","ref":"refs/heads/mmistral","pushedAt":"2024-02-21T18:39:47.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"support packing","shortMessageHtmlLink":"support packing"}},{"before":"ddea50acba107216eaf0aab9ebf1c9d52bb3d789","after":"1ea87c59b47b6da416b9d554d3d2f2801788895c","ref":"refs/heads/mmistral","pushedAt":"2024-02-21T17:20:45.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"support convert mmistral to megatron","shortMessageHtmlLink":"support convert mmistral to megatron"}},{"before":null,"after":"ddea50acba107216eaf0aab9ebf1c9d52bb3d789","ref":"refs/heads/mmistral","pushedAt":"2024-02-19T16:03:00.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"add preliminary implementation for multi-modal data processing","shortMessageHtmlLink":"add preliminary implementation for multi-modal data processing"}},{"before":null,"after":"1b07577760437c61189f949643a52f49ba2f2a7e","ref":"refs/heads/multimodal-mistral","pushedAt":"2024-02-13T07:34:13.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"update megatron dependency","shortMessageHtmlLink":"update megatron dependency"}},{"before":null,"after":"b2529cb8e3b6704de46161fdca7bb9c62ccf3185","ref":"refs/heads/mixtral","pushedAt":"2024-01-17T05:58:47.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"(wip) stash","shortMessageHtmlLink":"(wip) stash"}},{"before":"03f698f7f417eb0020e1fb2efcb2f4cf39d24941","after":"1b07577760437c61189f949643a52f49ba2f2a7e","ref":"refs/heads/main","pushedAt":"2024-01-16T15:40:51.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"xingyaoww","name":"Xingyao Wang","path":"/xingyaoww","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/38853559?s=80&v=4"},"commit":{"message":"update megatron dependency","shortMessageHtmlLink":"update megatron dependency"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEUJcs8wA","startCursor":null,"endCursor":null}},"title":"Activity · xingyaoww/Megatron-LLM"}