{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":647984858,"defaultBranch":"main","name":"llm-awq","ownerLogin":"mit-han-lab","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-06-01T00:42:45.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/39571499?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1715023354.0","currentOid":""},"activityList":{"items":[{"before":"0f1b75a406b2dcbc35a0ebffc42a36e846769a72","after":null,"ref":"refs/heads/dev/0506","pushedAt":"2024-05-06T19:22:34.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"}},{"before":"05ba4972099b2de05e393ea4ed24da4c181f86aa","after":"b2b34f37ae465dae4379918a73c987d8a8123c09","ref":"refs/heads/main","pushedAt":"2024-05-06T19:22:22.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"upload model_worker_new.py (#182)","shortMessageHtmlLink":"upload model_worker_new.py (#182)"}},{"before":"05ba4972099b2de05e393ea4ed24da4c181f86aa","after":"0f1b75a406b2dcbc35a0ebffc42a36e846769a72","ref":"refs/heads/dev/0506","pushedAt":"2024-05-06T19:20:12.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"upload model_worker_new.py","shortMessageHtmlLink":"upload model_worker_new.py"}},{"before":null,"after":"05ba4972099b2de05e393ea4ed24da4c181f86aa","ref":"refs/heads/dev/0506","pushedAt":"2024-05-06T19:18:22.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"VILA1.5 launch (#180)\n\n* [Major] VILA1.5 launch.\r\n\r\n* [Minor] Update gradio serving README for VILA 1.5\r\n\r\n---------\r\n\r\nCo-authored-by: Shang Yang <61508922+ys-2020@users.noreply.github.com>","shortMessageHtmlLink":"VILA1.5 launch (#180)"}},{"before":"c07f8209fe62295577b91b887a0d32c2ace9be92","after":"05ba4972099b2de05e393ea4ed24da4c181f86aa","ref":"refs/heads/main","pushedAt":"2024-05-03T15:57:20.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"VILA1.5 launch (#180)\n\n* [Major] VILA1.5 launch.\r\n\r\n* [Minor] Update gradio serving README for VILA 1.5\r\n\r\n---------\r\n\r\nCo-authored-by: Shang Yang <61508922+ys-2020@users.noreply.github.com>","shortMessageHtmlLink":"VILA1.5 launch (#180)"}},{"before":"d874dd38237281a18009252716feff7e997f7e26","after":"3095ea29097d80ff1fecf748fb9c51c9a07f210e","ref":"refs/heads/dev/vila_1.5","pushedAt":"2024-05-03T15:56:57.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"[Minor] Update gradio serving README for VILA 1.5","shortMessageHtmlLink":"[Minor] Update gradio serving README for VILA 1.5"}},{"before":"c07f8209fe62295577b91b887a0d32c2ace9be92","after":"d874dd38237281a18009252716feff7e997f7e26","ref":"refs/heads/dev/vila_1.5","pushedAt":"2024-05-03T15:42:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"kentang-mit","name":"Haotian (Ken) Tang","path":"/kentang-mit","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/30133450?s=80&v=4"},"commit":{"message":"[Major] VILA1.5 launch.","shortMessageHtmlLink":"[Major] VILA1.5 launch."}},{"before":null,"after":"c07f8209fe62295577b91b887a0d32c2ace9be92","ref":"refs/heads/dev/vila_1.5","pushedAt":"2024-05-03T15:41:57.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"kentang-mit","name":"Haotian (Ken) Tang","path":"/kentang-mit","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/30133450?s=80&v=4"},"commit":{"message":"Update README.md (#179)","shortMessageHtmlLink":"Update README.md (#179)"}},{"before":"494d2a79a2ab1532ae306eb158a872e7183b25c6","after":null,"ref":"refs/heads/update_0501","pushedAt":"2024-05-01T16:17:25.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"}},{"before":"b76fab62aa371435217c20dd2d108aaad008d840","after":"c07f8209fe62295577b91b887a0d32c2ace9be92","ref":"refs/heads/main","pushedAt":"2024-05-01T16:17:21.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"Update README.md (#179)","shortMessageHtmlLink":"Update README.md (#179)"}},{"before":"b76fab62aa371435217c20dd2d108aaad008d840","after":"494d2a79a2ab1532ae306eb158a872e7183b25c6","ref":"refs/heads/update_0501","pushedAt":"2024-05-01T16:16:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":null,"after":"b76fab62aa371435217c20dd2d108aaad008d840","ref":"refs/heads/update_0501","pushedAt":"2024-05-01T16:15:47.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"[Major] Support Llama3 and update on-the-fly rope scaling (#177)","shortMessageHtmlLink":"[Major] Support Llama3 and update on-the-fly rope scaling (#177)"}},{"before":"83da769fa2e6439c8c20f53a7bc1f873122d9622","after":"b76fab62aa371435217c20dd2d108aaad008d840","ref":"refs/heads/main","pushedAt":"2024-04-29T04:01:45.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"kentang-mit","name":"Haotian (Ken) Tang","path":"/kentang-mit","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/30133450?s=80&v=4"},"commit":{"message":"[Major] Support Llama3 and update on-the-fly rope scaling (#177)","shortMessageHtmlLink":"[Major] Support Llama3 and update on-the-fly rope scaling (#177)"}},{"before":"83da769fa2e6439c8c20f53a7bc1f873122d9622","after":"98d9a64ff0619eca04fa98002d9679e61335cedb","ref":"refs/heads/dev/llama_3","pushedAt":"2024-04-29T04:00:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"kentang-mit","name":"Haotian (Ken) Tang","path":"/kentang-mit","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/30133450?s=80&v=4"},"commit":{"message":"[Major] Support Llama3 and update on-the-fly rope scaling","shortMessageHtmlLink":"[Major] Support Llama3 and update on-the-fly rope scaling"}},{"before":null,"after":"83da769fa2e6439c8c20f53a7bc1f873122d9622","ref":"refs/heads/dev/llama_3","pushedAt":"2024-04-29T03:58:28.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"kentang-mit","name":"Haotian (Ken) Tang","path":"/kentang-mit","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/30133450?s=80&v=4"},"commit":{"message":"[Minor] Update README. (#168)\n\n* Update vLLM link.\r\n\r\n* Update industrial impacts","shortMessageHtmlLink":"[Minor] Update README. (#168)"}},{"before":"7e3577056d005752fbe72ef782e49d9fd0e76257","after":null,"ref":"refs/heads/dev/update_readme_0329","pushedAt":"2024-03-30T01:49:45.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"}},{"before":"5efd875ac957c36fd5af35ea099b50cdeac12144","after":null,"ref":"refs/heads/dev/tinychat_update_0918","pushedAt":"2024-03-30T01:49:28.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"}},{"before":"87070e6ad1268989151961a1a0d1695331c9f066","after":null,"ref":"refs/heads/dev/vila_release_0222","pushedAt":"2024-03-30T01:49:12.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"}},{"before":"79019832efd37e4c24a695442880190858aa605e","after":"83da769fa2e6439c8c20f53a7bc1f873122d9622","ref":"refs/heads/main","pushedAt":"2024-03-30T01:48:33.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"kentang-mit","name":"Haotian (Ken) Tang","path":"/kentang-mit","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/30133450?s=80&v=4"},"commit":{"message":"[Minor] Update README. (#168)\n\n* Update vLLM link.\r\n\r\n* Update industrial impacts","shortMessageHtmlLink":"[Minor] Update README. (#168)"}},{"before":"8f6b613c5b0c1dcbd1db3923caf6bd93b35287ca","after":null,"ref":"refs/heads/dev/update_news_0229","pushedAt":"2024-03-30T01:48:33.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"}},{"before":"ef970cf841b3cd162906c3deaee1169a4a3c0494","after":null,"ref":"refs/heads/ys-2020-patch-1","pushedAt":"2024-03-30T01:46:21.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"}},{"before":"671e9461d2498317beedcf3e687051873ac66b78","after":"7e3577056d005752fbe72ef782e49d9fd0e76257","ref":"refs/heads/dev/update_readme_0329","pushedAt":"2024-03-30T01:45:57.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"Update industrial impacts","shortMessageHtmlLink":"Update industrial impacts"}},{"before":null,"after":"ef970cf841b3cd162906c3deaee1169a4a3c0494","ref":"refs/heads/ys-2020-patch-1","pushedAt":"2024-03-30T01:44:43.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"Update industry impact","shortMessageHtmlLink":"Update industry impact"}},{"before":"79019832efd37e4c24a695442880190858aa605e","after":"671e9461d2498317beedcf3e687051873ac66b78","ref":"refs/heads/dev/update_readme_0329","pushedAt":"2024-03-30T01:17:21.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"Update vLLM link.","shortMessageHtmlLink":"Update vLLM link."}},{"before":null,"after":"79019832efd37e4c24a695442880190858aa605e","ref":"refs/heads/dev/update_readme_0329","pushedAt":"2024-03-30T01:15:13.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"Fix transformers version (#156)\n\nWhen running AWQ search foe Llama2 with transformers>=4.38.0, I find the bug below:\r\nFile \"/×××/llm-awq/awq/quantize/auto_scale.py\", line 134, in _search_module_scale\r\nRuntimeError: The expanded size of the tensor (4608) must match the existing size (4096) at non-singleton dimension 3. Target sizes: [65, 32, 512, 4608]. Tensor sizes: [65, 1, 512, 4096]\r\nBut earlier versions of transformers would not happen this. So I set transformers==4.36.2.","shortMessageHtmlLink":"Fix transformers version (#156)"}},{"before":"178e5223f95942d8f3242ad587dc8d91d8c9b700","after":"79019832efd37e4c24a695442880190858aa605e","ref":"refs/heads/main","pushedAt":"2024-03-11T14:27:03.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"Fix transformers version (#156)\n\nWhen running AWQ search foe Llama2 with transformers>=4.38.0, I find the bug below:\r\nFile \"/×××/llm-awq/awq/quantize/auto_scale.py\", line 134, in _search_module_scale\r\nRuntimeError: The expanded size of the tensor (4608) must match the existing size (4096) at non-singleton dimension 3. Target sizes: [65, 32, 512, 4608]. Tensor sizes: [65, 1, 512, 4096]\r\nBut earlier versions of transformers would not happen this. So I set transformers==4.36.2.","shortMessageHtmlLink":"Fix transformers version (#156)"}},{"before":"1afc982ff2cc491e803e48e8ba151f130b49636b","after":null,"ref":"refs/heads/dev/update_speed_0304","pushedAt":"2024-03-11T04:05:29.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"}},{"before":"f40ffa52daec066630b21e6b01ec497e7fddf89d","after":"178e5223f95942d8f3242ad587dc8d91d8c9b700","ref":"refs/heads/main","pushedAt":"2024-03-11T04:05:20.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"Update TinyChat Speed for VILA (#150)","shortMessageHtmlLink":"Update TinyChat Speed for VILA (#150)"}},{"before":"f40ffa52daec066630b21e6b01ec497e7fddf89d","after":"1afc982ff2cc491e803e48e8ba151f130b49636b","ref":"refs/heads/dev/update_speed_0304","pushedAt":"2024-03-04T19:05:44.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"Update TinyChat Speed for VILA","shortMessageHtmlLink":"Update TinyChat Speed for VILA"}},{"before":null,"after":"f40ffa52daec066630b21e6b01ec497e7fddf89d","ref":"refs/heads/dev/update_speed_0304","pushedAt":"2024-03-04T16:07:00.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ys-2020","name":"Shang Yang","path":"/ys-2020","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/61508922?s=80&v=4"},"commit":{"message":"[Minor] Update news. (#149)\n\n* [Minor] Update README.md\r\n\r\n* Update README.md\r\n\r\n---------\r\n\r\nCo-authored-by: Haotian (Ken) Tang ","shortMessageHtmlLink":"[Minor] Update news. (#149)"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEQt0IDQA","startCursor":null,"endCursor":null}},"title":"Activity · mit-han-lab/llm-awq"}