{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":806950549,"defaultBranch":"main","name":"CUDA_kernels","ownerLogin":"tkob-vh","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2024-05-28T08:01:26.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/107342170?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1716883286.0","currentOid":""},"activityList":{"items":[{"before":"3c4204bb6b144c8dde7ab3bdb06fa6e84f6e4248","after":"dbc050f2cd5a0526e8c3fb8a92198edac0359669","ref":"refs/heads/main","pushedAt":"2024-07-28T05:21:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: Add 3 versions of reduction kernel","shortMessageHtmlLink":"feat: Add 3 versions of reduction kernel"}},{"before":"f14c6e3f0b15069208aa69662ad642d6177f8a0f","after":"3c4204bb6b144c8dde7ab3bdb06fa6e84f6e4248","ref":"refs/heads/main","pushedAt":"2024-07-27T16:13:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"refactor: Change the format of histogram","shortMessageHtmlLink":"refactor: Change the format of histogram"}},{"before":"a87dd562c96edceb53974cf37b51273f1a2c179a","after":"f14c6e3f0b15069208aa69662ad642d6177f8a0f","ref":"refs/heads/main","pushedAt":"2024-07-27T08:51:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"refactor: Change the format of Stencil","shortMessageHtmlLink":"refactor: Change the format of Stencil"}},{"before":"105c892e41631c3200bf1f32382b814f83c9f06c","after":"a87dd562c96edceb53974cf37b51273f1a2c179a","ref":"refs/heads/main","pushedAt":"2024-07-27T08:23:48.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"refactor: Change the format of Convolution","shortMessageHtmlLink":"refactor: Change the format of Convolution"}},{"before":"734920b1d6339a1a37a8864ba905afba42828adc","after":"105c892e41631c3200bf1f32382b814f83c9f06c","ref":"refs/heads/main","pushedAt":"2024-07-24T13:07:24.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"refactor: Change the format of GEMM","shortMessageHtmlLink":"refactor: Change the format of GEMM"}},{"before":"0dabe1a7e5841da04181b11ce837262f4662f7e5","after":"734920b1d6339a1a37a8864ba905afba42828adc","ref":"refs/heads/main","pushedAt":"2024-07-22T15:40:57.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"refactor: Change the sturcture of the directory","shortMessageHtmlLink":"refactor: Change the sturcture of the directory"}},{"before":"0eeecad4d0805681bba21bad4cffc3619b1add31","after":"0dabe1a7e5841da04181b11ce837262f4662f7e5","ref":"refs/heads/main","pushedAt":"2024-07-20T06:36:44.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: Add aggregation to parallel histogram","shortMessageHtmlLink":"feat: Add aggregation to parallel histogram"}},{"before":"d72e66624d7a93dc55679a8092cf7925b42b3de9","after":"0eeecad4d0805681bba21bad4cffc3619b1add31","ref":"refs/heads/main","pushedAt":"2024-07-20T06:19:40.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: Add thread coarsening for parallel histogram","shortMessageHtmlLink":"feat: Add thread coarsening for parallel histogram"}},{"before":"7220c381ff2ee779935953f6a6b6925a87a79614","after":"d72e66624d7a93dc55679a8092cf7925b42b3de9","ref":"refs/heads/main","pushedAt":"2024-06-28T15:48:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"fix: fix slurm script to use ncu","shortMessageHtmlLink":"fix: fix slurm script to use ncu"}},{"before":"e3f32718aed764a32453e431bc8fe4d3b70be919","after":"7220c381ff2ee779935953f6a6b6925a87a79614","ref":"refs/heads/main","pushedAt":"2024-06-28T08:57:57.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"fix: fix makefile and gitignore, reduce redundant computations","shortMessageHtmlLink":"fix: fix makefile and gitignore, reduce redundant computations"}},{"before":"59516babb9e49e7a7b13d3597a20ce3176a69462","after":"e3f32718aed764a32453e431bc8fe4d3b70be919","ref":"refs/heads/main","pushedAt":"2024-06-27T16:16:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"fix: fix makefile","shortMessageHtmlLink":"fix: fix makefile"}},{"before":"2242691ce268a0078921501e9a3f5dfbdec904f0","after":"59516babb9e49e7a7b13d3597a20ce3176a69462","ref":"refs/heads/main","pushedAt":"2024-06-27T16:00:48.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: unroll some loops","shortMessageHtmlLink":"feat: unroll some loops"}},{"before":"81b926a2bb6909ef3a86ab84a3acac3a2e132fa4","after":"2242691ce268a0078921501e9a3f5dfbdec904f0","ref":"refs/heads/main","pushedAt":"2024-06-27T15:44:37.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: implement 1D shared memory, with some bugs","shortMessageHtmlLink":"feat: implement 1D shared memory, with some bugs"}},{"before":"520148d2dbdde5ebbd4ef58cc07391c5a1d12336","after":"81b926a2bb6909ef3a86ab84a3acac3a2e132fa4","ref":"refs/heads/main","pushedAt":"2024-06-27T07:02:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: update slurm script","shortMessageHtmlLink":"feat: update slurm script"}},{"before":"fd050df3eb18fc7af1325418aa66c99c60a8f5d8","after":"520148d2dbdde5ebbd4ef58cc07391c5a1d12336","ref":"refs/heads/main","pushedAt":"2024-06-25T14:38:20.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: update .gitignore","shortMessageHtmlLink":"feat: update .gitignore"}},{"before":"8cfc0c498da8980331953ec9d26436a0af099069","after":"fd050df3eb18fc7af1325418aa66c99c60a8f5d8","ref":"refs/heads/main","pushedAt":"2024-06-18T13:48:42.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: fine-tune the Z_ITER block size to improve the occupancy.","shortMessageHtmlLink":"feat: fine-tune the Z_ITER block size to improve the occupancy."}},{"before":"24df7fa1c56615621526591d83013694d360882b","after":"8cfc0c498da8980331953ec9d26436a0af099069","ref":"refs/heads/main","pushedAt":"2024-06-18T08:09:41.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: fine-tune the Z_ITER size","shortMessageHtmlLink":"feat: fine-tune the Z_ITER size"}},{"before":"720157657d7892781109395d05b9d9022c903240","after":"24df7fa1c56615621526591d83013694d360882b","ref":"refs/heads/main","pushedAt":"2024-06-18T07:48:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: use shared memory to speed up calculation.","shortMessageHtmlLink":"feat: use shared memory to speed up calculation."}},{"before":"f0e66391de38fde5abef763898fac6a26aa23569","after":"720157657d7892781109395d05b9d9022c903240","ref":"refs/heads/main","pushedAt":"2024-06-17T07:04:25.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: change the naive version to improve memory throughput","shortMessageHtmlLink":"feat: change the naive version to improve memory throughput"}},{"before":"0b5371ff9affa4d06c313ff6f4e2e10668fea37d","after":"f0e66391de38fde5abef763898fac6a26aa23569","ref":"refs/heads/main","pushedAt":"2024-06-14T09:09:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: implement naive conway game of life","shortMessageHtmlLink":"feat: implement naive conway game of life"}},{"before":"1637040e681562f65796e28d3b22cb34f8fb329f","after":"0b5371ff9affa4d06c313ff6f4e2e10668fea37d","ref":"refs/heads/main","pushedAt":"2024-06-14T07:57:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: add official version of conway game of life","shortMessageHtmlLink":"feat: add official version of conway game of life"}},{"before":"e92c645dfc96bc0bddd2183683f2f9972818577f","after":"1637040e681562f65796e28d3b22cb34f8fb329f","ref":"refs/heads/main","pushedAt":"2024-06-13T15:21:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: add baseline of Conway game of life (3D version)","shortMessageHtmlLink":"feat: add baseline of Conway game of life (3D version)"}},{"before":"8c01264a56fe7f760ed285ee513275bb650f43b5","after":"e92c645dfc96bc0bddd2183683f2f9972818577f","ref":"refs/heads/main","pushedAt":"2024-06-12T12:21:35.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: implement parallel histogram with shared memory and privatization","shortMessageHtmlLink":"feat: implement parallel histogram with shared memory and privatization"}},{"before":"c29e66ad4ca772197ebda813a649d65b72d0775e","after":"8c01264a56fe7f760ed285ee513275bb650f43b5","ref":"refs/heads/main","pushedAt":"2024-06-11T14:08:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: implement naive parallel histogram using cuda","shortMessageHtmlLink":"feat: implement naive parallel histogram using cuda"}},{"before":"1e10492d4c939c2fea0ce74901f0f0469c7965fd","after":"c29e66ad4ca772197ebda813a649d65b72d0775e","ref":"refs/heads/main","pushedAt":"2024-06-10T09:12:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: finish stencil with shared memory, thread coarsening and register tiling","shortMessageHtmlLink":"feat: finish stencil with shared memory, thread coarsening and regist…"}},{"before":"4c260bbfa4d4f4de7e0cd89cb8d59dac2829392b","after":"1e10492d4c939c2fea0ce74901f0f0469c7965fd","ref":"refs/heads/main","pushedAt":"2024-06-10T07:58:21.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: finish stencil with shared memory and thread coarsening","shortMessageHtmlLink":"feat: finish stencil with shared memory and thread coarsening"}},{"before":"8ddd2698ad763470073f4e416f932abe6d8628a8","after":"4c260bbfa4d4f4de7e0cd89cb8d59dac2829392b","ref":"refs/heads/main","pushedAt":"2024-06-09T13:05:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: finish stencil with shared memory","shortMessageHtmlLink":"feat: finish stencil with shared memory"}},{"before":"ac969d5be61b933a60a69781cbdb443531dd2348","after":"8ddd2698ad763470073f4e416f932abe6d8628a8","ref":"refs/heads/main","pushedAt":"2024-06-08T14:21:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"feat: implement naive stencil cuda kernel","shortMessageHtmlLink":"feat: implement naive stencil cuda kernel"}},{"before":"6a0dcf21b1e86fa42a81bca3f386d5ca0cde5e87","after":"ac969d5be61b933a60a69781cbdb443531dd2348","ref":"refs/heads/main","pushedAt":"2024-06-03T15:15:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"fix: fix some problems in convolution_v2","shortMessageHtmlLink":"fix: fix some problems in convolution_v2"}},{"before":"fbb71195151dd7fc9b3f46ad3441f8cffca34f40","after":"6a0dcf21b1e86fa42a81bca3f386d5ca0cde5e87","ref":"refs/heads/main","pushedAt":"2024-06-02T11:34:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"tkob-vh","name":"Yuxin Yan","path":"/tkob-vh","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/107342170?s=80&v=4"},"commit":{"message":"fix: fix some problems in convolution_v2","shortMessageHtmlLink":"fix: fix some problems in convolution_v2"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEiwAPVwA","startCursor":null,"endCursor":null}},"title":"Activity · tkob-vh/CUDA_kernels"}