{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":141401060,"defaultBranch":"master","name":"how-to-optim-algorithm-in-cuda","ownerLogin":"BBuf","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2018-07-18T07:55:40.000Z","ownerAvatar":"https://github.com/avatars/u/35585791?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1531900989.0","currentOid":""},"activityList":{"items":[{"before":"f1ac17aa257d9205fde30ae054838d64108cdbef","after":"a5b9bd8eff1e19be34d3a582243bc1db767ac39e","ref":"refs/heads/master","pushedAt":"2024-08-08T14:18:57.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"add TensorRT-LLM 中的 Hopper Mixed GEMM 的 CUTLASS 3.x 实现讲解.md","shortMessageHtmlLink":"add TensorRT-LLM 中的 Hopper Mixed GEMM 的 CUTLASS 3.x 实现讲解.md"}},{"before":"3e0a6d2a06ab399f0e8e4fc3c82c3b0f9a6b469c","after":"f1ac17aa257d9205fde30ae054838d64108cdbef","ref":"refs/heads/master","pushedAt":"2024-08-05T16:02:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"end Lecture 8 CUDA Performance Checklist.md","shortMessageHtmlLink":"end Lecture 8 CUDA Performance Checklist.md"}},{"before":"facebf3f960061879f9b25e74702202315cca485","after":"3e0a6d2a06ab399f0e8e4fc3c82c3b0f9a6b469c","ref":"refs/heads/master","pushedAt":"2024-08-05T15:18:12.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"end Lecture 8 CUDA Performance Checklist.md","shortMessageHtmlLink":"end Lecture 8 CUDA Performance Checklist.md"}},{"before":"9d395918bcd61dd83b9df0aea545bd6b8e93aaef","after":"facebf3f960061879f9b25e74702202315cca485","ref":"refs/heads/master","pushedAt":"2024-08-04T14:53:29.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"add Lecture 8 CUDA Performance Checklist.md","shortMessageHtmlLink":"add Lecture 8 CUDA Performance Checklist.md"}},{"before":"37646cbeb81fd1faae113c9568565e2b4602c4a5","after":"9d395918bcd61dd83b9df0aea545bd6b8e93aaef","ref":"refs/heads/master","pushedAt":"2024-08-03T14:13:41.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"add Lecture 8_ CUDA Performance.pptx","shortMessageHtmlLink":"add Lecture 8_ CUDA Performance.pptx"}},{"before":"06ec853284e5ff9ac4257a1248211d22c9e7aa96","after":"37646cbeb81fd1faae113c9568565e2b4602c4a5","ref":"refs/heads/master","pushedAt":"2024-08-02T11:05:44.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"update readme","shortMessageHtmlLink":"update readme"}},{"before":"daab856d3692b692db721948f9ba535985c922c2","after":"06ec853284e5ff9ac4257a1248211d22c9e7aa96","ref":"refs/heads/master","pushedAt":"2024-08-01T14:16:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"end TensorRT-LLM中的 Quantization GEMM(Ampere Mixed GEMM)的 CUTLASS 2.x 实现讲解.md","shortMessageHtmlLink":"end TensorRT-LLM中的 Quantization GEMM(Ampere Mixed GEMM)的 CUTLASS 2.x …"}},{"before":"840f24ab21630af3265f135c82d48f33d38b46ff","after":"daab856d3692b692db721948f9ba535985c922c2","ref":"refs/heads/master","pushedAt":"2024-07-31T14:58:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"update TensorRT-LLM中的 Quantization GEMM(Ampere Mixed GEMM)的 CUTLASS 2.x 实现讲解.md","shortMessageHtmlLink":"update TensorRT-LLM中的 Quantization GEMM(Ampere Mixed GEMM)的 CUTLASS 2…"}},{"before":"1b4ba1d15f0a095ff3c2a91363bccb9c8d9e63b9","after":"840f24ab21630af3265f135c82d48f33d38b46ff","ref":"refs/heads/master","pushedAt":"2024-07-29T10:56:09.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"add TensorRT-LLM中的 Quantization GEMM(Ampere Mixed GEMM)的 CUTLASS 2.x 实现讲解.md","shortMessageHtmlLink":"add TensorRT-LLM中的 Quantization GEMM(Ampere Mixed GEMM)的 CUTLASS 2.x …"}},{"before":"42b3177f6363e1236679452a92a165b82fcc805c","after":"1b4ba1d15f0a095ff3c2a91363bccb9c8d9e63b9","ref":"refs/heads/master","pushedAt":"2024-07-26T14:31:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"update Lecture 7 Quantization Cuda vs Triton.md","shortMessageHtmlLink":"update Lecture 7 Quantization Cuda vs Triton.md"}},{"before":"20bfa9f09dfbd29f30c75717b164cace6f4623b9","after":"42b3177f6363e1236679452a92a165b82fcc805c","ref":"refs/heads/master","pushedAt":"2024-07-24T14:25:30.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"update Lecture 7 Quantization Cuda vs Triton.md","shortMessageHtmlLink":"update Lecture 7 Quantization Cuda vs Triton.md"}},{"before":"46ddb1a342b16b1dd1c289b33fe0087562e90af2","after":"20bfa9f09dfbd29f30c75717b164cace6f4623b9","ref":"refs/heads/master","pushedAt":"2024-07-23T12:23:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"end CUTLASS 2.x & CUTLASS 3.x Intro 学习笔记.md","shortMessageHtmlLink":"end CUTLASS 2.x & CUTLASS 3.x Intro 学习笔记.md"}},{"before":"8c0c9b37cb569f6b5a5a17b7622cb6a6e7449182","after":"46ddb1a342b16b1dd1c289b33fe0087562e90af2","ref":"refs/heads/master","pushedAt":"2024-07-22T12:06:08.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"update CUTLASS 2.x & CUTLASS 3.x Intro 学习笔记.md","shortMessageHtmlLink":"update CUTLASS 2.x & CUTLASS 3.x Intro 学习笔记.md"}},{"before":"b50321af4368099309a14ae95fb5e553736d3bb5","after":"8c0c9b37cb569f6b5a5a17b7622cb6a6e7449182","ref":"refs/heads/master","pushedAt":"2024-07-20T16:10:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"add CUTLASS 2.x & CUTLASS 3.x Intro 学习笔记.md","shortMessageHtmlLink":"add CUTLASS 2.x & CUTLASS 3.x Intro 学习笔记.md"}},{"before":"1b994f9c5b64918a3b4b0590d1603757921d1d5e","after":"b50321af4368099309a14ae95fb5e553736d3bb5","ref":"refs/heads/master","pushedAt":"2024-07-20T02:13:48.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"finish add NVIDIA AI 加速精讲堂-TensorRT-LLM 应用与部署.md slides","shortMessageHtmlLink":"finish add NVIDIA AI 加速精讲堂-TensorRT-LLM 应用与部署.md slides"}},{"before":"476819bb018b0ad589e6b16541c720f34c73501a","after":"1b994f9c5b64918a3b4b0590d1603757921d1d5e","ref":"refs/heads/master","pushedAt":"2024-07-19T15:41:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"add NVIDIA AI 加速精讲堂-TensorRT-LLM 应用与部署.md","shortMessageHtmlLink":"add NVIDIA AI 加速精讲堂-TensorRT-LLM 应用与部署.md"}},{"before":"e45cb5dd4af8e6b8aa284948e929da97f2ebb764","after":"476819bb018b0ad589e6b16541c720f34c73501a","ref":"refs/heads/master","pushedAt":"2024-07-18T09:26:18.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"fix typo","shortMessageHtmlLink":"fix typo"}},{"before":"e09049b1d1d815a72469617c13ccafce03ebf7f3","after":"e45cb5dd4af8e6b8aa284948e929da97f2ebb764","ref":"refs/heads/master","pushedAt":"2024-07-18T09:04:56.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"finish Lecture 6 Optimizing Optimizer","shortMessageHtmlLink":"finish Lecture 6 Optimizing Optimizer"}},{"before":"e5ff1c165dd3931e10ea8135406ecea352771216","after":"e09049b1d1d815a72469617c13ccafce03ebf7f3","ref":"refs/heads/master","pushedAt":"2024-07-17T13:41:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"Update Lecture 6 Optimizing Optimizer","shortMessageHtmlLink":"Update Lecture 6 Optimizing Optimizer"}},{"before":"a5b027ae27e4ecdc4488bce751480811b916cdc9","after":"e5ff1c165dd3931e10ea8135406ecea352771216","ref":"refs/heads/master","pushedAt":"2024-07-14T15:52:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"add Lecture 6 Optimizing Optimizer.md","shortMessageHtmlLink":"add Lecture 6 Optimizing Optimizer.md"}},{"before":"832ef6b4a58e62eb86b4488d26d6ef427ab757c7","after":"a5b027ae27e4ecdc4488bce751480811b916cdc9","ref":"refs/heads/master","pushedAt":"2024-07-12T15:18:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"add lecture15 cutlass","shortMessageHtmlLink":"add lecture15 cutlass"}},{"before":"568c80a87749e7b67ea53bed28fbb5f3a67cc4f3","after":"832ef6b4a58e62eb86b4488d26d6ef427ab757c7","ref":"refs/heads/master","pushedAt":"2024-07-11T15:13:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"update cuda-model lecture4","shortMessageHtmlLink":"update cuda-model lecture4"}},{"before":"d64c9a03ebf3fddd09bb31b7d15d13e42ae1a6ed","after":"568c80a87749e7b67ea53bed28fbb5f3a67cc4f3","ref":"refs/heads/master","pushedAt":"2024-07-11T10:03:02.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"restruct structure","shortMessageHtmlLink":"restruct structure"}},{"before":"09ee13a7ca1c3556142afd1edff2181cbfad45db","after":"d64c9a03ebf3fddd09bb31b7d15d13e42ae1a6ed","ref":"refs/heads/master","pushedAt":"2024-07-08T15:16:33.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"update Lecture 4 Ch4-5 PMPP book.md","shortMessageHtmlLink":"update Lecture 4 Ch4-5 PMPP book.md"}},{"before":"c704a9b629188428ccbacad936cb4136a760bc21","after":"09ee13a7ca1c3556142afd1edff2181cbfad45db","ref":"refs/heads/master","pushedAt":"2024-07-07T15:37:43.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"lecture 4 update","shortMessageHtmlLink":"lecture 4 update"}},{"before":"7993e3cdab515d9ed4af6d9b2e5c0a666f0a54fb","after":"c704a9b629188428ccbacad936cb4136a760bc21","ref":"refs/heads/master","pushedAt":"2024-07-06T09:28:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"lecture 2 complete","shortMessageHtmlLink":"lecture 2 complete"}},{"before":"15c8b57316b08ad0bf3b967becfd523f42ee6814","after":"7993e3cdab515d9ed4af6d9b2e5c0a666f0a54fb","ref":"refs/heads/master","pushedAt":"2024-07-05T12:50:18.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"update articles","shortMessageHtmlLink":"update articles"}},{"before":"ad49a01e23c87cff5194db72114a25f4d2eafd9e","after":"15c8b57316b08ad0bf3b967becfd523f42ee6814","ref":"refs/heads/master","pushedAt":"2024-07-04T15:04:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"update","shortMessageHtmlLink":"update"}},{"before":"63b2196e801ad6713a8907dbdb088ced9318baf1","after":"ad49a01e23c87cff5194db72114a25f4d2eafd9e","ref":"refs/heads/master","pushedAt":"2024-07-04T10:12:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"update cuda-mode lecture2","shortMessageHtmlLink":"update cuda-mode lecture2"}},{"before":"b487870b6715616f348b20d1f69f3955dc0001ad","after":"63b2196e801ad6713a8907dbdb088ced9318baf1","ref":"refs/heads/master","pushedAt":"2024-07-02T15:01:30.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"BBuf","name":"Xiaoyu Zhang","path":"/BBuf","primaryAvatarUrl":"https://github.com/avatars/u/35585791?s=80&v=4"},"commit":{"message":"update Lecture 2 Ch1-3 PMPP book.md","shortMessageHtmlLink":"update Lecture 2 Ch1-3 PMPP book.md"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAElVevEQA","startCursor":null,"endCursor":null}},"title":"Activity · BBuf/how-to-optim-algorithm-in-cuda"}