{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":731842419,"defaultBranch":"main","name":"PowerInfer","ownerLogin":"SJTU-IPADS","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-12-15T02:24:10.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/10797537?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1712629852.0","currentOid":""},"activityList":{"items":[{"before":"906830b3c6f2c10d0ee2291b7f7d65f4ca930b74","after":"3f638f7ba07915310d7e97a957ebb6737d504414","ref":"refs/heads/main","pushedAt":"2024-05-20T05:27:36.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"Support AMD ROCm(#187)\n\n* Q4_Update\r\n\r\n* AMD_Support\r\n\r\n* competition\r\n\r\n* competition_add\r\n\r\n* Delete test.sh\r\n\r\n* Update README.md\r\n\r\n* Update ggml-cuda.cu\r\n\r\nCo-authored-by: Holden X \r\n\r\n* Update ggml-cuda.cu\r\n\r\nCo-authored-by: Holden X \r\n\r\n* AMD_Support_1\r\n\r\n---------\r\n\r\nCo-authored-by: Holden X ","shortMessageHtmlLink":"Support AMD ROCm(#187)"}},{"before":"10a006bd5272634e8f3a99a40dc4db742433834d","after":"a915f9a5898a9188d6df5aef15e7b632e8041eeb","ref":"refs/heads/fix/vram-budget-inaccuracy","pushedAt":"2024-04-29T11:08:46.000Z","pushType":"push","commitsCount":8,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"wip","shortMessageHtmlLink":"wip"}},{"before":"906830b3c6f2c10d0ee2291b7f7d65f4ca930b74","after":"10a006bd5272634e8f3a99a40dc4db742433834d","ref":"refs/heads/fix/vram-budget-inaccuracy","pushedAt":"2024-04-12T01:57:49.000Z","pushType":"push","commitsCount":4,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"wip alloc tensor weights after first graph built","shortMessageHtmlLink":"wip alloc tensor weights after first graph built"}},{"before":null,"after":"906830b3c6f2c10d0ee2291b7f7d65f4ca930b74","ref":"refs/heads/fix/vram-budget-inaccuracy","pushedAt":"2024-04-09T02:30:52.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"fix: offload ffn norm weights (#179)","shortMessageHtmlLink":"fix: offload ffn norm weights (#179)"}},{"before":"3d90d1f7be75c704c80387db6d7d8922cb7ba4d1","after":"09d79ec0ac0c1d494cdf535504c6712294c359c1","ref":"refs/heads/feat-moe","pushedAt":"2024-04-09T02:30:19.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"minimal impl. of gpu_idx generation for moe model","shortMessageHtmlLink":"minimal impl. of gpu_idx generation for moe model"}},{"before":"0e834efb19df7b9f7b365b94c873854a8e287a23","after":"3d90d1f7be75c704c80387db6d7d8922cb7ba4d1","ref":"refs/heads/feat-moe","pushedAt":"2024-04-07T08:48:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"offload qwen2moe to gpu","shortMessageHtmlLink":"offload qwen2moe to gpu"}},{"before":"b478398c589928b1bd883e5a827882579873d250","after":"906830b3c6f2c10d0ee2291b7f7d65f4ca930b74","ref":"refs/heads/main","pushedAt":"2024-04-07T02:33:23.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"fix: offload ffn norm weights (#179)","shortMessageHtmlLink":"fix: offload ffn norm weights (#179)"}},{"before":null,"after":"38ce80a2a7de029a55ad9095cb51e2c2ed88ec16","ref":"refs/heads/fix/offload-ffn-norm","pushedAt":"2024-04-07T02:30:20.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"fix: offload ffn norm weights","shortMessageHtmlLink":"fix: offload ffn norm weights"}},{"before":"c605934b7de120e8ba7381f91953d72fb3c77810","after":"0e834efb19df7b9f7b365b94c873854a8e287a23","ref":"refs/heads/feat-moe","pushedAt":"2024-04-03T14:56:31.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"CPU run correctly","shortMessageHtmlLink":"CPU run correctly"}},{"before":"0183bcef8999d5e713ec66cfe8f3e6405236b546","after":"c605934b7de120e8ba7381f91953d72fb3c77810","ref":"refs/heads/feat-moe","pushedAt":"2024-04-03T14:51:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"WIP:support qwen2","shortMessageHtmlLink":"WIP:support qwen2"}},{"before":"eb45354a656ba4f3b8b3cc14dada7348a9a5ac0e","after":"0183bcef8999d5e713ec66cfe8f3e6405236b546","ref":"refs/heads/feat-moe","pushedAt":"2024-04-03T13:41:30.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"fix cpu bugs","shortMessageHtmlLink":"fix cpu bugs"}},{"before":"db0977955316f91db6dc7e03af600b81342a63f2","after":"eb45354a656ba4f3b8b3cc14dada7348a9a5ac0e","ref":"refs/heads/feat-moe","pushedAt":"2024-04-02T17:39:32.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"minor: code clearnup","shortMessageHtmlLink":"minor: code clearnup"}},{"before":"54e5482a9c61d34dc1775d1ab175b84bc99ca8fa","after":"db0977955316f91db6dc7e03af600b81342a63f2","ref":"refs/heads/feat-moe","pushedAt":"2024-04-02T17:34:12.000Z","pushType":"push","commitsCount":10,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"fix: bugs in new ffn spliting","shortMessageHtmlLink":"fix: bugs in new ffn spliting"}},{"before":"0c051b064c282494c37ad175735619ba1fbe7c80","after":null,"ref":"refs/heads/fix/sparse-ffn-seq","pushedAt":"2024-04-02T06:35:52.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"}},{"before":"fb91425f3a77f5aa6d9b642d17952f9a9bfbf733","after":null,"ref":"refs/heads/fix/axpy-dense","pushedAt":"2024-04-02T06:35:52.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"}},{"before":"c8e15df7267f7b3b55e47ddf3fb995733e01ba0c","after":"b478398c589928b1bd883e5a827882579873d250","ref":"refs/heads/main","pushedAt":"2024-04-02T06:35:08.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"Remove axpy dense op (#177)","shortMessageHtmlLink":"Remove axpy dense op (#177)"}},{"before":"b25cb86b0ba9b72af8bf6900a869f7238e876e1d","after":"c8e15df7267f7b3b55e47ddf3fb995733e01ba0c","ref":"refs/heads/main","pushedAt":"2024-04-02T06:34:23.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"hotfix: failed to build ffn with LLM_GATE_SEQ (#178)","shortMessageHtmlLink":"hotfix: failed to build ffn with LLM_GATE_SEQ (#178)"}},{"before":null,"after":"0c051b064c282494c37ad175735619ba1fbe7c80","ref":"refs/heads/fix/sparse-ffn-seq","pushedAt":"2024-04-02T06:25:22.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"hotfix: failed to build ffn with LLM_GATE_SEQ","shortMessageHtmlLink":"hotfix: failed to build ffn with LLM_GATE_SEQ"}},{"before":null,"after":"fb91425f3a77f5aa6d9b642d17952f9a9bfbf733","ref":"refs/heads/fix/axpy-dense","pushedAt":"2024-04-02T04:54:44.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"Remove axpy dense op","shortMessageHtmlLink":"Remove axpy dense op"}},{"before":null,"after":"54e5482a9c61d34dc1775d1ab175b84bc99ca8fa","ref":"refs/heads/feat-moe","pushedAt":"2024-04-01T17:42:15.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"fix merge faults and compatibility issues","shortMessageHtmlLink":"fix merge faults and compatibility issues"}},{"before":"c3d2968cf9ffd4cabe48319299112068105f12f0","after":"84c334512e904ac7a2c8c63696c5a4cdf083b7dd","ref":"refs/heads/moe-dense","pushedAt":"2024-04-01T02:17:47.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"fix computation graph","shortMessageHtmlLink":"fix computation graph"}},{"before":"c2ab47db98366b1573202275b06aa8fe4473a3fd","after":"c3d2968cf9ffd4cabe48319299112068105f12f0","ref":"refs/heads/moe-dense","pushedAt":"2024-03-31T18:31:36.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"fix: tensor dim","shortMessageHtmlLink":"fix: tensor dim"}},{"before":null,"after":"c2ab47db98366b1573202275b06aa8fe4473a3fd","ref":"refs/heads/moe-dense","pushedAt":"2024-03-31T18:24:03.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"fix: model loading for dense moe","shortMessageHtmlLink":"fix: model loading for dense moe"}},{"before":"e1002f613564b025311a53214d3fc61177fe36ea","after":"4f126960dbe6a036c267d2203e78653f5473aa80","ref":"refs/heads/quantize-support","pushedAt":"2024-03-31T15:42:51.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"hodlen","name":"Holden X","path":"/hodlen","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34213478?s=80&v=4"},"commit":{"message":"fix syntax error","shortMessageHtmlLink":"fix syntax error"}},{"before":"e2b668dec8599716a2906804cd880d2312df0a5e","after":"e1002f613564b025311a53214d3fc61177fe36ea","ref":"refs/heads/quantize-support","pushedAt":"2024-03-31T11:10:09.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"minor","shortMessageHtmlLink":"minor"}},{"before":"7a04b460518cbe9ec105dacdfb07e8c0884d6507","after":"e2b668dec8599716a2906804cd880d2312df0a5e","ref":"refs/heads/quantize-support","pushedAt":"2024-03-31T10:21:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"minor","shortMessageHtmlLink":"minor"}},{"before":"86f66617cdff29b1b10a0cb483576a44e1f2c8c6","after":"7a04b460518cbe9ec105dacdfb07e8c0884d6507","ref":"refs/heads/quantize-support","pushedAt":"2024-03-31T10:10:43.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"q5_1 support","shortMessageHtmlLink":"q5_1 support"}},{"before":"1848cc29d43e30404c03c63831dbdb8958730419","after":"86f66617cdff29b1b10a0cb483576a44e1f2c8c6","ref":"refs/heads/quantize-support","pushedAt":"2024-03-31T09:37:20.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"q5 support","shortMessageHtmlLink":"q5 support"}},{"before":"450d36f2be460e77f9876673c722125c25bbca76","after":"1848cc29d43e30404c03c63831dbdb8958730419","ref":"refs/heads/quantize-support","pushedAt":"2024-03-31T08:43:57.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"support q5_0 for cpu","shortMessageHtmlLink":"support q5_0 for cpu"}},{"before":"d7c074ea2b3ddb1725bc6d63b848ff53391594e9","after":"450d36f2be460e77f9876673c722125c25bbca76","ref":"refs/heads/quantize-support","pushedAt":"2024-03-31T08:16:02.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"YixinSong-e","name":"Jeremy Song","path":"/YixinSong-e","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/76689794?s=80&v=4"},"commit":{"message":"support q4_1","shortMessageHtmlLink":"support q4_1"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAETnEYeAA","startCursor":null,"endCursor":null}},"title":"Activity ยท SJTU-IPADS/PowerInfer"}