{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":599547518,"defaultBranch":"main","name":"vllm","ownerLogin":"vllm-project","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-02-09T11:23:20.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/136984999?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1717286493.0","currentOid":""},"activityList":{"items":[{"before":"f790ad3c50f050778af1fd31170746b7c68ca2fc","after":"a66cf40b205d57ac1b5dc96b6bb6f8e813b18316","ref":"refs/heads/main","pushedAt":"2024-06-02T21:13:26.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"pcmoritz","name":"Philipp Moritz","path":"/pcmoritz","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/113316?s=80&v=4"},"commit":{"message":"[Kernel][ROCm][AMD] enable fused topk_softmax kernel for moe layer (#4927)\n\nThis PR enables the fused topk_softmax kernel used in moe layer for HIP","shortMessageHtmlLink":"[Kernel][ROCm][AMD] enable fused topk_softmax kernel for moe layer (#…"}},{"before":"ed59a7ed23c6e91096ea82b03037e40b14b5375c","after":"f790ad3c50f050778af1fd31170746b7c68ca2fc","ref":"refs/heads/main","pushedAt":"2024-06-02T08:06:13.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"DarkLight1337","name":"Cyrus Leung","path":"/DarkLight1337","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/44970335?s=80&v=4"},"commit":{"message":"[Frontend][OpenAI] Support for returning max_model_len on /v1/models response (#4643)","shortMessageHtmlLink":"[Frontend][OpenAI] Support for returning max_model_len on /v1/models …"}},{"before":"044793d8df6aeb5326b5992d0e60aa4457760e8a","after":"ed59a7ed23c6e91096ea82b03037e40b14b5375c","ref":"refs/heads/main","pushedAt":"2024-06-02T02:21:53.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"DarkLight1337","name":"Cyrus Leung","path":"/DarkLight1337","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/44970335?s=80&v=4"},"commit":{"message":"Update test_ignore_eos (#4898)","shortMessageHtmlLink":"Update test_ignore_eos (#4898)"}},{"before":"996cf2de5cf7bc5aa7ab452c02ecda50e2d0cdcc","after":"1936d7bab00332047c444f04b7c01276e33cb8bb","ref":"refs/heads/fix-hashing-partial-blocks","pushedAt":"2024-06-02T00:02:56.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"zhuohan123","name":"Zhuohan Li","path":"/zhuohan123","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17310766?s=80&v=4"},"commit":{"message":"format","shortMessageHtmlLink":"format"}},{"before":null,"after":"996cf2de5cf7bc5aa7ab452c02ecda50e2d0cdcc","ref":"refs/heads/fix-hashing-partial-blocks","pushedAt":"2024-06-02T00:01:33.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"zhuohan123","name":"Zhuohan Li","path":"/zhuohan123","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17310766?s=80&v=4"},"commit":{"message":"Fix hashing logic for non-full blocks","shortMessageHtmlLink":"Fix hashing logic for non-full blocks"}},{"before":"c2d6d2f960176491e0499656409f30b947ee8027","after":"044793d8df6aeb5326b5992d0e60aa4457760e8a","ref":"refs/heads/main","pushedAt":"2024-06-01T23:35:41.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"mgoin","name":"Michael Goin","path":"/mgoin","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/3195154?s=80&v=4"},"commit":{"message":"[BugFix] Prevent `LLM.encode` for non-generation Models (#5184)\n\nCo-authored-by: mgoin ","shortMessageHtmlLink":"[BugFix] Prevent LLM.encode for non-generation Models (#5184)"}},{"before":"8279078e218833b357f7c5076850e3688714d570","after":"c2d6d2f960176491e0499656409f30b947ee8027","ref":"refs/heads/main","pushedAt":"2024-06-01T22:53:52.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"zhuohan123","name":"Zhuohan Li","path":"/zhuohan123","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17310766?s=80&v=4"},"commit":{"message":"[Bugfix]: Fix issues related to prefix caching example (#5177) (#5180)","shortMessageHtmlLink":"[Bugfix]: Fix issues related to prefix caching example (#5177) (#5180)"}},{"before":"b9c0605a8e7d558f595bd59ba6e6c95578dc0f1e","after":"8279078e218833b357f7c5076850e3688714d570","ref":"refs/heads/main","pushedAt":"2024-06-01T22:40:25.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"zhuohan123","name":"Zhuohan Li","path":"/zhuohan123","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17310766?s=80&v=4"},"commit":{"message":"[Bugfix] Remove deprecated @abstractproperty (#5174)","shortMessageHtmlLink":"[Bugfix] Remove deprecated @abstractproperty (#5174)"}},{"before":"37464a0f745a0204da7443d2a6ef4b8f65e5af12","after":"b9c0605a8e7d558f595bd59ba6e6c95578dc0f1e","ref":"refs/heads/main","pushedAt":"2024-06-01T20:51:11.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"mgoin","name":"Michael Goin","path":"/mgoin","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/3195154?s=80&v=4"},"commit":{"message":"[Feature][Kernel] Support bitsandbytes quantization and QLoRA (#4776)","shortMessageHtmlLink":"[Feature][Kernel] Support bitsandbytes quantization and QLoRA (#4776)"}},{"before":"c35407282878cb3a42860d584a4d9eb6aed82299","after":"37464a0f745a0204da7443d2a6ef4b8f65e5af12","ref":"refs/heads/main","pushedAt":"2024-06-01T17:18:50.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"DarkLight1337","name":"Cyrus Leung","path":"/DarkLight1337","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/44970335?s=80&v=4"},"commit":{"message":"[Bugfix] Fix call to init_logger in openai server (#4765)","shortMessageHtmlLink":"[Bugfix] Fix call to init_logger in openai server (#4765)"}},{"before":"f081c3ce4b020fb094e33575d178345c477ab0c6","after":"c35407282878cb3a42860d584a4d9eb6aed82299","ref":"refs/heads/main","pushedAt":"2024-06-01T17:11:22.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"DarkLight1337","name":"Cyrus Leung","path":"/DarkLight1337","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/44970335?s=80&v=4"},"commit":{"message":"[Minor] Fix the path typo in loader.py: save_sharded_states.py -> save_sharded_state.py (#5151)\n\nSigned-off-by: Ye Cao ","shortMessageHtmlLink":"[Minor] Fix the path typo in loader.py: save_sharded_states.py -> sav…"}},{"before":"260d119e864edbf023b1be7fa446a08bbea11f80","after":"f081c3ce4b020fb094e33575d178345c477ab0c6","ref":"refs/heads/main","pushedAt":"2024-06-01T08:46:07.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"[Kernel] Update Cutlass fp8 configs (#5144)\n\nCo-authored-by: Varun Sundar Rabindranath \r\nCo-authored-by: Robert Shaw <114415538+robertgshaw2-neuralmagic@users.noreply.github.com>","shortMessageHtmlLink":"[Kernel] Update Cutlass fp8 configs (#5144)"}},{"before":"9acace88ac2ed07dc8b680e1e71494945cb8c957","after":"2c6462c1bbe9331b1ec2a5c97e932e1bce2b0c41","ref":"refs/heads/remove-abstract-property","pushedAt":"2024-06-01T07:41:43.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"zhuohan123","name":"Zhuohan Li","path":"/zhuohan123","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17310766?s=80&v=4"},"commit":{"message":"fix import","shortMessageHtmlLink":"fix import"}},{"before":"7d1d09e459f365ddaa3b054cca5d83bf1c941008","after":"9acace88ac2ed07dc8b680e1e71494945cb8c957","ref":"refs/heads/remove-abstract-property","pushedAt":"2024-06-01T07:20:33.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"zhuohan123","name":"Zhuohan Li","path":"/zhuohan123","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17310766?s=80&v=4"},"commit":{"message":"fix","shortMessageHtmlLink":"fix"}},{"before":"a360ff80bb34f9dfcd21cf880c2030daa2d6b3a3","after":"7d1d09e459f365ddaa3b054cca5d83bf1c941008","ref":"refs/heads/remove-abstract-property","pushedAt":"2024-06-01T07:19:54.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"zhuohan123","name":"Zhuohan Li","path":"/zhuohan123","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17310766?s=80&v=4"},"commit":{"message":"Remove deprecated @abstractproperty","shortMessageHtmlLink":"Remove deprecated @abstractproperty"}},{"before":null,"after":"a360ff80bb34f9dfcd21cf880c2030daa2d6b3a3","ref":"refs/heads/remove-abstract-property","pushedAt":"2024-06-01T07:19:14.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"zhuohan123","name":"Zhuohan Li","path":"/zhuohan123","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17310766?s=80&v=4"},"commit":{"message":"[CI/Build] CMakeLists: build all extensions' cmake targets at the same time (#5034)","shortMessageHtmlLink":"[CI/Build] CMakeLists: build all extensions' cmake targets at the sam…"}},{"before":"a360ff80bb34f9dfcd21cf880c2030daa2d6b3a3","after":"260d119e864edbf023b1be7fa446a08bbea11f80","ref":"refs/heads/main","pushedAt":"2024-06-01T06:45:32.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"[Kernel] Refactor CUTLASS kernels to always take scales that reside on the GPU (#5137)","shortMessageHtmlLink":"[Kernel] Refactor CUTLASS kernels to always take scales that reside o…"}},{"before":"1197e02141df1a7442f21ff6922c98ec0bba153e","after":"a360ff80bb34f9dfcd21cf880c2030daa2d6b3a3","ref":"refs/heads/main","pushedAt":"2024-06-01T04:06:45.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"mgoin","name":"Michael Goin","path":"/mgoin","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/3195154?s=80&v=4"},"commit":{"message":"[CI/Build] CMakeLists: build all extensions' cmake targets at the same time (#5034)","shortMessageHtmlLink":"[CI/Build] CMakeLists: build all extensions' cmake targets at the sam…"}},{"before":"402b9478d3177b980ce638a4b80be4347501ceee","after":null,"ref":"refs/heads/gpt-bigcode-lora-doc","pushedAt":"2024-06-01T00:33:34.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"njhill","name":"Nick Hill","path":"/njhill","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/16958488?s=80&v=4"}},{"before":"657579113f714c2e74bca373ecfb6c2c245b4101","after":"1197e02141df1a7442f21ff6922c98ec0bba153e","ref":"refs/heads/main","pushedAt":"2024-06-01T00:21:39.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Build] Guard against older CUDA versions when building CUTLASS 3.x kernels (#5168)","shortMessageHtmlLink":"[Build] Guard against older CUDA versions when building CUTLASS 3.x k…"}},{"before":"e9899fb7a4d9e032198d26ef84f1dd2cfd9621aa","after":"657579113f714c2e74bca373ecfb6c2c245b4101","ref":"refs/heads/main","pushedAt":"2024-06-01T00:20:19.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Doc] Add checkmark for GPTBigCodeForCausalLM LoRA support (#5171)","shortMessageHtmlLink":"[Doc] Add checkmark for GPTBigCodeForCausalLM LoRA support (#5171)"}},{"before":null,"after":"402b9478d3177b980ce638a4b80be4347501ceee","ref":"refs/heads/gpt-bigcode-lora-doc","pushedAt":"2024-05-31T23:52:04.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"njhill","name":"Nick Hill","path":"/njhill","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/16958488?s=80&v=4"},"commit":{"message":"[Doc] Add checkmark for GPTBigCodeForCausalLM LoRA support\n\nThis was recently added in https://github.com/vllm-project/vllm/pull/3949 but we forgot to update the doc.","shortMessageHtmlLink":"[Doc] Add checkmark for GPTBigCodeForCausalLM LoRA support"}},{"before":"a377f0bd5e1fa0ca069e3dbf28f4de5af64d0bb1","after":"e9899fb7a4d9e032198d26ef84f1dd2cfd9621aa","ref":"refs/heads/main","pushedAt":"2024-05-31T21:29:20.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"LiuXiaoxuanPKU","name":"Lily Liu","path":"/LiuXiaoxuanPKU","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/16137495?s=80&v=4"},"commit":{"message":"[Model] Enable FP8 QKV in MoE and refine kernel tuning script (#5039)","shortMessageHtmlLink":"[Model] Enable FP8 QKV in MoE and refine kernel tuning script (#5039)"}},{"before":"e9d3aa04f6e55e2bb540f0810da97ddd0deebb13","after":"a377f0bd5e1fa0ca069e3dbf28f4de5af64d0bb1","ref":"refs/heads/main","pushedAt":"2024-05-31T05:14:50.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"DarkLight1337","name":"Cyrus Leung","path":"/DarkLight1337","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/44970335?s=80&v=4"},"commit":{"message":"[Misc]: optimize eager mode host time (#4196)\n\nCo-authored-by: xuhao ","shortMessageHtmlLink":"[Misc]: optimize eager mode host time (#4196)"}},{"before":"a22dea54d3e80bf069cfeed8002a193ef8b18e1b","after":"e9d3aa04f6e55e2bb540f0810da97ddd0deebb13","ref":"refs/heads/main","pushedAt":"2024-05-31T05:00:26.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"Revert \"[Kernel] Marlin_24: Ensure the mma.sp instruction is using the ::ordered_metadata modifier (introduced with PTX 8.5)\" (#5149)","shortMessageHtmlLink":"Revert \"[Kernel] Marlin_24: Ensure the mma.sp instruction is using th…"}},{"before":"8ea8c2cb18ae287e8e56ca84953117902a3fb9be","after":"090441f252a8a229b5be26b1434acfef1006040b","ref":"refs/heads/simon-mo/test-ignore-eos","pushedAt":"2024-05-31T04:56:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"DarkLight1337","name":"Cyrus Leung","path":"/DarkLight1337","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/44970335?s=80&v=4"},"commit":{"message":"Apply formatter","shortMessageHtmlLink":"Apply formatter"}},{"before":"db69a73280cd8c1cbd36e2fc01af0ef668339719","after":"8ea8c2cb18ae287e8e56ca84953117902a3fb9be","ref":"refs/heads/simon-mo/test-ignore-eos","pushedAt":"2024-05-31T04:55:06.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"DarkLight1337","name":"Cyrus Leung","path":"/DarkLight1337","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/44970335?s=80&v=4"},"commit":{"message":"Fix linter error","shortMessageHtmlLink":"Fix linter error"}},{"before":null,"after":"80a9c0d49786a446455ad6474c01742cf87dbbdd","ref":"refs/heads/revert-5136-marlin_24_ptx_ordered_metadata","pushedAt":"2024-05-31T04:27:40.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"Revert \"[Kernel] Marlin_24: Ensure the mma.sp instruction is using the ::orde…\"\n\nThis reverts commit 6d21fa1cadf1e623e302eb04c15e4927febc8cf1.","shortMessageHtmlLink":"Revert \"[Kernel] Marlin_24: Ensure the mma.sp instruction is using th…"}},{"before":"533c2177925ba19934eab0095a50d0a783185e6b","after":"a22dea54d3e80bf069cfeed8002a193ef8b18e1b","ref":"refs/heads/main","pushedAt":"2024-05-31T02:24:41.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"zhuohan123","name":"Zhuohan Li","path":"/zhuohan123","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17310766?s=80&v=4"},"commit":{"message":"[Model] Support MAP-NEO model (#5081)\n\nCo-authored-by: Zhuohan Li ","shortMessageHtmlLink":"[Model] Support MAP-NEO model (#5081)"}},{"before":"6d21fa1cadf1e623e302eb04c15e4927febc8cf1","after":"533c2177925ba19934eab0095a50d0a783185e6b","ref":"refs/heads/main","pushedAt":"2024-05-31T02:13:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"Fix cutlass sm_90a vesrion in CMakeList","shortMessageHtmlLink":"Fix cutlass sm_90a vesrion in CMakeList"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEWluYxgA","startCursor":null,"endCursor":null}},"title":"Activity · vllm-project/vllm"}