{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":599547518,"defaultBranch":"main","name":"vllm","ownerLogin":"vllm-project","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-02-09T11:23:20.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/136984999?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1716527147.0","currentOid":""},"activityList":{"items":[{"before":"e027eb6703ffaa5543f6a0ab2d12af737999eeb2","after":"b83f540a7fb78aaa9b20ab99b6e68fb70c2483be","ref":"refs/heads/disable-queue-size","pushedAt":"2024-05-24T21:42:42.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"LiuXiaoxuanPKU","name":"Lily Liu","path":"/LiuXiaoxuanPKU","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/16137495?s=80&v=4"},"commit":{"message":"fix tests","shortMessageHtmlLink":"fix tests"}},{"before":"13797c17038969cbdecf4086201e447957afe82f","after":"37efe98115fc7ec656a2d263914e1b7f29b36498","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T18:19:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"added test","shortMessageHtmlLink":"added test"}},{"before":"8225c3f1c26a4522ffb05b6f7652946f3ed86813","after":"13797c17038969cbdecf4086201e447957afe82f","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T18:18:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"added test and fixed requirements dev","shortMessageHtmlLink":"added test and fixed requirements dev"}},{"before":"b56352b6c202ccddd255cce3e06614c0a64f58a9","after":"8225c3f1c26a4522ffb05b6f7652946f3ed86813","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T17:52:37.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"format","shortMessageHtmlLink":"format"}},{"before":"034bbde9802ac6836245e3da8f8d9ffbe19759a8","after":"b56352b6c202ccddd255cce3e06614c0a64f58a9","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T17:23:16.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"updated models to remove sliding window. Big update to qwen to prevent non-uniform caching","shortMessageHtmlLink":"updated models to remove sliding window. Big update to qwen to preven…"}},{"before":"8a531804dbd2c6c13f0db3c8c81f9151934322e9","after":"034bbde9802ac6836245e3da8f8d9ffbe19759a8","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T17:10:36.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"removed from mixtral, need to fix qwen","shortMessageHtmlLink":"removed from mixtral, need to fix qwen"}},{"before":"919770957f26d71a5a6eda7a1a7443dfeb5ba0ee","after":"e64fde4b013cb8bb2321f59ba78aca50b02071cb","ref":"refs/heads/main","pushedAt":"2024-05-24T17:07:09.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"cadedaniel","name":"Cade Daniel","path":"/cadedaniel","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/950914?s=80&v=4"},"commit":{"message":"[Core][Bugfix]: fix prefix caching for blockv2 (#4764)\n\nCo-authored-by: Lei Wen ","shortMessageHtmlLink":"[Core][Bugfix]: fix prefix caching for blockv2 (#4764)"}},{"before":"1126c5aa81639a7e9ddc0b10ed4873765085b9dc","after":"8a531804dbd2c6c13f0db3c8c81f9151934322e9","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T17:05:21.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"more cleanup for PR readibility","shortMessageHtmlLink":"more cleanup for PR readibility"}},{"before":"9fd64fe79d2bd694dec0f078c6bcb0c7fa913734","after":"1126c5aa81639a7e9ddc0b10ed4873765085b9dc","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T17:03:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"more cleanup for PR readibility","shortMessageHtmlLink":"more cleanup for PR readibility"}},{"before":"a497b7b808bf55411f0c6e0dd85dfe3437ac2c93","after":"9fd64fe79d2bd694dec0f078c6bcb0c7fa913734","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:59:18.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"more cleanup for PR readibility","shortMessageHtmlLink":"more cleanup for PR readibility"}},{"before":"6f754c3b24e85b4ae095b82146e55e42361d3ff7","after":"a497b7b808bf55411f0c6e0dd85dfe3437ac2c93","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:58:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"cleanup prints and comments to match current for easier review","shortMessageHtmlLink":"cleanup prints and comments to match current for easier review"}},{"before":"3f73426a49140b2a351cd99abd9f55c053d5b14c","after":"6f754c3b24e85b4ae095b82146e55e42361d3ff7","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:54:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"stash","shortMessageHtmlLink":"stash"}},{"before":"4a3630c4afc4a1215c16466531cc2e96b6d8867c","after":"3f73426a49140b2a351cd99abd9f55c053d5b14c","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:42:40.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"more cleanup","shortMessageHtmlLink":"more cleanup"}},{"before":"63c0097b51f21a059238dfc74e19f6caeead50ad","after":"4a3630c4afc4a1215c16466531cc2e96b6d8867c","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:40:25.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"more cleanup","shortMessageHtmlLink":"more cleanup"}},{"before":"063896042b67d18a33141eaa2fa86d584e2f1164","after":"63c0097b51f21a059238dfc74e19f6caeead50ad","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:38:33.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"revert change to make PR easier to read","shortMessageHtmlLink":"revert change to make PR easier to read"}},{"before":"033c2c5ea1efce8cc2738d1502252f5e3d424de4","after":"063896042b67d18a33141eaa2fa86d584e2f1164","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:34:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"removed spurious changes","shortMessageHtmlLink":"removed spurious changes"}},{"before":"6a50f4cafaf9f734b3f6ad11e6af38838aa3baf8","after":"919770957f26d71a5a6eda7a1a7443dfeb5ba0ee","ref":"refs/heads/main","pushedAt":"2024-05-24T12:28:27.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"[Bugfix] Fix Mistral v0.3 Weight Loading (#5005)\n\nCo-authored-by: Cody Yu ","shortMessageHtmlLink":"[Bugfix] Fix Mistral v0.3 Weight Loading (#5005)"}},{"before":"c90a1b6612d30039f65147327c01b2b6a2657165","after":null,"ref":"refs/heads/update_ray_data_example","pushedAt":"2024-05-24T05:05:47.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"Yard1","name":"Antoni Baum","path":"/Yard1","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10364161?s=80&v=4"}},{"before":"e3470f87538ec86d1094ac4747519c6300213088","after":"6a50f4cafaf9f734b3f6ad11e6af38838aa3baf8","ref":"refs/heads/main","pushedAt":"2024-05-23T23:21:54.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"youkaichao","name":"youkaichao","path":"/youkaichao","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23236638?s=80&v=4"},"commit":{"message":"[Doc] add ccache guide in doc (#5012)\n\nCo-authored-by: Michael Goin ","shortMessageHtmlLink":"[Doc] add ccache guide in doc (#5012)"}},{"before":"a1242324c99ff8b1e29981006dfb504da198c7c3","after":"e3470f87538ec86d1094ac4747519c6300213088","ref":"refs/heads/main","pushedAt":"2024-05-23T22:04:24.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Core]: Option To Use Prompt Token Ids Inside Logits Processor (#4985)\n\nCo-authored-by: Elisei Smirnov ","shortMessageHtmlLink":"[Core]: Option To Use Prompt Token Ids Inside Logits Processor (#4985)"}},{"before":"5eda2ea02a01b2457f4d6ac2a217f2fa8a2e5d5f","after":"a1242324c99ff8b1e29981006dfb504da198c7c3","ref":"refs/heads/main","pushedAt":"2024-05-23T21:29:18.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"[Kernel] Initial Activation Quantization Support (#4525)\n\nCo-authored-by: Varun Sundar Rabindranath \r\nCo-authored-by: Varun Sundar Rabindranath ","shortMessageHtmlLink":"[Kernel] Initial Activation Quantization Support (#4525)"}},{"before":"adaccf8e5f6c5b86034b5e3234832debce57f04f","after":"e027eb6703ffaa5543f6a0ab2d12af737999eeb2","ref":"refs/heads/disable-queue-size","pushedAt":"2024-05-23T19:16:25.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"LiuXiaoxuanPKU","name":"Lily Liu","path":"/LiuXiaoxuanPKU","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/16137495?s=80&v=4"},"commit":{"message":"fix comments","shortMessageHtmlLink":"fix comments"}},{"before":"2ba80bed2732edf42b1014ea4e34757849fc93d0","after":"5eda2ea02a01b2457f4d6ac2a217f2fa8a2e5d5f","ref":"refs/heads/main","pushedAt":"2024-05-23T16:54:48.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"youkaichao","name":"youkaichao","path":"/youkaichao","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23236638?s=80&v=4"},"commit":{"message":"[Core][1/N] Support send/recv in PyNCCL Groups (#4988)\n\nSigned-off-by: Muralidhar Andoorveedu ","shortMessageHtmlLink":"[Core][1/N] Support send/recv in PyNCCL Groups (#4988)"}},{"before":"606625329648e6eff1883e23040adfad82f219cf","after":"2ba80bed2732edf42b1014ea4e34757849fc93d0","ref":"refs/heads/main","pushedAt":"2024-05-23T16:08:58.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Bugfix] Update Dockerfile.cpu to fix NameError: name 'vllm_ops' is not defined (#5009)","shortMessageHtmlLink":"[Bugfix] Update Dockerfile.cpu to fix NameError: name 'vllm_ops' is n…"}},{"before":"8efc774fb721d3a14fc32d2c2236f284da5d5fa0","after":"033c2c5ea1efce8cc2738d1502252f5e3d424de4","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-23T12:02:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"updated to remove sliding window usage in models","shortMessageHtmlLink":"updated to remove sliding window usage in models"}},{"before":"6620e534702f2e50dbc921d4c7323f99f895a015","after":"8efc774fb721d3a14fc32d2c2236f284da5d5fa0","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-23T11:34:31.000Z","pushType":"push","commitsCount":52,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"Merge branch 'main' into prefix-caching-guards-new","shortMessageHtmlLink":"Merge branch 'main' into prefix-caching-guards-new"}},{"before":"ee3eea0a1b2c690557455d97074d8829d5a98320","after":"adaccf8e5f6c5b86034b5e3234832debce57f04f","ref":"refs/heads/disable-queue-size","pushedAt":"2024-05-23T06:45:06.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"LiuXiaoxuanPKU","name":"Lily Liu","path":"/LiuXiaoxuanPKU","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/16137495?s=80&v=4"},"commit":{"message":"test and fix","shortMessageHtmlLink":"test and fix"}},{"before":null,"after":"ee3eea0a1b2c690557455d97074d8829d5a98320","ref":"refs/heads/disable-queue-size","pushedAt":"2024-05-23T06:44:28.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"LiuXiaoxuanPKU","name":"Lily Liu","path":"/LiuXiaoxuanPKU","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/16137495?s=80&v=4"},"commit":{"message":"[Misc] Take user preference in attention selector (#4960)","shortMessageHtmlLink":"[Misc] Take user preference in attention selector (#4960)"}},{"before":"ee3eea0a1b2c690557455d97074d8829d5a98320","after":"606625329648e6eff1883e23040adfad82f219cf","ref":"refs/heads/main","pushedAt":"2024-05-23T06:39:28.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"mgoin","name":"Michael Goin","path":"/mgoin","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/3195154?s=80&v=4"},"commit":{"message":"Marlin 24 prefill performance improvement (about 25% better on average) (#4983)","shortMessageHtmlLink":"Marlin 24 prefill performance improvement (about 25% better on averag…"}},{"before":"a36de682d4283c60777bc3022ed3ce71cd90b904","after":"ee3eea0a1b2c690557455d97074d8829d5a98320","ref":"refs/heads/main","pushedAt":"2024-05-22T22:55:56.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"rkooo567","name":"SangBin Cho","path":"/rkooo567","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/18510752?s=80&v=4"},"commit":{"message":"[Misc] Take user preference in attention selector (#4960)","shortMessageHtmlLink":"[Misc] Take user preference in attention selector (#4960)"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEU2xtoQA","startCursor":null,"endCursor":null}},"title":"Activity · vllm-project/vllm"}