{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":599547518,"defaultBranch":"main","name":"vllm","ownerLogin":"vllm-project","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-02-09T11:23:20.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/136984999?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1716851636.0","currentOid":""},"activityList":{"items":[{"before":"890aa93d275a2b75313629614ab9ed278a13f6d7","after":"d4f398590786f0015d474b03a3d078db1e7d1be2","ref":"refs/heads/main","pushedAt":"2024-05-28T02:07:07.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"rkooo567","name":"SangBin Cho","path":"/rkooo567","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/18510752?s=80&v=4"},"commit":{"message":"[Core] Sliding window for block manager v2 (#4545)\n\nCo-authored-by: Ruth Evans ","shortMessageHtmlLink":"[Core] Sliding window for block manager v2 (#4545)"}},{"before":"fbdb7b3ee2c3f7b58841c12b52ed4c83f508babb","after":"890aa93d275a2b75313629614ab9ed278a13f6d7","ref":"refs/heads/main","pushedAt":"2024-05-27T23:41:43.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"zhuohan123","name":"Zhuohan Li","path":"/zhuohan123","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17310766?s=80&v=4"},"commit":{"message":"[Model] Add support for falcon-11B (#5069)","shortMessageHtmlLink":"[Model] Add support for falcon-11B (#5069)"}},{"before":"fbdb7b3ee2c3f7b58841c12b52ed4c83f508babb","after":"799147a4876bbef10471a007751f9ee9dadc484c","ref":"refs/heads/fix-embedding-with-tp","pushedAt":"2024-05-27T23:24:22.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"fix embedding model + tp","shortMessageHtmlLink":"fix embedding model + tp"}},{"before":null,"after":"fbdb7b3ee2c3f7b58841c12b52ed4c83f508babb","ref":"refs/heads/fix-embedding-with-tp","pushedAt":"2024-05-27T23:13:56.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"[Core] Allow AQLM on Pascal (#5058)","shortMessageHtmlLink":"[Core] Allow AQLM on Pascal (#5058)"}},{"before":"1102bef2195a102c6a5489a28329e543a600b4d8","after":"fbdb7b3ee2c3f7b58841c12b52ed4c83f508babb","ref":"refs/heads/main","pushedAt":"2024-05-27T22:26:14.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"[Core] Allow AQLM on Pascal (#5058)","shortMessageHtmlLink":"[Core] Allow AQLM on Pascal (#5058)"}},{"before":"f17a1a8f9665bb237a3dddda7dc93f259e5e81e0","after":"1102bef2195a102c6a5489a28329e543a600b4d8","ref":"refs/heads/main","pushedAt":"2024-05-27T22:18:17.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"zhuohan123","name":"Zhuohan Li","path":"/zhuohan123","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/17310766?s=80&v=4"},"commit":{"message":"[Bugfix / Core] Prefix Caching Guards (merged with main) (#4846)\n\nCo-authored-by: rsnm2 \r\nCo-authored-by: Robert Shaw <114415538+robertgshaw2-neuralmagic@users.noreply.github.com>","shortMessageHtmlLink":"[Bugfix / Core] Prefix Caching Guards (merged with main) (#4846)"}},{"before":"84253fdea362b454b7213fbd45e9812b4b6ed882","after":"7a61f51a9592e88f951edeb989b415d27b820d69","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-27T17:53:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"Update test_disable_sliding_window.py","shortMessageHtmlLink":"Update test_disable_sliding_window.py"}},{"before":"4285763fdebbd19bb40a13f3840651a392cb86e8","after":"84253fdea362b454b7213fbd45e9812b4b6ed882","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-27T16:53:02.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"fixed logging","shortMessageHtmlLink":"fixed logging"}},{"before":"7c8a9d0592c76e2d3e549eee44f59ff7414fd041","after":"4285763fdebbd19bb40a13f3840651a392cb86e8","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-27T16:46:41.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"format","shortMessageHtmlLink":"format"}},{"before":"93bce3774dc58cab359a7f5858fc0b3841ec839b","after":"7c8a9d0592c76e2d3e549eee44f59ff7414fd041","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-27T16:45:41.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"updated test","shortMessageHtmlLink":"updated test"}},{"before":"7b186c23867c05622394f6aee22458e65c49c804","after":"93bce3774dc58cab359a7f5858fc0b3841ec839b","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-27T16:16:08.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"updated comment","shortMessageHtmlLink":"updated comment"}},{"before":"37efe98115fc7ec656a2d263914e1b7f29b36498","after":"7b186c23867c05622394f6aee22458e65c49c804","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-27T16:14:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"format","shortMessageHtmlLink":"format"}},{"before":"d5a16977729928a2ceafb5ec8764081f40f7cdff","after":"f17a1a8f9665bb237a3dddda7dc93f259e5e81e0","ref":"refs/heads/main","pushedAt":"2024-05-25T17:28:16.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"ywang96","name":"Roger Wang","path":"/ywang96","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/136131678?s=80&v=4"},"commit":{"message":"[Misc] Make Serving Benchmark More User-friendly (#5044)","shortMessageHtmlLink":"[Misc] Make Serving Benchmark More User-friendly (#5044)"}},{"before":"325c119961698c27d8d11d61d019a6d57c814c51","after":"d5a16977729928a2ceafb5ec8764081f40f7cdff","ref":"refs/heads/main","pushedAt":"2024-05-25T17:00:14.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Dynamic Spec Decoding] Minor fix for disabling speculative decoding (#5000)","shortMessageHtmlLink":"[Dynamic Spec Decoding] Minor fix for disabling speculative decoding (#…"}},{"before":"8e192ff967b44b186ea02d30e49fddf656fdfe50","after":"325c119961698c27d8d11d61d019a6d57c814c51","ref":"refs/heads/main","pushedAt":"2024-05-25T06:49:49.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"youkaichao","name":"youkaichao","path":"/youkaichao","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/23236638?s=80&v=4"},"commit":{"message":"[Misc] add logging level env var (#5045)","shortMessageHtmlLink":"[Misc] add logging level env var (#5045)"}},{"before":"e64fde4b013cb8bb2321f59ba78aca50b02071cb","after":"8e192ff967b44b186ea02d30e49fddf656fdfe50","ref":"refs/heads/main","pushedAt":"2024-05-25T05:00:52.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Kernel][Backend][Model] Blocksparse flash attention kernel and Phi-3-Small model (#4799)\n\nCo-authored-by: beagleski \r\nCo-authored-by: bapatra \r\nCo-authored-by: Barun Patra \r\nCo-authored-by: Michael Goin ","shortMessageHtmlLink":"[Kernel][Backend][Model] Blocksparse flash attention kernel and Phi-3…"}},{"before":"e027eb6703ffaa5543f6a0ab2d12af737999eeb2","after":"b83f540a7fb78aaa9b20ab99b6e68fb70c2483be","ref":"refs/heads/disable-queue-size","pushedAt":"2024-05-24T21:42:42.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"LiuXiaoxuanPKU","name":"Lily Liu","path":"/LiuXiaoxuanPKU","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/16137495?s=80&v=4"},"commit":{"message":"fix tests","shortMessageHtmlLink":"fix tests"}},{"before":"13797c17038969cbdecf4086201e447957afe82f","after":"37efe98115fc7ec656a2d263914e1b7f29b36498","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T18:19:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"added test","shortMessageHtmlLink":"added test"}},{"before":"8225c3f1c26a4522ffb05b6f7652946f3ed86813","after":"13797c17038969cbdecf4086201e447957afe82f","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T18:18:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"added test and fixed requirements dev","shortMessageHtmlLink":"added test and fixed requirements dev"}},{"before":"b56352b6c202ccddd255cce3e06614c0a64f58a9","after":"8225c3f1c26a4522ffb05b6f7652946f3ed86813","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T17:52:37.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"format","shortMessageHtmlLink":"format"}},{"before":"034bbde9802ac6836245e3da8f8d9ffbe19759a8","after":"b56352b6c202ccddd255cce3e06614c0a64f58a9","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T17:23:16.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"updated models to remove sliding window. Big update to qwen to prevent non-uniform caching","shortMessageHtmlLink":"updated models to remove sliding window. Big update to qwen to preven…"}},{"before":"8a531804dbd2c6c13f0db3c8c81f9151934322e9","after":"034bbde9802ac6836245e3da8f8d9ffbe19759a8","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T17:10:36.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"removed from mixtral, need to fix qwen","shortMessageHtmlLink":"removed from mixtral, need to fix qwen"}},{"before":"919770957f26d71a5a6eda7a1a7443dfeb5ba0ee","after":"e64fde4b013cb8bb2321f59ba78aca50b02071cb","ref":"refs/heads/main","pushedAt":"2024-05-24T17:07:09.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"cadedaniel","name":"Cade Daniel","path":"/cadedaniel","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/950914?s=80&v=4"},"commit":{"message":"[Core][Bugfix]: fix prefix caching for blockv2 (#4764)\n\nCo-authored-by: Lei Wen ","shortMessageHtmlLink":"[Core][Bugfix]: fix prefix caching for blockv2 (#4764)"}},{"before":"1126c5aa81639a7e9ddc0b10ed4873765085b9dc","after":"8a531804dbd2c6c13f0db3c8c81f9151934322e9","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T17:05:21.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"more cleanup for PR readibility","shortMessageHtmlLink":"more cleanup for PR readibility"}},{"before":"9fd64fe79d2bd694dec0f078c6bcb0c7fa913734","after":"1126c5aa81639a7e9ddc0b10ed4873765085b9dc","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T17:03:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"more cleanup for PR readibility","shortMessageHtmlLink":"more cleanup for PR readibility"}},{"before":"a497b7b808bf55411f0c6e0dd85dfe3437ac2c93","after":"9fd64fe79d2bd694dec0f078c6bcb0c7fa913734","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:59:18.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"more cleanup for PR readibility","shortMessageHtmlLink":"more cleanup for PR readibility"}},{"before":"6f754c3b24e85b4ae095b82146e55e42361d3ff7","after":"a497b7b808bf55411f0c6e0dd85dfe3437ac2c93","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:58:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"cleanup prints and comments to match current for easier review","shortMessageHtmlLink":"cleanup prints and comments to match current for easier review"}},{"before":"3f73426a49140b2a351cd99abd9f55c053d5b14c","after":"6f754c3b24e85b4ae095b82146e55e42361d3ff7","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:54:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"stash","shortMessageHtmlLink":"stash"}},{"before":"4a3630c4afc4a1215c16466531cc2e96b6d8867c","after":"3f73426a49140b2a351cd99abd9f55c053d5b14c","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:42:40.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"more cleanup","shortMessageHtmlLink":"more cleanup"}},{"before":"63c0097b51f21a059238dfc74e19f6caeead50ad","after":"4a3630c4afc4a1215c16466531cc2e96b6d8867c","ref":"refs/heads/prefix-caching-guards-new","pushedAt":"2024-05-24T16:40:25.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"robertgshaw2-neuralmagic","name":"Robert Shaw","path":"/robertgshaw2-neuralmagic","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/114415538?s=80&v=4"},"commit":{"message":"more cleanup","shortMessageHtmlLink":"more cleanup"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEVVxBeQA","startCursor":null,"endCursor":null}},"title":"Activity · vllm-project/vllm"}