{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":599547518,"defaultBranch":"main","name":"vllm","ownerLogin":"vllm-project","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-02-09T11:23:20.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/136984999?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1717617146.0","currentOid":""},"activityList":{"items":[{"before":"6475b54a5bbeb6b68f3cff68cce1cca110e4d476","after":"908470c3c564b0cc95754a81f604d99fb66cfeba","ref":"refs/heads/torch-xla","pushedAt":"2024-06-05T23:50:50.000Z","pushType":"push","commitsCount":3,"pusher":{"login":"WoosukKwon","name":"Woosuk Kwon","path":"/WoosukKwon","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/46394894?s=80&v=4"},"commit":{"message":"yapf","shortMessageHtmlLink":"yapf"}},{"before":"3a6ae1d33c7a8ef28b6dfa978f53b4fdcdbaaca6","after":"7b0a0dfb22907505441f8a4a5eb882cbca4d2acf","ref":"refs/heads/main","pushedAt":"2024-06-05T23:49:12.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Frontend][Core] Update Outlines Integration from `FSM` to `Guide` (#4109)\n\nCo-authored-by: Simon Mo \r\nCo-authored-by: Breno Faria ","shortMessageHtmlLink":"[Frontend][Core] Update Outlines Integration from FSM to Guide (#…"}},{"before":"8f1729b829795c2c98152fef8857c5e7b8c4e648","after":"3a6ae1d33c7a8ef28b6dfa978f53b4fdcdbaaca6","ref":"refs/heads/main","pushedAt":"2024-06-05T22:49:27.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[CI] Disable flash_attn backend for spec decode (#5286)","shortMessageHtmlLink":"[CI] Disable flash_attn backend for spec decode (#5286)"}},{"before":"6a7c7711a2588ca4a5e713e5335122988f8c0a55","after":"8f1729b829795c2c98152fef8857c5e7b8c4e648","ref":"refs/heads/main","pushedAt":"2024-06-05T22:25:18.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Docs] Add Ray Summit CFP (#5295)","shortMessageHtmlLink":"[Docs] Add Ray Summit CFP (#5295)"}},{"before":"0f83ddd4d71ce1a80cfcaff085b40fef83d1a750","after":"6a7c7711a2588ca4a5e713e5335122988f8c0a55","ref":"refs/heads/main","pushedAt":"2024-06-05T22:19:02.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Misc] Skip for logits_scale == 1.0 (#5291)","shortMessageHtmlLink":"[Misc] Skip for logits_scale == 1.0 (#5291)"}},{"before":"065aff6c16bd563acc449b1dae6a99256cfbdeb8","after":"0f83ddd4d71ce1a80cfcaff085b40fef83d1a750","ref":"refs/heads/main","pushedAt":"2024-06-05T22:18:13.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Bugfix][Frontend/Core] Don't log exception when AsyncLLMEngine gracefully shuts down. (#5290)","shortMessageHtmlLink":"[Bugfix][Frontend/Core] Don't log exception when AsyncLLMEngine grace…"}},{"before":"3d33e372a14614b13a793f374e59bddb3027527e","after":"065aff6c16bd563acc449b1dae6a99256cfbdeb8","ref":"refs/heads/main","pushedAt":"2024-06-05T22:16:56.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Bugfix] Make EngineArgs use named arguments for config construction (#5285)","shortMessageHtmlLink":"[Bugfix] Make EngineArgs use named arguments for config construction (#…"}},{"before":"faf71bcd4b11b6d350431f432af08ccd9f30016f","after":"3d33e372a14614b13a793f374e59bddb3027527e","ref":"refs/heads/main","pushedAt":"2024-06-05T21:53:16.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[BugFix] Fix log message about default max model length (#5284)","shortMessageHtmlLink":"[BugFix] Fix log message about default max model length (#5284)"}},{"before":"f270a3953770547d5f8783320897870fcd031884","after":"faf71bcd4b11b6d350431f432af08ccd9f30016f","ref":"refs/heads/main","pushedAt":"2024-06-05T21:53:06.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Speculative Decoding] Add `ProposerWorkerBase` abstract class (#5252)","shortMessageHtmlLink":"[Speculative Decoding] Add ProposerWorkerBase abstract class (#5252)"}},{"before":"8819df91dd66c155658de5e83b8caef5ef8a4a80","after":"6475b54a5bbeb6b68f3cff68cce1cca110e4d476","ref":"refs/heads/torch-xla","pushedAt":"2024-06-05T20:47:40.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"WoosukKwon","name":"Woosuk Kwon","path":"/WoosukKwon","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/46394894?s=80&v=4"},"commit":{"message":"Compatible with compute_logits","shortMessageHtmlLink":"Compatible with compute_logits"}},{"before":"b0b42d8dde18cd327fa71d250f46538f002c81b6","after":"8819df91dd66c155658de5e83b8caef5ef8a4a80","ref":"refs/heads/torch-xla","pushedAt":"2024-06-05T20:23:05.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"WoosukKwon","name":"Woosuk Kwon","path":"/WoosukKwon","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/46394894?s=80&v=4"},"commit":{"message":"Remove TPU models","shortMessageHtmlLink":"Remove TPU models"}},{"before":"2e8860a6e2c88f39d3230c0a6f6560c9617045fc","after":"b0b42d8dde18cd327fa71d250f46538f002c81b6","ref":"refs/heads/torch-xla","pushedAt":"2024-06-05T20:21:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"WoosukKwon","name":"Woosuk Kwon","path":"/WoosukKwon","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/46394894?s=80&v=4"},"commit":{"message":"Remove benchmarking scripts","shortMessageHtmlLink":"Remove benchmarking scripts"}},{"before":"ca9283a8dccaa92095a423804b10ffa6607294c0","after":"2e8860a6e2c88f39d3230c0a6f6560c9617045fc","ref":"refs/heads/torch-xla","pushedAt":"2024-06-05T20:20:03.000Z","pushType":"push","commitsCount":20,"pusher":{"login":"WoosukKwon","name":"Woosuk Kwon","path":"/WoosukKwon","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/46394894?s=80&v=4"},"commit":{"message":"Merge branch 'main' into torch-xla","shortMessageHtmlLink":"Merge branch 'main' into torch-xla"}},{"before":null,"after":"7c52473c068a7b8ac325ddbed15e95962159e50e","ref":"refs/heads/fix-logits","pushedAt":"2024-06-05T19:52:26.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"WoosukKwon","name":"Woosuk Kwon","path":"/WoosukKwon","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/46394894?s=80&v=4"},"commit":{"message":"[Misc] Skip for logits_scale == 1.0","shortMessageHtmlLink":"[Misc] Skip for logits_scale == 1.0"}},{"before":"a18fbe778d6e32f3e32cc8350d75e1da5a00364b","after":"79d0c43116e42f4312c4f9b253f1f8f3f0508b33","ref":"refs/heads/avoid_tokens_copy","pushedAt":"2024-06-05T19:46:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Yard1","name":"Antoni Baum","path":"/Yard1","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10364161?s=80&v=4"},"commit":{"message":"Update vllm/model_executor/sampling_metadata.py","shortMessageHtmlLink":"Update vllm/model_executor/sampling_metadata.py"}},{"before":"f270a3953770547d5f8783320897870fcd031884","after":"a18fbe778d6e32f3e32cc8350d75e1da5a00364b","ref":"refs/heads/avoid_tokens_copy","pushedAt":"2024-06-05T19:26:47.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"Yard1","name":"Antoni Baum","path":"/Yard1","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10364161?s=80&v=4"},"commit":{"message":"[Core] Avoid copying prompt/output tokens if no penalties are used","shortMessageHtmlLink":"[Core] Avoid copying prompt/output tokens if no penalties are used"}},{"before":null,"after":"f270a3953770547d5f8783320897870fcd031884","ref":"refs/heads/avoid_tokens_copy","pushedAt":"2024-06-05T19:26:26.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"Yard1","name":"Antoni Baum","path":"/Yard1","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10364161?s=80&v=4"},"commit":{"message":"[Docs] Add Sequoia as sponsors (#5287)","shortMessageHtmlLink":"[Docs] Add Sequoia as sponsors (#5287)"}},{"before":"51a08e7d8f0f11411d380c007ab606fc2d5e3cf9","after":"f270a3953770547d5f8783320897870fcd031884","ref":"refs/heads/main","pushedAt":"2024-06-05T18:02:56.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Docs] Add Sequoia as sponsors (#5287)","shortMessageHtmlLink":"[Docs] Add Sequoia as sponsors (#5287)"}},{"before":"eb8fcd266686570a1cfdcda4af73af0e27b0f3d8","after":"51a08e7d8f0f11411d380c007ab606fc2d5e3cf9","ref":"refs/heads/main","pushedAt":"2024-06-05T17:59:15.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Kernel] Re-tune Mixtral MoE configurations for FP8 on H100 (#5238)","shortMessageHtmlLink":"[Kernel] Re-tune Mixtral MoE configurations for FP8 on H100 (#5238)"}},{"before":"5563a4dea86e62a560c8c99537ce614d5de894e0","after":"eb8fcd266686570a1cfdcda4af73af0e27b0f3d8","ref":"refs/heads/main","pushedAt":"2024-06-05T17:59:02.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[BugFix] Apply get_cached_tokenizer to the tokenizer setter of LLM (#5207)\n\nCo-authored-by: qiujiawei9 ","shortMessageHtmlLink":"[BugFix] Apply get_cached_tokenizer to the tokenizer setter of LLM (#…"}},{"before":"ccd4f129e8ad95191b3c8d6d0e935382b10c5164","after":"5563a4dea86e62a560c8c99537ce614d5de894e0","ref":"refs/heads/main","pushedAt":"2024-06-05T17:58:51.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Model] Correct Mixtral FP8 checkpoint loading (#5231)","shortMessageHtmlLink":"[Model] Correct Mixtral FP8 checkpoint loading (#5231)"}},{"before":"02cc3b51a7f2af012a8f17f0d836529d57012eee","after":"ccd4f129e8ad95191b3c8d6d0e935382b10c5164","ref":"refs/heads/main","pushedAt":"2024-06-05T17:44:15.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Kernel] Add GPU architecture guards to the CUTLASS w8a8 kernels to reduce binary size (#5157)\n\nCo-authored-by: Cody Yu ","shortMessageHtmlLink":"[Kernel] Add GPU architecture guards to the CUTLASS w8a8 kernels to r…"}},{"before":"d5b1eb081e193c54ac21390a0f6ba7013e4f3b11","after":"02cc3b51a7f2af012a8f17f0d836529d57012eee","ref":"refs/heads/main","pushedAt":"2024-06-05T17:17:51.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[misc] benchmark_serving.py -- add ITL results and tweak TPOT results (#5263)","shortMessageHtmlLink":"[misc] benchmark_serving.py -- add ITL results and tweak TPOT results ("}},{"before":"f0a500545f97d026c3873e8dc0043e06e42ae61c","after":"d5b1eb081e193c54ac21390a0f6ba7013e4f3b11","ref":"refs/heads/main","pushedAt":"2024-06-05T16:42:08.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[CI] Add nightly benchmarks (#5260)","shortMessageHtmlLink":"[CI] Add nightly benchmarks (#5260)"}},{"before":"c65146e75e71f72bdb93542efdc40c87caccb42e","after":"f0a500545f97d026c3873e8dc0043e06e42ae61c","ref":"refs/heads/main","pushedAt":"2024-06-05T16:32:58.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"simon-mo","name":"Simon Mo","path":"/simon-mo","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21118851?s=80&v=4"},"commit":{"message":"[Frontend] OpenAI API server: Add `add_special_tokens` to ChatCompletionRequest (default False) (#5278)","shortMessageHtmlLink":"[Frontend] OpenAI API server: Add add_special_tokens to ChatComplet…"}},{"before":"ac810b58658041db8379bd5533a6a75b243316c3","after":null,"ref":"refs/heads/minor-attn-fix","pushedAt":"2024-06-05T16:19:05.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"WoosukKwon","name":"Woosuk Kwon","path":"/WoosukKwon","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/46394894?s=80&v=4"}},{"before":"41ca62cf03b31deb68dbc14e4a92a1d4579de08b","after":"c65146e75e71f72bdb93542efdc40c87caccb42e","ref":"refs/heads/main","pushedAt":"2024-06-05T16:18:59.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"WoosukKwon","name":"Woosuk Kwon","path":"/WoosukKwon","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/46394894?s=80&v=4"},"commit":{"message":"[Misc] Fix docstring of get_attn_backend (#5271)","shortMessageHtmlLink":"[Misc] Fix docstring of get_attn_backend (#5271)"}},{"before":"d1182e717fee4cd87cb19379eb67837296ffba22","after":null,"ref":"refs/heads/dispatcher","pushedAt":"2024-06-05T16:18:22.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"WoosukKwon","name":"Woosuk Kwon","path":"/WoosukKwon","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/46394894?s=80&v=4"}},{"before":"974fc9b8455ec6c210534c176fd7d1245ca43261","after":"41ca62cf03b31deb68dbc14e4a92a1d4579de08b","ref":"refs/heads/main","pushedAt":"2024-06-05T16:18:19.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"WoosukKwon","name":"Woosuk Kwon","path":"/WoosukKwon","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/46394894?s=80&v=4"},"commit":{"message":"[Misc] Add CustomOp interface for device portability (#5255)","shortMessageHtmlLink":"[Misc] Add CustomOp interface for device portability (#5255)"}},{"before":"e0e252b49e6ea4688a133626f2e9923891041b04","after":"ca9283a8dccaa92095a423804b10ffa6607294c0","ref":"refs/heads/torch-xla","pushedAt":"2024-06-05T08:34:17.000Z","pushType":"push","commitsCount":294,"pusher":{"login":"WoosukKwon","name":"Woosuk Kwon","path":"/WoosukKwon","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/46394894?s=80&v=4"},"commit":{"message":"Model loader & yapf","shortMessageHtmlLink":"Model loader & yapf"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEXaXgdwA","startCursor":null,"endCursor":null}},"title":"Activity · vllm-project/vllm"}