{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":682213669,"defaultBranch":"main","name":"vllm","ownerLogin":"ymwangg","currentUserCanPush":false,"isFork":true,"isEmpty":false,"createdAt":"2023-08-23T17:30:42.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/19481308?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1722361963.0","currentOid":""},"activityList":{"items":[{"before":null,"after":"e834faaf31f77f03a147c6f8c52f40f368a8d315","ref":"refs/heads/specdec_v0.5.0.post1","pushedAt":"2024-07-30T17:52:43.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Fix async_llm_engine","shortMessageHtmlLink":"Fix async_llm_engine"}},{"before":"acbed3ef40f015fcf64460e629813922fab90380","after":"1744cc99ba9bdefea8f3f798cf51ed650b81a98e","ref":"refs/heads/main","pushedAt":"2024-07-23T20:50:44.000Z","pushType":"push","commitsCount":1300,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"[Doc] Add Phi-3-medium to list of supported models (#5788)","shortMessageHtmlLink":"[Doc] Add Phi-3-medium to list of supported models (vllm-project#5788)"}},{"before":"f013f21cf1e42141ba4ccb28f963ebbc72572614","after":"fe68019543c93e04355ccff9617e983bed27b660","ref":"refs/heads/specdec_v0.4.2","pushedAt":"2024-06-24T21:41:22.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Fix reject_sample","shortMessageHtmlLink":"Fix reject_sample"}},{"before":"6e5c169f00976bb2b64f9dbf22c52c2bebb91daa","after":"f013f21cf1e42141ba4ccb28f963ebbc72572614","ref":"refs/heads/specdec_v0.4.2","pushedAt":"2024-06-24T21:39:43.000Z","pushType":"push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"}},{"before":null,"after":"6e5c169f00976bb2b64f9dbf22c52c2bebb91daa","ref":"refs/heads/specdec_v0.4.2","pushedAt":"2024-06-17T23:08:36.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"init","shortMessageHtmlLink":"init"}},{"before":"0f69ccf841570533ca4b9f27893440ba37aba0c1","after":"d7163dedd79e6f3c282872aea47f785acd40f9eb","ref":"refs/heads/log_cudagraph_memory_usage","pushedAt":"2024-06-13T21:30:33.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"[Logging] Log cudagraph memory usage","shortMessageHtmlLink":"[Logging] Log cudagraph memory usage"}},{"before":"bc0ef2d73f9fbf169a6536cb0bf40b9717907b28","after":"0f69ccf841570533ca4b9f27893440ba37aba0c1","ref":"refs/heads/log_cudagraph_memory_usage","pushedAt":"2024-06-13T21:27:31.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"}},{"before":null,"after":"bc0ef2d73f9fbf169a6536cb0bf40b9717907b28","ref":"refs/heads/log_cudagraph_memory_usage","pushedAt":"2024-06-13T21:15:06.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"}},{"before":null,"after":"82d8d45083445409d9fd134fcebe74326a2adcfe","ref":"refs/heads/specdec_v0.3.3_v2_flash_attn_sliding_window","pushedAt":"2024-04-08T21:10:21.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Add sliding_window support","shortMessageHtmlLink":"Add sliding_window support"}},{"before":null,"after":"15339c74367d2d73c111ec16173e12a56eda605b","ref":"refs/heads/specdec_v0.3.3_v2_flash_attn_fast_sampler","pushedAt":"2024-03-28T20:37:48.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Use simplified sampler for draft model","shortMessageHtmlLink":"Use simplified sampler for draft model"}},{"before":"daad7ba57c14ef20996fb4fa26a50589425a5bec","after":"9b51ee9975ee4917e8021b7372c30e50a1a29288","ref":"refs/heads/specdec_v0.3.3","pushedAt":"2024-03-26T17:54:37.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Fix blocks padding issue","shortMessageHtmlLink":"Fix blocks padding issue"}},{"before":"fe5c675050a09e2094c6a0ecef5fccee5f0b2205","after":"d27aebe2264d9ece950c5d5c2e76a5a8ccb5de56","ref":"refs/heads/specdec_v0.3.3_v2_flash_attn","pushedAt":"2024-03-26T17:52:19.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Fix blocks padding issue","shortMessageHtmlLink":"Fix blocks padding issue"}},{"before":"8ab38b3e01b80321931c7f1cadb63b92df492005","after":"fe5c675050a09e2094c6a0ecef5fccee5f0b2205","ref":"refs/heads/specdec_v0.3.3_v2_flash_attn","pushedAt":"2024-03-19T17:13:16.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Fix get_logits function in sampler for speculative decoding","shortMessageHtmlLink":"Fix get_logits function in sampler for speculative decoding"}},{"before":"93caeead8dde7426beb3d166a903dfbf79fcfe1b","after":"daad7ba57c14ef20996fb4fa26a50589425a5bec","ref":"refs/heads/specdec_v0.3.3","pushedAt":"2024-03-19T17:12:15.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Fix get_logits function in sampler for speculative decoding","shortMessageHtmlLink":"Fix get_logits function in sampler for speculative decoding"}},{"before":null,"after":"8ab38b3e01b80321931c7f1cadb63b92df492005","ref":"refs/heads/specdec_v0.3.3_v2_flash_attn","pushedAt":"2024-03-18T23:29:52.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Use flash_attn_kv_cache to replace Triton MQA kernel","shortMessageHtmlLink":"Use flash_attn_kv_cache to replace Triton MQA kernel"}},{"before":null,"after":"15b3de4fd6aac9844823878f2f4f24ddba215cfa","ref":"refs/heads/specdec_flash_attn","pushedAt":"2024-03-18T18:26:35.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Use fast greedy sampling for draft model","shortMessageHtmlLink":"Use fast greedy sampling for draft model"}},{"before":null,"after":"15b3de4fd6aac9844823878f2f4f24ddba215cfa","ref":"refs/heads/specdec_v0.3.2_v2","pushedAt":"2024-03-14T17:33:46.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Use fast greedy sampling for draft model","shortMessageHtmlLink":"Use fast greedy sampling for draft model"}},{"before":"0bb553a60403f121efd6cb9e097dbe15d890285b","after":"93caeead8dde7426beb3d166a903dfbf79fcfe1b","ref":"refs/heads/specdec_v0.3.3","pushedAt":"2024-03-14T01:19:26.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Initial support of speculative decoding\n\nCo-authored-by: Jie Wang \n\nFix greedy sampling in speculative decoding\n\nAdd back pre-emption by recompute support\n\nAdd logprobs support for speculative decoding.\n\nFix prompt_logprobs and add stop_str support","shortMessageHtmlLink":"Initial support of speculative decoding"}},{"before":null,"after":"0bb553a60403f121efd6cb9e097dbe15d890285b","ref":"refs/heads/specdec_v0.3.3","pushedAt":"2024-03-14T00:39:35.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"}},{"before":"69a49afe09c6f2bb905c79aa1f86e6bb1d85a225","after":null,"ref":"refs/heads/specdec_v0.3.2_fast_draft_sampler","pushedAt":"2024-03-04T19:46:16.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"}},{"before":null,"after":"69a49afe09c6f2bb905c79aa1f86e6bb1d85a225","ref":"refs/heads/specdec_v0.3.2_fast_draft_sampler","pushedAt":"2024-03-04T19:45:32.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"}},{"before":"5e3a872d94d8f0e6bbe90a278ae60a16f2c8b675","after":"97b74ffd146878064e477c1bf1fabb42da7c113f","ref":"refs/heads/specdec_v0.1.2","pushedAt":"2024-02-28T18:51:56.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Fix typo","shortMessageHtmlLink":"Fix typo"}},{"before":"5e3a872d94d8f0e6bbe90a278ae60a16f2c8b675","after":"fccb32a3637b4bed87e89267846dbd9f99617db8","ref":"refs/heads/specdec_v0.3.2","pushedAt":"2024-02-28T18:51:32.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Fix typo","shortMessageHtmlLink":"Fix typo"}},{"before":"5ed46878c2a4602ff41b14dfb1d8f9a46d8e7be0","after":"5e3a872d94d8f0e6bbe90a278ae60a16f2c8b675","ref":"refs/heads/specdec_v0.3.2","pushedAt":"2024-02-28T01:29:59.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Initial support of speculative decoding\n\nCo-authored-by: Jie Wang \n\nFix greedy sampling in speculative decoding\n\nAdd back pre-emption by recompute support\n\nAdd logprobs support for speculative decoding.\n\nFix prompt_logprobs and add stop_str support","shortMessageHtmlLink":"Initial support of speculative decoding"}},{"before":"5fb432ca081aba905c1794214006c7a32864910c","after":"5e3a872d94d8f0e6bbe90a278ae60a16f2c8b675","ref":"refs/heads/specdec_v0.1.2","pushedAt":"2024-02-28T01:29:39.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"},"commit":{"message":"Initial support of speculative decoding\n\nCo-authored-by: Jie Wang \n\nFix greedy sampling in speculative decoding\n\nAdd back pre-emption by recompute support\n\nAdd logprobs support for speculative decoding.\n\nFix prompt_logprobs and add stop_str support","shortMessageHtmlLink":"Initial support of speculative decoding"}},{"before":"0ef59203a8f0c83af862292f42cd96dfa292b3a9","after":"5fb432ca081aba905c1794214006c7a32864910c","ref":"refs/heads/specdec_v0.1.2","pushedAt":"2024-02-28T01:14:32.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"}},{"before":"0ef59203a8f0c83af862292f42cd96dfa292b3a9","after":"5ed46878c2a4602ff41b14dfb1d8f9a46d8e7be0","ref":"refs/heads/specdec_v0.3.2","pushedAt":"2024-02-28T01:14:00.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"}},{"before":"192a132e915f90a228002931e92ac680244cc8fa","after":"0ef59203a8f0c83af862292f42cd96dfa292b3a9","ref":"refs/heads/specdec_v0.3.2","pushedAt":"2024-02-28T01:09:24.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"}},{"before":"06ef60272e790706f6ccce70403e8c34d33e5352","after":"0ef59203a8f0c83af862292f42cd96dfa292b3a9","ref":"refs/heads/specdec_v0.1.2","pushedAt":"2024-02-28T01:08:42.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"}},{"before":"a04f6be781c3c004ae425a759ffc785a6f598d77","after":"06ef60272e790706f6ccce70403e8c34d33e5352","ref":"refs/heads/specdec_v0.1.2","pushedAt":"2024-02-27T22:18:43.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"ymwangg","name":"Yanming W.","path":"/ymwangg","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/19481308?s=80&v=4"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"startCursor":"Y3Vyc29yOnYyOpK7MjAyNC0wNy0zMFQxNzo1Mjo0My4wMDAwMDBazwAAAASNRf_I","endCursor":"Y3Vyc29yOnYyOpK7MjAyNC0wMi0yN1QyMjoxODo0My4wMDAwMDBazwAAAAQHBB3V"}},"title":"Activity ยท ymwangg/vllm"}