{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":683747677,"defaultBranch":"main","name":"speculative-decoding","ownerLogin":"lucidrains","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-08-27T15:22:52.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/108653?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1696436205.0","currentOid":""},"activityList":{"items":[{"before":"457af7e8cdd2370ed2c5640c9ebd70ba7fafa1fa","after":"fc44a585af41b998d80ada8c4ce00a61b098d098","ref":"refs/heads/main","pushedAt":"2023-10-09T20:09:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"cleanup","shortMessageHtmlLink":"cleanup"}},{"before":"8eed2a047a9f42d73e37b04ea786f5001bc12238","after":"457af7e8cdd2370ed2c5640c9ebd70ba7fafa1fa","ref":"refs/heads/main","pushedAt":"2023-10-08T16:28:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"cite medusa, as using the last layer hiddens is exactly what the prophet idea was, save for using a full blown transformer as the medusa head..","shortMessageHtmlLink":"cite medusa, as using the last layer hiddens is exactly what the prop…"}},{"before":"f06caf26d145185a5767741205e4d8c6633c5e32","after":"8eed2a047a9f42d73e37b04ea786f5001bc12238","ref":"refs/heads/main","pushedAt":"2023-10-08T15:57:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"cite similar paper to early exit","shortMessageHtmlLink":"cite similar paper to early exit"}},{"before":"4b77f264f92d38cb2756f5adc12714fbf53b8cbd","after":"f06caf26d145185a5767741205e4d8c6633c5e32","ref":"refs/heads/main","pushedAt":"2023-10-04T23:26:12.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"fix sampling for num leading start tokens > 1 in prophet scheme","shortMessageHtmlLink":"fix sampling for num leading start tokens > 1 in prophet scheme"}},{"before":"5e8b0363ee6aa9565594e01d1e5eebdd23a983f4","after":"4b77f264f92d38cb2756f5adc12714fbf53b8cbd","ref":"refs/heads/main","pushedAt":"2023-10-04T16:16:38.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"generalize to any number of leading start tokens for prophet","shortMessageHtmlLink":"generalize to any number of leading start tokens for prophet"}},{"before":"2315a8a66a7bf56a0b0a06e82fbd6d7b62cb163f","after":"5e8b0363ee6aa9565594e01d1e5eebdd23a983f4","ref":"refs/heads/main","pushedAt":"2023-10-04T15:43:11.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"the extra norm in projecting to prophet model dimensions hurt for some reason","shortMessageHtmlLink":"the extra norm in projecting to prophet model dimensions hurt for som…"}},{"before":"df892633e3f5c882f98f835d9330f10c2f29a658","after":"2315a8a66a7bf56a0b0a06e82fbd6d7b62cb163f","ref":"refs/heads/main","pushedAt":"2023-10-03T15:25:18.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"clip prophet gradients too","shortMessageHtmlLink":"clip prophet gradients too"}},{"before":"45affc09db48075c8a000245f44dbea534997fa5","after":"df892633e3f5c882f98f835d9330f10c2f29a658","ref":"refs/heads/main","pushedAt":"2023-10-03T15:10:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"research management","shortMessageHtmlLink":"research management"}},{"before":"ffc6e0686819bfe9399d6fecd0c2ff4e3747752b","after":"45affc09db48075c8a000245f44dbea534997fa5","ref":"refs/heads/main","pushedAt":"2023-10-03T15:08:47.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"negative control","shortMessageHtmlLink":"negative control"}},{"before":"f4e55c4d240942a565c92664724fa2419f8e8265","after":"ffc6e0686819bfe9399d6fecd0c2ff4e3747752b","ref":"refs/heads/main","pushedAt":"2023-10-03T15:00:48.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"functional","shortMessageHtmlLink":"functional"}},{"before":"46408b036b6f822794bff1465aa838ee27d8bb7c","after":"f4e55c4d240942a565c92664724fa2419f8e8265","ref":"refs/heads/main","pushedAt":"2023-10-03T14:59:50.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"complete speculative sampling with prophet net on cached embeddings idea!","shortMessageHtmlLink":"complete speculative sampling with prophet net on cached embeddings i…"}},{"before":"983573b725b7d3dec77348fc491d61bfe8783585","after":"46408b036b6f822794bff1465aa838ee27d8bb7c","ref":"refs/heads/main","pushedAt":"2023-10-02T18:59:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"credit assignment","shortMessageHtmlLink":"credit assignment"}},{"before":"78fde6f31a2816f10fb43af6f0634287f69d4616","after":"983573b725b7d3dec77348fc491d61bfe8783585","ref":"refs/heads/main","pushedAt":"2023-10-02T17:47:07.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"facepalm","shortMessageHtmlLink":"facepalm"}},{"before":"fd2cc0fe4a965cb9def6bd4b64767a523b34e180","after":"78fde6f31a2816f10fb43af6f0634287f69d4616","ref":"refs/heads/main","pushedAt":"2023-10-02T17:35:56.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"share idea","shortMessageHtmlLink":"share idea"}},{"before":"94002e54cf2ac93e817f93f08ef9fa5f26a958f0","after":"fd2cc0fe4a965cb9def6bd4b64767a523b34e180","ref":"refs/heads/main","pushedAt":"2023-10-02T17:27:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"fix start token and determining input sequence","shortMessageHtmlLink":"fix start token and determining input sequence"}},{"before":"0434d06cf7d88224d0457685c9d6e487606e3c1a","after":"94002e54cf2ac93e817f93f08ef9fa5f26a958f0","ref":"refs/heads/main","pushedAt":"2023-10-02T16:45:36.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"move towards completing what is started","shortMessageHtmlLink":"move towards completing what is started"}},{"before":"43e1543fa2d2942c2da47c131ab651c2db06d522","after":"0434d06cf7d88224d0457685c9d6e487606e3c1a","ref":"refs/heads/main","pushedAt":"2023-10-01T18:22:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"more fixes","shortMessageHtmlLink":"more fixes"}},{"before":"0c45014c28e4dab0bd19872b1488b10f1cad7042","after":"43e1543fa2d2942c2da47c131ab651c2db06d522","ref":"refs/heads/main","pushedAt":"2023-09-26T16:52:32.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"just copy batched spec decoding and make batch early exit strategy work","shortMessageHtmlLink":"just copy batched spec decoding and make batch early exit strategy work"}},{"before":"8e425d480a3ccbdca10467185faec776d139fc68","after":"0c45014c28e4dab0bd19872b1488b10f1cad7042","ref":"refs/heads/main","pushedAt":"2023-09-26T16:50:48.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"just copy batched spec decoding and make batch early exit strategy work","shortMessageHtmlLink":"just copy batched spec decoding and make batch early exit strategy work"}},{"before":"e6ebcdc560ac366d214c1981314ed55c13b15d8d","after":"8e425d480a3ccbdca10467185faec776d139fc68","ref":"refs/heads/main","pushedAt":"2023-09-26T16:24:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"fix early exit spec decoding","shortMessageHtmlLink":"fix early exit spec decoding"}},{"before":"565a426b8f3fc1c0c410e496f9382409dfc893d7","after":"e6ebcdc560ac366d214c1981314ed55c13b15d8d","ref":"refs/heads/main","pushedAt":"2023-09-23T16:15:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"project management","shortMessageHtmlLink":"project management"}},{"before":"ef0467c1528981a8d22d412b2360cc8494a21434","after":"565a426b8f3fc1c0c410e496f9382409dfc893d7","ref":"refs/heads/main","pushedAt":"2023-09-23T16:15:03.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"0.0.10","shortMessageHtmlLink":"0.0.10"}},{"before":"98ae7c9392ed0cb23279a374e08c37abe76c754d","after":"ef0467c1528981a8d22d412b2360cc8494a21434","ref":"refs/heads/main","pushedAt":"2023-09-23T16:14:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"fixed the main offending issue with perf degradation for batched spec decoding. batched spec decoding has the issue that for high variance in spec decoding, you are always bounded by the worst row performance","shortMessageHtmlLink":"fixed the main offending issue with perf degradation for batched spec…"}},{"before":"7f18431c4a4f3c90819e58c6c3138f8ff90aa3c5","after":"98ae7c9392ed0cb23279a374e08c37abe76c754d","ref":"refs/heads/main","pushedAt":"2023-09-23T15:49:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"confirmed that all the right alignment shifting is what is leading to performance degradation for batch > 1","shortMessageHtmlLink":"confirmed that all the right alignment shifting is what is leading to…"}},{"before":"0f26512718cbe02c5e1b02fb1b953c6ba106198b","after":"7f18431c4a4f3c90819e58c6c3138f8ff90aa3c5","ref":"refs/heads/main","pushedAt":"2023-09-23T15:46:30.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"keeping track of 7 dimensions must be peak tensor programming","shortMessageHtmlLink":"keeping track of 7 dimensions must be peak tensor programming"}},{"before":"689d45995829f568b2ac53ea8480a0569443ff14","after":"0f26512718cbe02c5e1b02fb1b953c6ba106198b","ref":"refs/heads/main","pushedAt":"2023-09-22T21:29:37.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"make batched spec decoding work","shortMessageHtmlLink":"make batched spec decoding work"}},{"before":"a011329be1c21ac84cc4d6de9bd24f36e2429241","after":"689d45995829f568b2ac53ea8480a0569443ff14","ref":"refs/heads/main","pushedAt":"2023-09-22T19:21:53.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"necessary setup for batched speculative decoding","shortMessageHtmlLink":"necessary setup for batched speculative decoding"}},{"before":"c18220ac3e8c07b594ed6179f16180c493c26b8d","after":"a011329be1c21ac84cc4d6de9bd24f36e2429241","ref":"refs/heads/main","pushedAt":"2023-09-20T17:04:23.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"idea explained wrong","shortMessageHtmlLink":"idea explained wrong"}},{"before":"2ac580eb9bde327c98fc0206a52a060874894e7f","after":"c18220ac3e8c07b594ed6179f16180c493c26b8d","ref":"refs/heads/main","pushedAt":"2023-09-20T16:39:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"project management","shortMessageHtmlLink":"project management"}},{"before":"24e90c3fe4db84d7ffa7b89a2d972fc2e72a428e","after":"2ac580eb9bde327c98fc0206a52a060874894e7f","ref":"refs/heads/main","pushedAt":"2023-09-20T16:38:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"fix caching in speculative decoding with same model","shortMessageHtmlLink":"fix caching in speculative decoding with same model"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAADkwWAZgA","startCursor":null,"endCursor":null}},"title":"Activity · lucidrains/speculative-decoding"}