{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":757458337,"defaultBranch":"main","name":"ring-attention-pytorch","ownerLogin":"lucidrains","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2024-02-14T14:37:51.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/108653?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1720752853.0","currentOid":""},"activityList":{"items":[{"before":"604803bba91802a95e0731fd6bbe248432fd094c","after":"ebf8ab65747d476f950f97fefcaacc10304de176","ref":"refs/heads/main","pushedAt":"2024-07-12T02:54:07.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"better error messages if triton 3.0 not installed","shortMessageHtmlLink":"better error messages if triton 3.0 not installed"}},{"before":"76266d5220f9fcde06e6765dfe876814ec225734","after":"604803bba91802a95e0731fd6bbe248432fd094c","ref":"refs/heads/main","pushedAt":"2024-07-11T16:17:24.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"better error messages if triton 3.0 not installed","shortMessageHtmlLink":"better error messages if triton 3.0 not installed"}},{"before":"6210e0fcedbc774f1391cd6efd6be601bb9a711c","after":"76266d5220f9fcde06e6765dfe876814ec225734","ref":"refs/heads/main","pushedAt":"2024-07-08T03:27:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"enforce triton nightly","shortMessageHtmlLink":"enforce triton nightly"}},{"before":"243a6e6a4067b6db9a1df29a7b3618ef8520dbe6","after":"6210e0fcedbc774f1391cd6efd6be601bb9a711c","ref":"refs/heads/main","pushedAt":"2024-07-06T17:34:09.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"complete softclamping for ring flash attn cuda","shortMessageHtmlLink":"complete softclamping for ring flash attn cuda"}},{"before":"6eca0925a6bdcf369694d62bf40cc20dc8d2fdc5","after":"243a6e6a4067b6db9a1df29a7b3618ef8520dbe6","ref":"refs/heads/main","pushedAt":"2024-07-06T17:26:02.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"first make sure dv passes for ring_flash_attn_cuda","shortMessageHtmlLink":"first make sure dv passes for ring_flash_attn_cuda"}},{"before":"209591a38217a63a592d8d120abe3d707c386fda","after":"6eca0925a6bdcf369694d62bf40cc20dc8d2fdc5","ref":"refs/heads/main","pushedAt":"2024-07-06T17:10:16.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"make forward pass work for ring_flash_attn_cuda","shortMessageHtmlLink":"make forward pass work for ring_flash_attn_cuda"}},{"before":"44f980134c2ea5fce2273a717cdd246c4d5e165f","after":"209591a38217a63a592d8d120abe3d707c386fda","ref":"refs/heads/main","pushedAt":"2024-07-05T04:50:03.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"redo softclamp backwards pass to line up with how the cuda version may look","shortMessageHtmlLink":"redo softclamp backwards pass to line up with how the cuda version ma…"}},{"before":"ea485d075cb1265de24422f41b8b95974cb3f2d4","after":"44f980134c2ea5fce2273a717cdd246c4d5e165f","ref":"refs/heads/main","pushedAt":"2024-07-05T02:39:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"redo softclamp backwards pass to line up with how the cuda version may look","shortMessageHtmlLink":"redo softclamp backwards pass to line up with how the cuda version ma…"}},{"before":"01962071ac13a1bf35fdca90b1e0bd70c660f313","after":"ea485d075cb1265de24422f41b8b95974cb3f2d4","ref":"refs/heads/main","pushedAt":"2024-07-04T12:42:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"address an issue with rotary https://github.com/lucidrains/ring-attention-pytorch/issues/15","shortMessageHtmlLink":"address an issue with rotary #15"}},{"before":"e46258b39d527b114042e41ee07c65dc4ad26c8a","after":"01962071ac13a1bf35fdca90b1e0bd70c660f313","ref":"refs/heads/main","pushedAt":"2024-07-02T23:54:10.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"first make sure softclamping of qk sim can be carried out with naive ring flash attention","shortMessageHtmlLink":"first make sure softclamping of qk sim can be carried out with naive …"}},{"before":"ef37f92d4971ccc5f26acb1e8453c6f5d52bcfb5","after":"e46258b39d527b114042e41ee07c65dc4ad26c8a","ref":"refs/heads/main","pushedAt":"2024-07-02T23:53:02.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"first make sure softclamping of qk sim can be carried out with naive ring flash attention","shortMessageHtmlLink":"first make sure softclamping of qk sim can be carried out with naive …"}},{"before":"70f147238d0f925ce1204f429bf561ed7730f43b","after":"ef37f92d4971ccc5f26acb1e8453c6f5d52bcfb5","ref":"refs/heads/main","pushedAt":"2024-07-02T22:19:22.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"first make sure softclamping of qk sim can be carried out with naive ring flash attention","shortMessageHtmlLink":"first make sure softclamping of qk sim can be carried out with naive …"}},{"before":"6138cce3454f11ab8852ec190f03730bdfe8ddf7","after":"70f147238d0f925ce1204f429bf561ed7730f43b","ref":"refs/heads/main","pushedAt":"2024-07-02T21:54:02.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"cleanup with future annotations","shortMessageHtmlLink":"cleanup with future annotations"}},{"before":"e745c6d4792401cacc28d2345838aa5bc4718419","after":"6138cce3454f11ab8852ec190f03730bdfe8ddf7","ref":"refs/heads/main","pushedAt":"2024-04-20T15:25:21.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"add support for grouped query attention","shortMessageHtmlLink":"add support for grouped query attention"}},{"before":"8faa05ebbfd2071a064635ec918121c3b05d433d","after":"e745c6d4792401cacc28d2345838aa5bc4718419","ref":"refs/heads/main","pushedAt":"2024-04-20T14:08:02.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"add support for grouped query attention","shortMessageHtmlLink":"add support for grouped query attention"}},{"before":"5fd1e484ec00a5b7842018a6c2b1edcc3ee2058b","after":"8faa05ebbfd2071a064635ec918121c3b05d433d","ref":"refs/heads/main","pushedAt":"2024-04-16T13:55:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"idea","shortMessageHtmlLink":"idea"}},{"before":"aa7be57916aaaa8b7a058c9c52d0c8f9dd4ecee5","after":"5fd1e484ec00a5b7842018a6c2b1edcc3ee2058b","ref":"refs/heads/main","pushedAt":"2024-04-11T17:00:51.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"add beartype decorator to RingRotaryEmbedding","shortMessageHtmlLink":"add beartype decorator to RingRotaryEmbedding"}},{"before":"9cbbb50783171283e4e4275fb71de9afd87e705b","after":"aa7be57916aaaa8b7a058c9c52d0c8f9dd4ecee5","ref":"refs/heads/main","pushedAt":"2024-04-11T14:57:13.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"cleanup","shortMessageHtmlLink":"cleanup"}},{"before":"fba8e150d5cfd711d1358abeef1d8deb927c27d3","after":"9cbbb50783171283e4e4275fb71de9afd87e705b","ref":"refs/heads/main","pushedAt":"2024-04-11T14:53:37.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"relevant essay","shortMessageHtmlLink":"relevant essay"}},{"before":"9f6d8ffdd9e9ecf0df8e608f90710e2efbe91214","after":"fba8e150d5cfd711d1358abeef1d8deb927c27d3","ref":"refs/heads/main","pushedAt":"2024-04-11T14:52:11.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"pithy quote","shortMessageHtmlLink":"pithy quote"}},{"before":"509831ebd98bbd7745f2d1bef7783abb2c0c407b","after":"9f6d8ffdd9e9ecf0df8e608f90710e2efbe91214","ref":"refs/heads/main","pushedAt":"2024-04-11T14:40:43.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"no need to .view(dtype) as kv and dkv are now the same dtype","shortMessageHtmlLink":"no need to .view(dtype) as kv and dkv are now the same dtype"}},{"before":"24e1673cfb9206ee2ec807e735f677f53e965093","after":"509831ebd98bbd7745f2d1bef7783abb2c0c407b","ref":"refs/heads/main","pushedAt":"2024-04-11T03:42:29.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"0.3.19","shortMessageHtmlLink":"0.3.19"}},{"before":"d823c70aae1a06d62b982291a637f4e262393d26","after":"24e1673cfb9206ee2ec807e735f677f53e965093","ref":"refs/heads/main","pushedAt":"2024-04-11T03:27:24.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"may be safe to accumulate dk and dv as same type as k and v in flash cuda kernel backwards, saving some communication costs","shortMessageHtmlLink":"may be safe to accumulate dk and dv as same type as k and v in flash …"}},{"before":"61fa96704c1f90773fbb8b416c95bb788dcfacfd","after":"d823c70aae1a06d62b982291a637f4e262393d26","ref":"refs/heads/main","pushedAt":"2024-04-11T00:47:17.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"just go entirely with triton flash attention forwards and backwards. validate that non-causal key padding works","shortMessageHtmlLink":"just go entirely with triton flash attention forwards and backwards. …"}},{"before":"68237946e26752becfbe46374bbc8e31b82beeb8","after":"61fa96704c1f90773fbb8b416c95bb788dcfacfd","ref":"refs/heads/main","pushedAt":"2024-04-11T00:33:47.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"just go entirely with triton flash attention forwards and backwards. validate that non-causal key padding works","shortMessageHtmlLink":"just go entirely with triton flash attention forwards and backwards. …"}},{"before":"7e81a42eea570fd9cb5d9700fcd66855ebad2c69","after":"68237946e26752becfbe46374bbc8e31b82beeb8","ref":"refs/heads/main","pushedAt":"2024-04-10T19:38:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"cache the preprocess backwards kernel output across the ring reduce","shortMessageHtmlLink":"cache the preprocess backwards kernel output across the ring reduce"}},{"before":"de475758a914a35748eabaeaa9b6b6f2b006ad20","after":"7e81a42eea570fd9cb5d9700fcd66855ebad2c69","ref":"refs/heads/main","pushedAt":"2024-04-10T17:57:20.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"retest triton backwards on runpod","shortMessageHtmlLink":"retest triton backwards on runpod"}},{"before":"b539d13fc1a000f999904a9377c478bef3403641","after":"de475758a914a35748eabaeaa9b6b6f2b006ad20","ref":"refs/heads/main","pushedAt":"2024-04-10T17:48:37.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"more cleanup","shortMessageHtmlLink":"more cleanup"}},{"before":"7ba563e5e0d4fbebe757e56ec3fc0f0b40de992d","after":"b539d13fc1a000f999904a9377c478bef3403641","ref":"refs/heads/main","pushedAt":"2024-04-10T17:31:54.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"cleanup test scripts","shortMessageHtmlLink":"cleanup test scripts"}},{"before":"6f3d631adbec4024d79df54b5ee521b2b58053f8","after":null,"ref":"refs/heads/use-triton-flash-attn-backwards","pushedAt":"2024-04-10T17:29:31.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEfW38GQA","startCursor":null,"endCursor":null}},"title":"Activity · lucidrains/ring-attention-pytorch"}