{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":640747712,"defaultBranch":"main","name":"MEGABYTE-pytorch","ownerLogin":"lucidrains","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-05-15T03:27:36.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/108653?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1725923287.0","currentOid":""},"activityList":{"items":[{"before":"907b8dcb1a921adf2ac453856c824dab7743f357","after":"e98b62d3da098574b115ead9e50fb2e77cfebf87","ref":"refs/heads/main","pushedAt":"2024-09-09T23:08:05.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"update torch dep to 2.3","shortMessageHtmlLink":"update torch dep to 2.3"}},{"before":"c17dd1e302256627a82767611dec6db355356bee","after":"907b8dcb1a921adf2ac453856c824dab7743f357","ref":"refs/heads/main","pushedAt":"2024-09-09T23:07:34.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"Merge pull request #18 from eegli/update-flash-attention\n\nchore: update flash attention config","shortMessageHtmlLink":"Merge pull request #18 from eegli/update-flash-attention"}},{"before":"501482afa9a35637c1418dea0291faf3835a2961","after":"c17dd1e302256627a82767611dec6db355356bee","ref":"refs/heads/main","pushedAt":"2024-09-07T12:42:29.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"rotary embedding done in full prec","shortMessageHtmlLink":"rotary embedding done in full prec"}},{"before":"d95754cbcf535e37fbad9b66ed35d4cb5d992bcf","after":"501482afa9a35637c1418dea0291faf3835a2961","ref":"refs/heads/main","pushedAt":"2024-09-07T12:09:56.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"address issue with abs pos emb https://github.com/lucidrains/MEGABYTE-pytorch/pull/17","shortMessageHtmlLink":"address issue with abs pos emb #17"}},{"before":"8864b69e47e5f6c7aaed6bcd4e390dc56d2bccae","after":"d95754cbcf535e37fbad9b66ed35d4cb5d992bcf","ref":"refs/heads/main","pushedAt":"2024-05-03T02:13:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"address https://github.com/lucidrains/MEGABYTE-pytorch/issues/13","shortMessageHtmlLink":"address #13"}},{"before":"4066a0c83a31c2414f33778003edd3db2648e13e","after":"8864b69e47e5f6c7aaed6bcd4e390dc56d2bccae","ref":"refs/heads/main","pushedAt":"2023-06-15T20:12:26.596Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"make sure it supports greater than 2 hierarchies","shortMessageHtmlLink":"make sure it supports greater than 2 hierarchies"}},{"before":"810d77a9befcc36018826cfce6ce1a6de73af893","after":"4066a0c83a31c2414f33778003edd3db2648e13e","ref":"refs/heads/main","pushedAt":"2023-06-15T19:38:03.758Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"move closer to what the paper did, with local and global token embeddings not shared","shortMessageHtmlLink":"move closer to what the paper did, with local and global token embedd…"}},{"before":"3eafa96032cb5b1c35c5e805ce118566682a46ef","after":"810d77a9befcc36018826cfce6ce1a6de73af893","ref":"refs/heads/main","pushedAt":"2023-06-15T18:13:40.008Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"switch to rotary embeddings, as they did in the paper","shortMessageHtmlLink":"switch to rotary embeddings, as they did in the paper"}},{"before":"6ac90ea712d5a154d3c58e2683d0033c09dfdf64","after":"3eafa96032cb5b1c35c5e805ce118566682a46ef","ref":"refs/heads/main","pushedAt":"2023-06-14T16:50:27.426Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"evidence is emerging that decoders generate implicit absolute and relative positions without help","shortMessageHtmlLink":"evidence is emerging that decoders generate implicit absolute and rel…"}},{"before":"2889898182ea14bc2ad3e4775994c48a5fcad2ce","after":"6ac90ea712d5a154d3c58e2683d0033c09dfdf64","ref":"refs/heads/main","pushedAt":"2023-05-31T01:01:22.649Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"address https://github.com/lucidrains/MEGABYTE-pytorch/issues/10","shortMessageHtmlLink":"address #10"}},{"before":"93d8a45e88f164474109742aaa27a8462f8e46cc","after":"2889898182ea14bc2ad3e4775994c48a5fcad2ce","ref":"refs/heads/main","pushedAt":"2023-05-29T17:42:03.200Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"learn on the very first start token","shortMessageHtmlLink":"learn on the very first start token"}},{"before":"46d3f147d5f01f038bf8ff526d9a193079e6e5ff","after":null,"ref":"refs/heads/paper-variation","pushedAt":"2023-05-29T16:52:56.248Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"}},{"before":"fe82b1df7185679a80e606ee326657460d0f2f16","after":"93d8a45e88f164474109742aaa27a8462f8e46cc","ref":"refs/heads/main","pushedAt":"2023-05-29T16:52:50.305Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"Merge pull request #9 from lucidrains/paper-variation\n\ncleanup","shortMessageHtmlLink":"Merge pull request #9 from lucidrains/paper-variation"}},{"before":null,"after":"46d3f147d5f01f038bf8ff526d9a193079e6e5ff","ref":"refs/heads/paper-variation","pushedAt":"2023-05-29T16:40:21.742Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"cleanup","shortMessageHtmlLink":"cleanup"}},{"before":"0277167a2bf714478e328c5d6ced6b62be1331a6","after":null,"ref":"refs/heads/paper-variation","pushedAt":"2023-05-29T16:30:36.839Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"}},{"before":"cdfa143e426367da4bb9383b1787477ac0b4d2aa","after":"fe82b1df7185679a80e606ee326657460d0f2f16","ref":"refs/heads/main","pushedAt":"2023-05-29T16:27:22.431Z","pushType":"pr_merge","commitsCount":3,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"Merge pull request #8 from lucidrains/paper-variation\n\nPaper variation","shortMessageHtmlLink":"Merge pull request #8 from lucidrains/paper-variation"}},{"before":"ede6166ddb1e8ea4f7df2c9caa3ce789c893420e","after":"0277167a2bf714478e328c5d6ced6b62be1331a6","ref":"refs/heads/paper-variation","pushedAt":"2023-05-29T16:27:08.132Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"fix and release 0.1.0","shortMessageHtmlLink":"fix and release 0.1.0"}},{"before":"cdfa143e426367da4bb9383b1787477ac0b4d2aa","after":"ede6166ddb1e8ea4f7df2c9caa3ce789c893420e","ref":"refs/heads/paper-variation","pushedAt":"2023-05-29T16:02:34.632Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"the paper did multiple start tokens and also had last hierarchy project and unpixel shuffle a patch which they summed to the entire next patch","shortMessageHtmlLink":"the paper did multiple start tokens and also had last hierarchy proje…"}},{"before":null,"after":"cdfa143e426367da4bb9383b1787477ac0b4d2aa","ref":"refs/heads/paper-variation","pushedAt":"2023-05-29T16:02:02.689Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"add beartype","shortMessageHtmlLink":"add beartype"}},{"before":"4f8ed9ba5589f6464b5f4ecba57b01826e9734d4","after":"cdfa143e426367da4bb9383b1787477ac0b4d2aa","ref":"refs/heads/main","pushedAt":"2023-05-26T17:07:22.767Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"add beartype","shortMessageHtmlLink":"add beartype"}},{"before":"01536da7a8adea92a4af116c7f818dce96484d04","after":"4f8ed9ba5589f6464b5f4ecba57b01826e9734d4","ref":"refs/heads/main","pushedAt":"2023-05-26T16:56:16.398Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"add beartype","shortMessageHtmlLink":"add beartype"}},{"before":"60995d14456ca9c8d3812012259c5a2b21605594","after":"01536da7a8adea92a4af116c7f818dce96484d04","ref":"refs/heads/main","pushedAt":"2023-05-26T16:47:56.079Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"add beartype","shortMessageHtmlLink":"add beartype"}},{"before":"3b29e66ab4ef6b004c19ee3fc13368995e794ba9","after":"60995d14456ca9c8d3812012259c5a2b21605594","ref":"refs/heads/main","pushedAt":"2023-05-26T16:46:27.975Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"allow for smaller model dimensions for the finer hierarchical stages","shortMessageHtmlLink":"allow for smaller model dimensions for the finer hierarchical stages"}},{"before":"768eb9ae3d6477163089c48a6a90462f1779e058","after":"3b29e66ab4ef6b004c19ee3fc13368995e794ba9","ref":"refs/heads/main","pushedAt":"2023-05-26T16:45:56.697Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"allow for smaller model dimensions for the finer hierarchical stages","shortMessageHtmlLink":"allow for smaller model dimensions for the finer hierarchical stages"}},{"before":"2355831b529a53ee83991f7161f804c5bdc578eb","after":"768eb9ae3d6477163089c48a6a90462f1779e058","ref":"refs/heads/main","pushedAt":"2023-05-26T16:45:08.538Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"allow for smaller model dimensions for the finer hierarchical stages","shortMessageHtmlLink":"allow for smaller model dimensions for the finer hierarchical stages"}},{"before":"6a684daa25e15def380baa68278920a7de6b04aa","after":"2355831b529a53ee83991f7161f804c5bdc578eb","ref":"refs/heads/main","pushedAt":"2023-05-17T14:14:25.953Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"add token shift from rwkv","shortMessageHtmlLink":"add token shift from rwkv"}},{"before":"bce8b329036f87c8f3876c951b568054bcdf9566","after":"6a684daa25e15def380baa68278920a7de6b04aa","ref":"refs/heads/main","pushedAt":"2023-05-16T17:31:20.458Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"readme","shortMessageHtmlLink":"readme"}},{"before":"18318dab74883f7b1f2cf6d1d353fb1264213fb1","after":"bce8b329036f87c8f3876c951b568054bcdf9566","ref":"refs/heads/main","pushedAt":"2023-05-16T15:35:57.758Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"always use flash attention","shortMessageHtmlLink":"always use flash attention"}},{"before":"c047f2f59113f3b0702cbb500207ceffc57dc4d7","after":"18318dab74883f7b1f2cf6d1d353fb1264213fb1","ref":"refs/heads/main","pushedAt":"2023-05-16T15:31:23.114Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"demonstrate on enwik8","shortMessageHtmlLink":"demonstrate on enwik8"}},{"before":"4c3ec34def59abde2651689da4d6c358eec2f8c7","after":"c047f2f59113f3b0702cbb500207ceffc57dc4d7","ref":"refs/heads/main","pushedAt":"2023-05-16T00:09:25.371Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"credit assign","shortMessageHtmlLink":"credit assign"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEsXAV-AA","startCursor":null,"endCursor":null}},"title":"Activity · lucidrains/MEGABYTE-pytorch"}