{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":674841239,"defaultBranch":"main","name":"soft-moe-pytorch","ownerLogin":"lucidrains","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-08-04T23:46:54.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/108653?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1713972225.0","currentOid":""},"activityList":{"items":[{"before":"e36ce953f85d0b39037b4e9d8016c1519368f2f4","after":"a0d8a4e5481d896da945ebc2c6c800ebf4c7f138","ref":"refs/heads/main","pushedAt":"2024-04-24T15:23:40.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"address https://github.com/lucidrains/soft-moe-pytorch/issues/7","shortMessageHtmlLink":"address #7"}},{"before":"a39d1472f2eb1d5d9dbcefb64fa46fadeafa5a15","after":"e36ce953f85d0b39037b4e9d8016c1519368f2f4","ref":"refs/heads/main","pushedAt":"2024-02-29T15:33:40.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"remove erroneous split by rank backwards","shortMessageHtmlLink":"remove erroneous split by rank backwards"}},{"before":"e1dc178bd7d54c9162b72a1a2c470d7b7c964497","after":"a39d1472f2eb1d5d9dbcefb64fa46fadeafa5a15","ref":"refs/heads/main","pushedAt":"2024-02-18T17:59:46.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"prepare for use in soft-actor-critic value network, given new deepmind paper https://github.com/lucidrains/SAC-pytorch","shortMessageHtmlLink":"prepare for use in soft-actor-critic value network, given new deepmin…"}},{"before":"4dc07b0d7ebc128e330cefc98af171c557b3a143","after":"e1dc178bd7d54c9162b72a1a2c470d7b7c964497","ref":"refs/heads/main","pushedAt":"2024-01-04T14:32:40.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"add option to use layernorm instead of rmsnorm","shortMessageHtmlLink":"add option to use layernorm instead of rmsnorm"}},{"before":"17e4d2c36ff080c2fc5cd5ee277c56e17fe4ae54","after":"4dc07b0d7ebc128e330cefc98af171c557b3a143","ref":"refs/heads/main","pushedAt":"2023-12-18T17:46:59.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"expose an extra flag","shortMessageHtmlLink":"expose an extra flag"}},{"before":"8c3fedbb92e9c98ed6bd6e80a797fa4c2f14b32c","after":"17e4d2c36ff080c2fc5cd5ee277c56e17fe4ae54","ref":"refs/heads/main","pushedAt":"2023-12-14T20:12:41.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"another quick fix","shortMessageHtmlLink":"another quick fix"}},{"before":"0588603367c36644f72a92401143f7758841f599","after":"8c3fedbb92e9c98ed6bd6e80a797fa4c2f14b32c","ref":"refs/heads/main","pushedAt":"2023-12-14T20:03:29.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"add a contiguous, thanks to @conceptofmind","shortMessageHtmlLink":"add a contiguous, thanks to @conceptofmind"}},{"before":"cdefb4388fd594de94820dc6087b832b260bd40a","after":"0588603367c36644f72a92401143f7758841f599","ref":"refs/heads/main","pushedAt":"2023-09-21T15:51:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"add ability to noise gates and anneal noise","shortMessageHtmlLink":"add ability to noise gates and anneal noise"}},{"before":"fb138b124bb68baff7af5c375d703a096e462458","after":"cdefb4388fd594de94820dc6087b832b260bd40a","ref":"refs/heads/main","pushedAt":"2023-09-10T20:15:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"just port over some logic from st moe","shortMessageHtmlLink":"just port over some logic from st moe"}},{"before":"55c4a7b93f0170c25259494d3e7a16eaedff314c","after":"fb138b124bb68baff7af5c375d703a096e462458","ref":"refs/heads/main","pushedAt":"2023-09-10T17:00:02.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"quick fix","shortMessageHtmlLink":"quick fix"}},{"before":"9811bfbaf0144a5d75e80737ea2942cc922e2eb3","after":"55c4a7b93f0170c25259494d3e7a16eaedff314c","ref":"refs/heads/main","pushedAt":"2023-09-09T17:20:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"project management","shortMessageHtmlLink":"project management"}},{"before":"347f8ef316a3f3689f408650ab44d824a17b59de","after":"9811bfbaf0144a5d75e80737ea2942cc922e2eb3","ref":"refs/heads/main","pushedAt":"2023-09-09T16:57:16.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"remove wip, project management","shortMessageHtmlLink":"remove wip, project management"}},{"before":"a3c801d5af31a64990c7583cae59050b632fa375","after":"347f8ef316a3f3689f408650ab44d824a17b59de","ref":"refs/heads/main","pushedAt":"2023-09-09T15:54:40.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"naive distributed code","shortMessageHtmlLink":"naive distributed code"}},{"before":"6d547e5d7f67ee554aba12e5c5c4af734a1cb5de","after":"a3c801d5af31a64990c7583cae59050b632fa375","ref":"refs/heads/main","pushedAt":"2023-09-09T15:53:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"move all experts to cpu besides those that the machine is responsible for","shortMessageHtmlLink":"move all experts to cpu besides those that the machine is responsible…"}},{"before":"e80947ba08124ea53e85903ce84ab90c623d9c85","after":"6d547e5d7f67ee554aba12e5c5c4af734a1cb5de","ref":"refs/heads/main","pushedAt":"2023-08-16T15:26:53.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"thoughts","shortMessageHtmlLink":"thoughts"}},{"before":"3af90867d33524205783fb70beae2b76a3004598","after":"e80947ba08124ea53e85903ce84ab90c623d9c85","ref":"refs/heads/main","pushedAt":"2023-08-15T23:01:07.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"for dynamic slots, need to mask out slots too, in the case of variable lengthed sequences","shortMessageHtmlLink":"for dynamic slots, need to mask out slots too, in the case of variabl…"}},{"before":"05c1689369e19529b9fbc10aef08123e16430a31","after":"3af90867d33524205783fb70beae2b76a3004598","ref":"refs/heads/main","pushedAt":"2023-08-15T18:33:50.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"credit assignment","shortMessageHtmlLink":"credit assignment"}},{"before":"c32ed28f0eaf69a74dccde483fafc595d3d1eaae","after":"05c1689369e19529b9fbc10aef08123e16430a31","ref":"refs/heads/main","pushedAt":"2023-08-15T18:31:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"improvise a variant that calculate dynamic number of slots","shortMessageHtmlLink":"improvise a variant that calculate dynamic number of slots"}},{"before":"a505e509c745270f4996aa2a317856bd7c69abe1","after":"c32ed28f0eaf69a74dccde483fafc595d3d1eaae","ref":"refs/heads/main","pushedAt":"2023-08-14T03:46:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"account for key-padding mask","shortMessageHtmlLink":"account for key-padding mask"}},{"before":"2dbae8ac134ee49afeb1723aa0998d8395912544","after":"a505e509c745270f4996aa2a317856bd7c69abe1","ref":"refs/heads/main","pushedAt":"2023-08-11T21:38:02.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"0.0.3","shortMessageHtmlLink":"0.0.3"}},{"before":"66966beb26c154bb131beb46f177db9424d9c989","after":"2dbae8ac134ee49afeb1723aa0998d8395912544","ref":"refs/heads/main","pushedAt":"2023-08-11T16:14:24.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"research management","shortMessageHtmlLink":"research management"}},{"before":"9f712b892b8cf1d500ff7acd9ab5ffa073e3c91a","after":"66966beb26c154bb131beb46f177db9424d9c989","ref":"refs/heads/main","pushedAt":"2023-08-10T21:55:22.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"accept image fmaps","shortMessageHtmlLink":"accept image fmaps"}},{"before":"6a243048aa62e5c9157c7478bb6134aa89261de8","after":"9f712b892b8cf1d500ff7acd9ab5ffa073e3c91a","ref":"refs/heads/main","pushedAt":"2023-08-10T20:33:54.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"readme","shortMessageHtmlLink":"readme"}},{"before":"5268a86f886a58e2300c61a4c504c72dc292dd56","after":"6a243048aa62e5c9157c7478bb6134aa89261de8","ref":"refs/heads/main","pushedAt":"2023-08-10T20:32:21.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"complete the basic idea for soft moe, including the l2norm w/ scale","shortMessageHtmlLink":"complete the basic idea for soft moe, including the l2norm w/ scale"}},{"before":"9313c23028f05132980655e63956855d7c6adbdd","after":"5268a86f886a58e2300c61a4c504c72dc292dd56","ref":"refs/heads/main","pushedAt":"2023-08-10T17:40:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"more scaffold","shortMessageHtmlLink":"more scaffold"}},{"before":"90785e38a5986d9a9f9aec7418236d3f32890176","after":"9313c23028f05132980655e63956855d7c6adbdd","ref":"refs/heads/main","pushedAt":"2023-08-05T15:44:46.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"thoughts","shortMessageHtmlLink":"thoughts"}},{"before":"96e69f98afe0a3a15625afc70c76db2e08d55270","after":"90785e38a5986d9a9f9aec7418236d3f32890176","ref":"refs/heads/main","pushedAt":"2023-08-05T15:44:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"thoughts","shortMessageHtmlLink":"thoughts"}},{"before":"b35b516f004f5b7a4af34e308c21b26096f87ae4","after":"96e69f98afe0a3a15625afc70c76db2e08d55270","ref":"refs/heads/main","pushedAt":"2023-08-05T15:40:21.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"scaffold","shortMessageHtmlLink":"scaffold"}},{"before":null,"after":"b35b516f004f5b7a4af34e308c21b26096f87ae4","ref":"refs/heads/main","pushedAt":"2023-08-04T23:46:54.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"lucidrains","name":"Phil Wang","path":"/lucidrains","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/108653?s=80&v=4"},"commit":{"message":"Initial commit","shortMessageHtmlLink":"Initial commit"}}],"hasNextPage":false,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEOUkBuwA","startCursor":null,"endCursor":null}},"title":"Activity · lucidrains/soft-moe-pytorch"}