{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":582822129,"defaultBranch":"master","name":"nanoGPT","ownerLogin":"karpathy","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2022-12-28T00:51:12.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/241138?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1674845658.5043619","currentOid":""},"activityList":{"items":[{"before":"a022d02ee2e9624d721ca9dc8031eb7597e9d591","after":"325be85d9be8c81b436728a420e85796c57dba7e","ref":"refs/heads/master","pushedAt":"2024-02-27T17:27:01.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #420 from vinjn/fix-371-enc-is-not-defined\n\nMove enc to gloabal namespace to fix #371","shortMessageHtmlLink":"Merge pull request #420 from vinjn/fix-371-enc-is-not-defined"}},{"before":"f68ac2200df82d59a1b916fb8236b4b8bc68baa7","after":"a022d02ee2e9624d721ca9dc8031eb7597e9d591","ref":"refs/heads/master","pushedAt":"2024-02-27T17:05:44.000Z","pushType":"pr_merge","commitsCount":3,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #429 from adambala/fixes\n\nOpen \"shakespeare\" data in UTF-8 in \"prepare.py\"","shortMessageHtmlLink":"Merge pull request #429 from adambala/fixes"}},{"before":"eba36e84649f3c6d840a93092cb779a260544d08","after":"f68ac2200df82d59a1b916fb8236b4b8bc68baa7","ref":"refs/heads/master","pushedAt":"2024-02-27T16:41:24.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #428 from kjslag/memmap-memory-leak\n\nfix np.memmap memory leak","shortMessageHtmlLink":"Merge pull request #428 from kjslag/memmap-memory-leak"}},{"before":"4eb7a96b077998f28b57938c2f1e511b0d8cab7c","after":"eba36e84649f3c6d840a93092cb779a260544d08","ref":"refs/heads/master","pushedAt":"2023-06-22T15:24:17.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #309 from ho2103/master\n\nFix AssertionError on macOS - need to check CUDA availability for bf16","shortMessageHtmlLink":"Merge pull request #309 from ho2103/master"}},{"before":"41d7014f7d4654af1f7dae35cb267206fcabf41f","after":"4eb7a96b077998f28b57938c2f1e511b0d8cab7c","ref":"refs/heads/master","pushedAt":"2023-06-18T03:26:35.532Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #305 from okuvshynov/fix_osx_dataload\n\nnanogpt: fix multiprocessing in load_dataset on os x","shortMessageHtmlLink":"Merge pull request #305 from okuvshynov/fix_osx_dataload"}},{"before":"7339b904ef0bb8f4dcc88e4d602c04271697279f","after":"41d7014f7d4654af1f7dae35cb267206fcabf41f","ref":"refs/heads/master","pushedAt":"2023-06-17T01:30:03.666Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #301 from okuvshynov/master\n\n[easy] allow multithreading in load_dataset","shortMessageHtmlLink":"Merge pull request #301 from okuvshynov/master"}},{"before":"f08abb45bd2285627d17da16daea14dda7e7253e","after":"7339b904ef0bb8f4dcc88e4d602c04271697279f","ref":"refs/heads/master","pushedAt":"2023-06-14T23:33:10.985Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"use WORLD_SIZE instead of device_count, supports both the case where the number of gpus we train on is smaller than gpus available, and also multinode training may be a bugfix","shortMessageHtmlLink":"use WORLD_SIZE instead of device_count, supports both the case where …"}},{"before":"18ee6b62b669fc3a62c540c13607b3cc0107b51d","after":"f08abb45bd2285627d17da16daea14dda7e7253e","ref":"refs/heads/master","pushedAt":"2023-06-14T23:25:15.466Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #274 from apivovarov/gelu\n\nUse nn.GELU - 1.27x faster training","shortMessageHtmlLink":"Merge pull request #274 from apivovarov/gelu"}},{"before":"ed7887c888270d9b7724556658c1e2bf0e0b628e","after":"18ee6b62b669fc3a62c540c13607b3cc0107b51d","ref":"refs/heads/master","pushedAt":"2023-06-14T22:38:46.046Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #275 from apivovarov/rm_unsqueeze\n\nRemove pos unsqueeze(0)","shortMessageHtmlLink":"Merge pull request #275 from apivovarov/rm_unsqueeze"}},{"before":"8020bb582bcac47269700978759f7e2b739b946e","after":"ed7887c888270d9b7724556658c1e2bf0e0b628e","ref":"refs/heads/master","pushedAt":"2023-06-14T22:36:26.786Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #270 from LaihoE/master\n\nfix np.sum overflows on windows","shortMessageHtmlLink":"Merge pull request #270 from LaihoE/master"}},{"before":"0f06d9b8899f10078b410cc3d1c37634a167eb6d","after":"8020bb582bcac47269700978759f7e2b739b946e","ref":"refs/heads/master","pushedAt":"2023-06-14T22:30:39.217Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #276 from apivovarov/gitign\n\nAdd more files to .gitignore","shortMessageHtmlLink":"Merge pull request #276 from apivovarov/gitign"}},{"before":"cf4835ed6f9b2ed1eae04a57c7ff6bb073bed9f0","after":"0f06d9b8899f10078b410cc3d1c37634a167eb6d","ref":"refs/heads/master","pushedAt":"2023-06-14T22:29:50.876Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #277 from apivovarov/is_bf16_supported\n\nUse bf16 only if supported","shortMessageHtmlLink":"Merge pull request #277 from apivovarov/is_bf16_supported"}},{"before":"7fe4a099ad2a4654f96a51c0736ecf347149c34c","after":"cf4835ed6f9b2ed1eae04a57c7ff6bb073bed9f0","ref":"refs/heads/master","pushedAt":"2023-06-14T22:21:04.850Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #286 from ctjlewis/master\n\ndocs: simplify dependencies installation","shortMessageHtmlLink":"Merge pull request #286 from ctjlewis/master"}},{"before":"196160b849eaed4465310c082db2c9dc7bc11ba9","after":"7fe4a099ad2a4654f96a51c0736ecf347149c34c","ref":"refs/heads/master","pushedAt":"2023-05-06T14:43:57.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"simplify configure_optimizers by a lot","shortMessageHtmlLink":"simplify configure_optimizers by a lot"}},{"before":"21f9bff7e40d0918cd1dcda7373e686b4ec239fa","after":"196160b849eaed4465310c082db2c9dc7bc11ba9","ref":"refs/heads/master","pushedAt":"2023-04-18T03:16:32.000Z","pushType":"pr_merge","commitsCount":3,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #247 from gnobre/macbook-run-instructions\n\nMacbook run instructions","shortMessageHtmlLink":"Merge pull request #247 from gnobre/macbook-run-instructions"}},{"before":"d9f4735f5e09c6faf3cf1f813d61a609e52a24b3","after":"21f9bff7e40d0918cd1dcda7373e686b4ec239fa","ref":"refs/heads/master","pushedAt":"2023-04-18T03:11:25.000Z","pushType":"pr_merge","commitsCount":3,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #225 from otaviogood/grad_accum\n\nFix for gradient_accumulation_steps training slow","shortMessageHtmlLink":"Merge pull request #225 from otaviogood/grad_accum"}},{"before":"b288f4cfb2b50f05d795df351ac12bdb48363c42","after":"d9f4735f5e09c6faf3cf1f813d61a609e52a24b3","ref":"refs/heads/master","pushedAt":"2023-04-13T07:39:41.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #10 from LaihoE/master\n\nbatch file write","shortMessageHtmlLink":"Merge pull request #10 from LaihoE/master"}},{"before":"079df20748cc9fc08bf5715dcb0a0d5ea338b297","after":"b288f4cfb2b50f05d795df351ac12bdb48363c42","ref":"refs/heads/master","pushedAt":"2023-04-13T05:48:37.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #146 from lutzroeder/master\n\nAdd .gitignore","shortMessageHtmlLink":"Merge pull request #146 from lutzroeder/master"}},{"before":"01e48ec1ab8c87a40bbf1495b58e232629d90b88","after":"079df20748cc9fc08bf5715dcb0a0d5ea338b297","ref":"refs/heads/master","pushedAt":"2023-04-13T05:45:01.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #74 from venusatuluri/fix_decode\n\nSmall fix to decode fn in shakespeare_char/prepare.py","shortMessageHtmlLink":"Merge pull request #74 from venusatuluri/fix_decode"}},{"before":"7840a668597e68915aa4415a780ee676cb4d9d1b","after":"01e48ec1ab8c87a40bbf1495b58e232629d90b88","ref":"refs/heads/master","pushedAt":"2023-04-13T05:43:59.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #240 from YassineYousfi/master\n\ndon't dropout in eval mode","shortMessageHtmlLink":"Merge pull request #240 from YassineYousfi/master"}},{"before":"8abe215fbab57162d4b090b2ed652a4109c0ab28","after":"7840a668597e68915aa4415a780ee676cb4d9d1b","ref":"refs/heads/master","pushedAt":"2023-04-13T05:25:18.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #54 from MicroPanda123/luv\n\nGive tqdm some love :)","shortMessageHtmlLink":"Merge pull request #54 from MicroPanda123/luv"}},{"before":"ad62003d7a2ae969d5b457ebd9435334e935abf1","after":"8abe215fbab57162d4b090b2ed652a4109c0ab28","ref":"refs/heads/master","pushedAt":"2023-04-13T05:24:41.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #128 from abrahamsangha/fix-typo\n\nfix typo","shortMessageHtmlLink":"Merge pull request #128 from abrahamsangha/fix-typo"}},{"before":"ea24604b2949494a8864e01bcb90a0f926908be4","after":"ad62003d7a2ae969d5b457ebd9435334e935abf1","ref":"refs/heads/master","pushedAt":"2023-04-13T05:24:06.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #142 from kovkev/patch-1\n\nFix the position of a comma","shortMessageHtmlLink":"Merge pull request #142 from kovkev/patch-1"}},{"before":"8aeea6d9707c9e547a1bcb22f33255c64cb7f065","after":"ea24604b2949494a8864e01bcb90a0f926908be4","ref":"refs/heads/master","pushedAt":"2023-04-13T05:13:01.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #220 from python273/patch-1\n\nFix GPT.crop_block_size when flash attention is available","shortMessageHtmlLink":"Merge pull request #220 from python273/patch-1"}},{"before":"2457471c9c2d94acc698097326c5d555be06923b","after":"8aeea6d9707c9e547a1bcb22f33255c64cb7f065","ref":"refs/heads/master","pushedAt":"2023-04-13T05:12:26.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #224 from SnehalRaj/patch-1\n\nfix small typo","shortMessageHtmlLink":"Merge pull request #224 from SnehalRaj/patch-1"}},{"before":"553f949f46e04a946e5ff2da6e4bb70a221ea1fc","after":"2457471c9c2d94acc698097326c5d555be06923b","ref":"refs/heads/master","pushedAt":"2023-04-13T05:09:42.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #236 from ymurenko/master\n\nfix \"cuda out of memory\" when resuming training","shortMessageHtmlLink":"Merge pull request #236 from ymurenko/master"}},{"before":"a82b33b525ca9855d705656387698e13eb8e8d4b","after":"553f949f46e04a946e5ff2da6e4bb70a221ea1fc","ref":"refs/heads/master","pushedAt":"2023-04-13T04:59:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"fix minor bug where we have to scale the loss to account for gradient accumulation, which sums before backprop. note that this is not a major bug because AdamW is scale invariant. however, this did affect gradient clipping","shortMessageHtmlLink":"fix minor bug where we have to scale the loss to account for gradient…"}},{"before":"0d8fbd11aed59617f65d2bbd14842b4050516128","after":"a82b33b525ca9855d705656387698e13eb8e8d4b","ref":"refs/heads/master","pushedAt":"2023-03-12T20:40:20.728Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"karpathy","name":"Andrej","path":"/karpathy","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/241138?s=80&v=4"},"commit":{"message":"Merge pull request #199 from ChristianOrr/patch-1\n\nbugfix in decode function","shortMessageHtmlLink":"Merge pull request #199 from ChristianOrr/patch-1"}}],"hasNextPage":false,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEBsu6yQA","startCursor":null,"endCursor":null}},"title":"Activity · karpathy/nanoGPT"}