{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":512834024,"defaultBranch":"main","name":"mttl","ownerLogin":"microsoft","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2022-07-11T16:36:53.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/6154722?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1715282170.0","currentOid":""},"activityList":{"items":[{"before":"0b0d5c1216d42782cbd91382ea8fb04c57aa0399","after":"7dd2037a4f9af9ed9655901b5911eff674d274cc","ref":"refs/heads/zs_code","pushedAt":"2024-05-25T20:02:13.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"shuishen112","name":"Zhan Su","path":"/shuishen112","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10068278?s=80&v=4"},"commit":{"message":"add zero_shot","shortMessageHtmlLink":"add zero_shot"}},{"before":"f70e47df1ec64f47d173523003384b6f8e88d8de","after":"0b0d5c1216d42782cbd91382ea8fb04c57aa0399","ref":"refs/heads/zs_code","pushedAt":"2024-05-23T16:59:11.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"shuishen112","name":"Zhan Su","path":"/shuishen112","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10068278?s=80&v=4"},"commit":{"message":"fix zero_shot","shortMessageHtmlLink":"fix zero_shot"}},{"before":"659a28e5e2d2b013bab14b8c1fa9a8db372aeacf","after":null,"ref":"refs/heads/dependabot/pip/pytorch-lightning-2.0.6","pushedAt":"2024-05-09T19:16:10.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"dependabot[bot]","name":null,"path":"/apps/dependabot","primaryAvatarUrl":"https://avatars.githubusercontent.com/in/29110?s=80&v=4"}},{"before":"d71991df128e052064b3ac9bf707102f254eff17","after":null,"ref":"refs/heads/dependabot/pip/transformers-4.36.0","pushedAt":"2024-05-09T19:14:56.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"dependabot[bot]","name":null,"path":"/apps/dependabot","primaryAvatarUrl":"https://avatars.githubusercontent.com/in/29110?s=80&v=4"}},{"before":"e377c331a332bb88359d3aef8b15949292d14a09","after":null,"ref":"refs/heads/requirements_update","pushedAt":"2024-05-09T19:14:04.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"matheper","name":"Matheus Pereira","path":"/matheper","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/1433862?s=80&v=4"}},{"before":"1ebf884b0b6d98031d1548809a7f919c39f6ac36","after":"d00ff7627e502961a8ad1aee10a16a47f1c63632","ref":"refs/heads/main","pushedAt":"2024-05-09T19:13:55.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"matheper","name":"Matheus Pereira","path":"/matheper","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/1433862?s=80&v=4"},"commit":{"message":"requirements update (#51)","shortMessageHtmlLink":"requirements update (#51)"}},{"before":null,"after":"e377c331a332bb88359d3aef8b15949292d14a09","ref":"refs/heads/requirements_update","pushedAt":"2024-05-09T18:52:15.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"matheper","name":"Matheus Pereira","path":"/matheper","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/1433862?s=80&v=4"},"commit":{"message":"requirements update","shortMessageHtmlLink":"requirements update"}},{"before":"8965e769fdffe61c633cbd8dbc7170915e6da75c","after":"1ebf884b0b6d98031d1548809a7f919c39f6ac36","ref":"refs/heads/main","pushedAt":"2024-05-09T18:38:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"matheper","name":"Matheus Pereira","path":"/matheper","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/1433862?s=80&v=4"},"commit":{"message":"setup-python v5 and cache pip","shortMessageHtmlLink":"setup-python v5 and cache pip"}},{"before":"80ee439b77bdab47bce11de45f4997a4128d3dec","after":null,"ref":"refs/heads/codeql_update","pushedAt":"2024-05-09T18:29:08.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"matheper","name":"Matheus Pereira","path":"/matheper","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/1433862?s=80&v=4"}},{"before":"ce4ca51dbca73be656feb9b3e5233633e3c5dec7","after":"8965e769fdffe61c633cbd8dbc7170915e6da75c","ref":"refs/heads/main","pushedAt":"2024-05-09T18:29:03.000Z","pushType":"pr_merge","commitsCount":1,"pusher":{"login":"matheper","name":"Matheus Pereira","path":"/matheper","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/1433862?s=80&v=4"},"commit":{"message":"Update codeql.yml (#50)\n\n* Update codeql.yml\r\n\r\n* Update tests.yml","shortMessageHtmlLink":"Update codeql.yml (#50)"}},{"before":"bde30d83bf4bbf74cd089ae4c516f1a9b20cfb6c","after":null,"ref":"refs/heads/codeql","pushedAt":"2024-05-09T18:25:12.000Z","pushType":"branch_deletion","commitsCount":0,"pusher":{"login":"matheper","name":"Matheus Pereira","path":"/matheper","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/1433862?s=80&v=4"}},{"before":"499e28acbd3284fd527cb7e43dd566e75aa64e06","after":"80ee439b77bdab47bce11de45f4997a4128d3dec","ref":"refs/heads/codeql_update","pushedAt":"2024-05-09T18:14:05.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"matheper","name":"Matheus Pereira","path":"/matheper","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/1433862?s=80&v=4"},"commit":{"message":"Update tests.yml","shortMessageHtmlLink":"Update tests.yml"}},{"before":null,"after":"499e28acbd3284fd527cb7e43dd566e75aa64e06","ref":"refs/heads/codeql_update","pushedAt":"2024-05-09T17:45:42.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"matheper","name":"Matheus Pereira","path":"/matheper","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/1433862?s=80&v=4"},"commit":{"message":"Update codeql.yml","shortMessageHtmlLink":"Update codeql.yml"}},{"before":null,"after":"bde30d83bf4bbf74cd089ae4c516f1a9b20cfb6c","ref":"refs/heads/codeql","pushedAt":"2024-05-09T17:42:23.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"matheper","name":"Matheus Pereira","path":"/matheper","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/1433862?s=80&v=4"},"commit":{"message":"Update codeql.yml","shortMessageHtmlLink":"Update codeql.yml"}},{"before":"5f6573b6822e59e151b839f05575f1ea08cb7f62","after":"f70e47df1ec64f47d173523003384b6f8e88d8de","ref":"refs/heads/zs_code","pushedAt":"2024-05-09T09:43:36.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"shuishen112","name":"Zhan Su","path":"/shuishen112","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10068278?s=80&v=4"},"commit":{"message":"rewrite dora","shortMessageHtmlLink":"rewrite dora"}},{"before":"8255d617c71c0bd3205ce8b8e222d71194365095","after":"5f6573b6822e59e151b839f05575f1ea08cb7f62","ref":"refs/heads/zs_code","pushedAt":"2024-04-24T16:31:23.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"shuishen112","name":"Zhan Su","path":"/shuishen112","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10068278?s=80&v=4"},"commit":{"message":"add dora","shortMessageHtmlLink":"add dora"}},{"before":"f2a2ae9b1a2aa3bb788a96a1d7f26cfc624d6de2","after":"8255d617c71c0bd3205ce8b8e222d71194365095","ref":"refs/heads/zs_code","pushedAt":"2024-04-01T17:34:18.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"shuishen112","name":"Zhan Su","path":"/shuishen112","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10068278?s=80&v=4"},"commit":{"message":"add draw notebook","shortMessageHtmlLink":"add draw notebook"}},{"before":"3a9d315327411eaf77e91cea9eb149a0758f83f3","after":"f2a2ae9b1a2aa3bb788a96a1d7f26cfc624d6de2","ref":"refs/heads/zs_code","pushedAt":"2024-02-21T19:58:49.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"shuishen112","name":"Zhan Su","path":"/shuishen112","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10068278?s=80&v=4"},"commit":{"message":"did not remove the checkpoint","shortMessageHtmlLink":"did not remove the checkpoint"}},{"before":"4b018a85bbc3393a48e733a45ce92ebfdde5a06a","after":"3a9d315327411eaf77e91cea9eb149a0758f83f3","ref":"refs/heads/zs_code","pushedAt":"2024-02-19T18:03:31.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"shuishen112","name":"Zhan Su","path":"/shuishen112","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/10068278?s=80&v=4"},"commit":{"message":"fix for tensorpoly-I, the order should be used not n_split for tensorpoly-I","shortMessageHtmlLink":"fix for tensorpoly-I, the order should be used not n_split for tensor…"}},{"before":null,"after":"c66b20d69978428e06ea37246b9025204b82381c","ref":"refs/heads/mhr_camera_ready","pushedAt":"2024-02-14T13:47:11.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"matheper","name":"Matheus Pereira","path":"/matheper","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/1433862?s=80&v=4"},"commit":{"message":"MHR camera ready. Squashed commit of the following:\n\ncommit 678ef97debe75712b21798ca57d8b70b31831049\nAuthor: Lucas Page-Caccia \nDate: Thu Oct 19 16:47:48 2023 -0700\n\n make lora like poly\n\ncommit 0024b1d6b92b4875e4f421921989b875355a6843\nAuthor: Lucas Page-Caccia \nDate: Thu Oct 19 16:47:24 2023 -0700\n\n lora pretrain using actual lora\n\ncommit c8b82890834b0073c28d5f96ed09b1a3daeb09f7\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 18 20:49:24 2023 -0700\n\n load from hf for mtl pretraining\n\ncommit 9b9e1baf5ee0ebc9a757c963f440000d0778c7e9\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 18 20:46:11 2023 -0700\n\n support to load from huggingface\n\ncommit 04c8b1c0bf84a7f9daaa6d6438c8eb31d7b5d187\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 18 14:49:36 2023 -0700\n\n configs\n\ncommit 22c9e72f3668489157189c5febc90cc02f19c5eb\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 18 14:49:06 2023 -0700\n\n update config\n\ncommit 0be0c81d5f41b1158d323d3a1dc137703fb040f7\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 18 14:48:19 2023 -0700\n\n cleanup\n\ncommit efb82b24465c6cce299d1fd1610cbb8dea23e360\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 18 14:47:41 2023 -0700\n\n cleanup default strategy\n\ncommit f68217ace6e73efa9ec0683cafbe99e9c1e59146\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 18 14:47:24 2023 -0700\n\n handle formatting or precision in config\n\ncommit 3098f798cd85276474f3546f0faa95e4e98e374a\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 18 14:23:17 2023 -0700\n\n cleanup compute_strategy mess\n\ncommit cac44f1951f1dd9783089a17c91faad8fcb13fd8\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 18 12:35:35 2023 -0700\n\n WANDB default name\n\ncommit cd5d85458a6ef42c24348ffa404839487d5d6707\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 18 08:02:26 2023 -0700\n\n properly log annealing coefficient\n\ncommit 797ffbd8e91d496a348f120260fe7f8c68beb050\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 18 08:02:08 2023 -0700\n\n remove the sadness and sorrow that is `mlflowlogger`.\n\ncommit fafd39833c04d92ab7464b4d5c72dc87706a1345\nAuthor: Lucas Page-Caccia \nDate: Tue Oct 10 07:54:11 2023 -0700\n\n rename prob. container for `AverageSelector`, to avoid size mismatch when loading checkpoint with other selector\n\ncommit 489d210e616e1d0030f770669b2e552a95c53085\nAuthor: Lucas Page-Caccia \nDate: Mon Oct 9 19:25:16 2023 -0700\n\n verbose\n\ncommit f1b1db145c18c61d51b9c1af0ec7c63921b185c9\nAuthor: Lucas Page-Caccia \nDate: Mon Oct 9 18:39:55 2023 -0700\n\n also process zero shot results\n\ncommit 6756dc44d5e8db1a87bca2eef0048037e7371a1b\nAuthor: Lucas Page-Caccia \nDate: Mon Oct 9 13:47:03 2023 -0700\n\n cleanup\n\ncommit a855510b0cddb87ad41c15a0bc15a1900c73658a\nAuthor: Lucas Page-Caccia \nDate: Mon Oct 9 11:18:26 2023 -0700\n\n zero shot scripts for mhr\n\ncommit 2b4cab5cb0f97fba0d56d2a041f6e0f0df1d2cba\nAuthor: Lucas Page-Caccia \nDate: Mon Oct 9 11:09:43 2023 -0700\n\n finetuning* of pretrained model for zeroshot enabling\n\ncommit 463dcba1bd3f08682b3bea0985304bd1a78344d5\nAuthor: Lucas Page-Caccia \nDate: Sun Oct 8 18:23:33 2023 -0700\n\n fixed results processing\n\ncommit 7dc149bb85e771fe46c48404ed1f563b6467628e\nAuthor: Lucas Page-Caccia \nDate: Fri Oct 6 14:11:03 2023 -0700\n\n enable annealing back to uniform during training\n\ncommit 4bae8768c3c66d7933e828447d3d6605522c97f2\nAuthor: Lucas Page-Caccia \nDate: Thu Oct 5 10:22:44 2023 -0700\n\n set precision to `medium` and print arguments\n\ncommit 7965f6af85c3b02237a2c2bd94e6f8803f6d0d0f\nAuthor: Lucas Page-Caccia \nDate: Thu Oct 5 10:20:53 2023 -0700\n\n fetch `finish.pt` if available\n\ncommit d27eb9777a795ddc831153dbe6c901f020b1fdd4\nMerge: d437cb0 e6ddc05\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 4 07:42:07 2023 -0700\n\n Merge branch 'platypus' of github.com:pclucas14/lucas_mttl into platypus\n\ncommit d437cb0b79842774e1c8386e9934cad9b665287d\nAuthor: Lucas Page-Caccia \nDate: Wed Oct 4 07:41:57 2023 -0700\n\n added cache dir to CLM\n\ncommit e6ddc05af043aed0b46a6edb0771d7f7539e592d\nAuthor: Alessandro Sordoni \nDate: Fri Sep 22 10:35:05 2023 -0700\n\n put back \"Now complete the following...\"\n\ncommit 5b9f2f176e0d57622dd9904dd804580031713a9f\nAuthor: oleksost \nDate: Tue Sep 19 00:00:13 2023 +0000\n\n typing\n\ncommit 6bd4f22e7ec47d06cd538c71c8d48841ed9f4339\nAuthor: oleksost \nDate: Mon Sep 18 20:21:21 2023 +0000\n\n downstream eval + experts average eval\n\ncommit 187911da7569c5e1763491db0030f927aa27894a\nAuthor: oleksost \nDate: Mon Sep 18 19:57:47 2023 +0000\n\n switched to LLamaTokenizer from LlamaTokenizerFast\n\ncommit 38de4f4af7eee4762cd06cd30ff6459a39c10650\nAuthor: oleksost \nDate: Mon Sep 18 18:57:16 2023 +0000\n\n remove mini progress\n\ncommit c6d716899499533a6c6a01a12e67c8397213b67f\nAuthor: oleksost \nDate: Mon Sep 18 18:56:41 2023 +0000\n\n gaussian init hp\n\ncommit c44ade9c17c51d75a30617b9e91075cc936ff17d\nMerge: 7e57501 f7b6a5d\nAuthor: Oleksiy Ostapenko \nDate: Mon Sep 18 14:48:57 2023 -0400\n\n Merge pull request #29 from pclucas14/platypus_xr\n\n Platypus xr\n\ncommit f7b6a5d99d5cf8b14f1a828fa8a0eb32b404fdee\nAuthor: oleksost \nDate: Mon Sep 18 18:41:56 2023 +0000\n\n remove sni callback\n\ncommit f2657c6abf95331b8884108d2d4e95faa7620134\nAuthor: oleksost \nDate: Mon Sep 18 18:40:54 2023 +0000\n\n nvm\n\ncommit c6dc601ea96cefe9dc2bcaaf884e455406ebe3fc\nAuthor: oleksost \nDate: Mon Sep 18 18:40:36 2023 +0000\n\n nvm\n\ncommit 4ec807fa435d1421e52ba90c884ffb6e840a9ac7\nAuthor: oleksost \nDate: Mon Sep 18 18:38:38 2023 +0000\n\n formatting\n\ncommit 38df110ec5488aeb14ffa9f3128c0f4e973b8dfb\nAuthor: oleksost \nDate: Mon Sep 18 18:37:51 2023 +0000\n\n removed metrics.json\n\ncommit 0b048e1297929cffda2a647555c28b1da1518aeb\nAuthor: oleksost \nDate: Mon Sep 18 18:35:58 2023 +0000\n\n last comments\n\ncommit 8eb0fc82a5a99ec9f8441b7718a036f0f2a1ac33\nAuthor: oleksost \nDate: Mon Sep 18 18:25:57 2023 +0000\n\n gitignore\n\ncommit a1a6a3e39e0655ae3b496eb35188b07e1c312614\nAuthor: oleksost \nDate: Mon Sep 18 18:16:14 2023 +0000\n\n format\n\ncommit c85139c967228673ef05445ac4539017581ceb27\nAuthor: oleksost \nDate: Mon Sep 18 18:15:40 2023 +0000\n\n typing\n\ncommit e449d7afc579d867281d5a37fe57d0336b374ffd\nAuthor: oleksost \nDate: Mon Sep 18 17:50:03 2023 +0000\n\n formating\n\ncommit f838e0ea6ab6ab070fb5eba6f344c79e4a6f005b\nAuthor: oleksost \nDate: Mon Sep 18 17:46:39 2023 +0000\n\n clean\n\ncommit 18b7f4dc355aede16ad2b5a8ead73a04e33aac6f\nAuthor: oleksost \nDate: Mon Sep 18 17:38:34 2023 +0000\n\n clean\n\ncommit c47149ad4fc34a2a8d53fa6bb481080646d4974f\nAuthor: oleksost \nDate: Mon Sep 18 17:37:48 2023 +0000\n\n LlamaTokenizerFast\n\ncommit fc9ad4433917cbae1d78de2016b3f3551b58214c\nAuthor: oleksost \nDate: Mon Sep 18 17:36:43 2023 +0000\n\n clean\n\ncommit bc0ef84560b46eff8880911c52766cf563716adc\nAuthor: oleksost \nDate: Mon Sep 18 17:34:07 2023 +0000\n\n clean\n\ncommit 2f7adb8159a391ea3420923663ad6736bacfef2d\nMerge: ccf5646 7e57501\nAuthor: oleksost \nDate: Mon Sep 18 17:29:28 2023 +0000\n\n Merge branch 'platypus' into platypus_xr\n\ncommit ccf56465d1ddbff4f029fac10b7cd684c80c7941\nAuthor: oleksost \nDate: Mon Sep 18 17:29:10 2023 +0000\n\n cleaning\n\ncommit 7e57501e33a816a16542b19d27222974cf1a8821\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 10:26:27 2023 -0700\n\n expert training gone\n\ncommit 099087df592d2d69099cb1058aacfe07ac64533d\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 10:26:01 2023 -0700\n\n remove experts-related files\n\ncommit 56ba17d8bf50c879c54b0767ef581a7a0b53a188\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 10:25:22 2023 -0700\n\n remove leaked files\n\ncommit 1c1762f8919edd96b751965eaca26a2338ea6828\nMerge: 6424154 348cf9a\nAuthor: Oleksiy Ostapenko \nDate: Mon Sep 18 13:21:49 2023 -0400\n\n Merge pull request #30 from pclucas14/fix-8bit-aux\n\n Fixes 8 bit auxiliary loss\n\ncommit b4a721a9df961341faf7d9fbd51311a11d4b3d42\nAuthor: oleksost \nDate: Mon Sep 18 17:19:06 2023 +0000\n\n removed dirichlet\n\ncommit 348cf9a84422bd136ca9b0acfbd7f4ff8a70392f\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 13:18:45 2023 -0400\n\n fix\n\ncommit 58fb9cca294e8f22e0164f8a3331277b257486d4\nAuthor: oleksost \nDate: Mon Sep 18 17:12:40 2023 +0000\n\n removed validate model\n\ncommit b833c90a0010b453613453dbd5dc148782e8ad78\nAuthor: oleksost \nDate: Mon Sep 18 17:11:29 2023 +0000\n\n removed gcr related stuff in evals\n\ncommit 37306d612cc6d427cb8a10f192ab96f02a75288c\nAuthor: oleksost \nDate: Mon Sep 18 17:06:51 2023 +0000\n\n delete eval\n\ncommit df6f327ebac1aeb3aea18bafe454d9cf78a0cc5d\nAuthor: oleksost \nDate: Mon Sep 18 16:57:10 2023 +0000\n\n removed eval ni old\n\ncommit 9234b79abecabdcc56c47722699c1140a2ca79e0\nMerge: f47a0c5 6424154\nAuthor: oleksost \nDate: Mon Sep 18 16:52:51 2023 +0000\n\n Merge branch 'platypus' into platypus_xr\n\ncommit f47a0c5d31cb4f1567fada550ed40c9c1ef591d4\nAuthor: oleksost \nDate: Mon Sep 18 16:20:20 2023 +0000\n\n debug\n\ncommit 6424154d20cbc792a01b2c9a723a64a236abec32\nMerge: fec0901 9e581d5\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 12:19:13 2023 -0400\n\n Merge pull request #28 from pclucas14/platypus_enforce_eos\n\n Platypus enforce eos\n\ncommit 9e581d52aac1892a43fd66179ff2dd24463346ab\nMerge: ecf3f57 fec0901\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 12:18:50 2023 -0400\n\n Merge branch 'platypus' into platypus_enforce_eos\n\ncommit ecf3f57506b95ecba8224fef865c33d8c0a6215f\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 12:17:02 2023 -0400\n\n nitpicks\n\ncommit fec0901ef68700f552f7f3d185afe5fd0aa0bdc4\nMerge: d3b583d 542bc36\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 12:09:11 2023 -0400\n\n Merge pull request #25 from pclucas14/platypus_eval_dtype\n\n Dtype for evaluation\n\ncommit 542bc365b1768e94dd62949adb6f7f8f6251d560\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 09:09:00 2023 -0700\n\n remove hp\n\ncommit 79089453b8ac7705a2e6d1274121485988b46e4e\nMerge: c55d6f7 d3b583d\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 09:08:05 2023 -0700\n\n fix merge stuff\n\ncommit d3b583d886d636ecc63c2a6b6ddecb176038139e\nMerge: b3ed9d0 f295e71\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 12:03:41 2023 -0400\n\n Merge pull request #24 from pclucas14/platypus_ni_eval\n\n Debugged evaluation on sni\n\ncommit f295e716d799f225432a4aa4d89171fdc7e5f6f8\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 09:03:33 2023 -0700\n\n last comments\n\ncommit 8292655d4a853ea572da0acd63a207d92f299150\nAuthor: Alessandro Sordoni \nDate: Mon Sep 18 08:57:52 2023 -0700\n\n task names are equal task identifiers\n\ncommit 4d1d5e7d0ac87f3a8c1043e5d32e76cba2faad95\nMerge: 1006e49 b3ed9d0\nAuthor: oleksost \nDate: Thu Sep 14 23:49:39 2023 +0000\n\n Merge branch 'platypus' into platypus_xr\n\ncommit b3ed9d05daf91f59a2b91495ba7ec928c1a8d545\nAuthor: oleksost \nDate: Thu Sep 14 23:48:30 2023 +0000\n\n remove prepare_model_for_int8_training\n\ncommit 122c6651035189baa63e122d5e9663113c44417a\nAuthor: oleksost \nDate: Thu Sep 14 23:07:20 2023 +0000\n\n debugging llama\n\ncommit 1006e4940343c8c310eb4fe2e4cdfb6daa4ea0f1\nAuthor: oleksost \nDate: Thu Sep 14 21:41:26 2023 +0000\n\n per task/category logging\n\ncommit 1b2fb2c58c27db10e4adabb80a7ecaf76d932607\nAuthor: oleksost \nDate: Thu Sep 14 20:25:44 2023 +0000\n\n wip\n\ncommit c55d6f78d8863edfb0da89ec15821f6f0ffa1d97\nAuthor: oleksost \nDate: Thu Sep 14 18:28:33 2023 +0000\n\n debug\n\ncommit 376a8ea549f211027bab7ccf79ec2666aac3985e\nAuthor: oleksost \nDate: Thu Sep 14 18:27:49 2023 +0000\n\n wip\n\ncommit 47bd3418a8c179fa4f05de1488dc1ee01fc8882d\nMerge: c0822e4 0219e94\nAuthor: oleksost \nDate: Thu Sep 14 18:24:34 2023 +0000\n\n Merge branch 'platypus_eval_dtype' into platypus_xr\n\ncommit c0822e413395bf3c73a121c72f98348c86d50666\nAuthor: oleksost \nDate: Thu Sep 14 18:24:06 2023 +0000\n\n wip\n\ncommit 3870c6ccf65593595f0f99bb556c5c69d6d3ba15\nAuthor: oleksost \nDate: Thu Sep 14 18:12:17 2023 +0000\n\n tiny bug with multiprocess environment\n\ncommit 0219e94b0d111f7548874b31a99978ce124a45c1\nAuthor: oleksost \nDate: Thu Sep 14 18:00:04 2023 +0000\n\n to cuda\n\ncommit 838f475afa039d08e5765c2b8781389221cf1ab9\nAuthor: oleksost \nDate: Thu Sep 14 17:59:20 2023 +0000\n\n to cuda\n\ncommit 437e6d30c82cae6a8a6b1125f12a2a6031002f41\nMerge: dadfbbd 71bbf13\nAuthor: oleksost \nDate: Thu Sep 14 17:56:56 2023 +0000\n\n Merge branch 'platypus_eval_dtype' into platypus_xr\n\ncommit 1fad024734571563200a49c3217ec0452cf7c1cc\nAuthor: oleksost \nDate: Thu Sep 14 17:39:14 2023 +0000\n\n enforce eos token\n\ncommit 289ff5bad6e1dbf445f32a0dd852723e43f4777f\nAuthor: oleksost \nDate: Thu Sep 14 15:41:30 2023 +0000\n\n enforce eos if loaded tokenizer does it\n\ncommit 71bbf1350c03ae20fa3290e297ff665109cb8804\nAuthor: oleksost \nDate: Wed Sep 13 21:40:01 2023 +0000\n\n cleaned\n\ncommit dadfbbd4b81352d778b50cfffdd66dbddf85a07f\nAuthor: oleksost \nDate: Wed Sep 13 21:23:53 2023 +0000\n\n wip\n\ncommit 3b7ad02e214ad9e0f68621493bb0c101dc992e27\nAuthor: oleksost \nDate: Wed Sep 13 21:09:34 2023 +0000\n\n load for eval\n\ncommit 2b031d6ef69298927facc9f90f2d883f06ce5fc6\nAuthor: oleksost \nDate: Wed Sep 13 21:06:51 2023 +0000\n\n wip\n\ncommit b3ea2c4cc51fa8722435838877bb3048ff6f9cc0\nAuthor: oleksost \nDate: Wed Sep 13 20:58:47 2023 +0000\n\n wip\n\ncommit 07d14fd0fbce3969e9d728d58b77b82e0a3dec8e\nMerge: 318c22a d941756\nAuthor: oleksost \nDate: Wed Sep 13 19:59:18 2023 +0000\n\n Merge branch 'platypus_vsmear_dirichlet' into platypus_xr\n\ncommit d9417568a25bc823aaad8bde3ac6991d3796d0ed\nAuthor: oleksost \nDate: Wed Sep 13 19:45:25 2023 +0000\n\n variational smear with dirichlet dist\n\ncommit 496ae90f7ddbda120b7bd5f6f2b837bce704fb85\nAuthor: oleksost \nDate: Wed Sep 13 18:22:15 2023 +0000\n\n wip\n\ncommit 52b89c7d29181d5f1054161e2a3764ba00976290\nAuthor: oleksost \nDate: Wed Sep 13 14:00:23 2023 +0000\n\n sep of concerns\n\ncommit 30a445d55ef984c356ffdd7f8484c2aedee3c9ad\nAuthor: oleksost \nDate: Wed Sep 13 13:56:40 2023 +0000\n\n removed unnecessary\n\ncommit 6868210c75b446d6d5ba69e0a6647d4223a8c6ba\nAuthor: oleksost \nDate: Wed Sep 13 13:55:33 2023 +0000\n\n typo\n\ncommit 86cc35671628e17ad10a6d8d56670b2dfb168214\nAuthor: oleksost \nDate: Wed Sep 13 13:53:28 2023 +0000\n\n nvm\n\ncommit 318c22a89c91aa22f663f0d7a94c97decbba70e7\nAuthor: oleksost \nDate: Wed Sep 13 13:52:07 2023 +0000\n\n wip\n\ncommit 168c35573743a3c86982a4ec7727623eb5cea2e5\nMerge: 86f8ef0 b24331f\nAuthor: oleksost \nDate: Wed Sep 13 13:52:00 2023 +0000\n\n Merge branch 'platypus_ni_eval' into platypus_xr\n\ncommit 86f8ef0c809d4fe9af888d8f6fcead3cde1fb73c\nMerge: 07d8154 faff1bb\nAuthor: oleksost \nDate: Wed Sep 13 13:16:08 2023 +0000\n\n Merge branch 'platypus_eval_dtype' into platypus_xr\n\ncommit faff1bb681aceae34c6e19f2e5d034863b65948d\nAuthor: oleksost \nDate: Wed Sep 13 13:15:58 2023 +0000\n\n var name\n\ncommit 07d8154a82de42b67b259fa60fc2f3007e96d79e\nAuthor: oleksost \nDate: Wed Sep 13 13:14:35 2023 +0000\n\n wip\n\ncommit 8ac6429c4c575a6978a205bef9616765c04f4576\nAuthor: oleksost \nDate: Wed Sep 13 13:14:26 2023 +0000\n\n wip\n\ncommit c2f05bc396dffe2b41a84f294931167992f779c7\nMerge: 3b7ceba 0edec10\nAuthor: oleksost \nDate: Wed Sep 13 13:11:31 2023 +0000\n\n Merge branch 'platypus_eval_dtype' into platypus_xr\n\ncommit 0edec10d0c4a6dad249194e11fb38c644bdfae40\nAuthor: oleksost \nDate: Wed Sep 13 13:10:47 2023 +0000\n\n typo\n\ncommit 3b7ceba2d34e0298bf7b2d774118a584bec48c24\nMerge: 18a87a1 11d17c5\nAuthor: oleksost \nDate: Wed Sep 13 13:09:53 2023 +0000\n\n Merge branch 'platypus_eval_dtype' into platypus_xr\n\ncommit 11d17c5b892cdf61f0ac6d3d22898a3758fe871c\nAuthor: oleksost \nDate: Wed Sep 13 13:07:03 2023 +0000\n\n Dtype for evaluation\n\ncommit b24331f7ba811a79c2ccf074c891ef15dd7b2295\nAuthor: oleksost \nDate: Wed Sep 13 12:48:52 2023 +0000\n\n no labels to None in ni_module to not break mhr\n\ncommit 18a87a1e511717d9530391840cbef41e3eb350a5\nAuthor: oleksost \nDate: Wed Sep 13 12:39:41 2023 +0000\n\n wip\n\ncommit 6067f24ab5b380886e3cb5b2a57b613aa3a907d3\nAuthor: oleksost \nDate: Tue Sep 12 16:57:20 2023 +0000\n\n addressed bug with task id and output path\n\ncommit c58f529a2138a38ae3bfa9c1edd39f1a97186052\nAuthor: oleksost \nDate: Tue Sep 12 16:54:41 2023 +0000\n\n wip\n\ncommit 559438d6a183f9c7c8758581ee77a85bf82f81a4\nAuthor: oleksost \nDate: Tue Sep 12 13:52:57 2023 +0000\n\n uncomment line\n\ncommit a722f176143b25c288a71c0cafe7a6afd819566c\nAuthor: oleksost \nDate: Tue Sep 12 13:42:35 2023 +0000\n\n wip\n\ncommit e5fe9a603be91fd686506d3ce1c10a8d4f6d678c\nMerge: c63b7c2 465899f\nAuthor: oleksost \nDate: Tue Sep 12 12:05:54 2023 +0000\n\n Merge branch 'platypus_ni_eval' into platypus_xr\n\ncommit 465899fe3df8e8a2a32f7e7d5dd73a22356720b4\nAuthor: oleksost \nDate: Tue Sep 12 04:41:58 2023 +0000\n\n pet task/cat ni evaluator\n\ncommit c63b7c2fb3747d52853ec2ec4338f9ef02d98889\nAuthor: oleksost \nDate: Mon Sep 11 23:55:07 2023 +0000\n\n wip\n\ncommit b8841f5a306e43d681b4e04a423806ccab3467e6\nAuthor: oleksost \nDate: Mon Sep 11 22:17:12 2023 +0000\n\n to(\"cuda\") but\n\ncommit 9d6c66f26a83da01efd77812bda772530893eff9\nAuthor: oleksost \nDate: Mon Sep 11 22:11:56 2023 +0000\n\n addressed comments\n\ncommit affb59672568e36a5c8a3bd90067513f6bbcec29\nAuthor: oleksost \nDate: Mon Sep 11 20:41:33 2023 +0000\n\n wip\n\ncommit 06bf782d50dd651515cdf0bcbafa48d29240e79e\nAuthor: oleksost \nDate: Mon Sep 11 19:51:52 2023 +0000\n\n wip\n\ncommit 82b63c0aa2472785f9271bedab8354e879cf6338\nMerge: 312eab3 06ef185\nAuthor: oleksost \nDate: Mon Sep 11 18:37:11 2023 +0000\n\n Merge branch 'platypus_ni_eval' into platypus_xr\n\ncommit 06ef1851f137695154c4b11c0dc36efdc1419bab\nAuthor: oleksost \nDate: Mon Sep 11 18:22:26 2023 +0000\n\n removed redundant ni_metrics file\n\ncommit f010742eddf037f396b0a8c5df8e3157f5c34b96\nAuthor: oleksost \nDate: Mon Sep 11 16:55:34 2023 +0000\n\n addressed comments\n\ncommit d40c3317fdb27b2eb9dd6755d2d4dc09eb409db6\nAuthor: oleksost \nDate: Mon Sep 11 16:46:29 2023 +0000\n\n remove force adding eos token\n\ncommit 312eab3c78efb7c06ec0d56ce8ad228380a973c1\nAuthor: oleksost \nDate: Mon Sep 11 15:42:16 2023 +0000\n\n wip\n\ncommit b2eb520510e0ead4a9a2041625e87f2ecb880000\nAuthor: oleksost \nDate: Mon Sep 11 15:41:36 2023 +0000\n\n wip\n\ncommit 75953247273a0799f0e49d5438341105fe1c1e50\nAuthor: oleksost \nDate: Mon Sep 11 15:11:14 2023 +0000\n\n black formatting + removed unnecessary imports\n\ncommit 86d43880345bc12a94a4dce4ca7fc0a2c80280c1\nAuthor: oleksost \nDate: Mon Sep 11 14:53:02 2023 +0000\n\n ni_eval debug\n\ncommit 22ef56cd82d072c1d8b941f1b3fab0de4d5edd77\nAuthor: oleksost \nDate: Mon Sep 11 14:21:43 2023 +0000\n\n ni eval + wip\n\ncommit 9fb9ce5817f2b11b00c0bd820223189833cdb084\nAuthor: oleksost \nDate: Sun Sep 10 14:44:13 2023 +0000\n\n super ni eval debug + reoganize scripts\n\ncommit 66020363cea591ccd87cf538d14f0d7c15713233\nAuthor: oleksost \nDate: Fri Sep 8 22:22:21 2023 +0000\n\n validate llama\n\ncommit f77f85b11d5885be07b582f158fa6cea68640324\nAuthor: oleksost \nDate: Fri Sep 8 22:22:13 2023 +0000\n\n evaluate ni, mmlu\n\ncommit 13055ad8931940cebf4bbabb5664a1c364d55094\nAuthor: oleksost \nDate: Fri Sep 8 17:47:28 2023 +0000\n\n ni evaluator with task description\n\ncommit 2ac1f966e505121f5c4d67b1bfee2cdcc2db0ce8\nAuthor: oleksost \nDate: Fri Sep 8 16:31:42 2023 +0000\n\n save ni generations on disk\n\ncommit c51ff5ffe2b29cbeda58e2635fe498912580dbd9\nMerge: cb48998 a6ca0a3\nAuthor: oleksost \nDate: Fri Sep 8 14:44:43 2023 +0000\n\n Merge branch 'platypus' into platypus_xr\n\ncommit a6ca0a3cb37cf7fe41ae38d092d82cb014086ffa\nAuthor: Alessandro Sordoni \nDate: Fri Sep 8 14:44:05 2023 +0000\n\n max_input_length as option to callbacks\n\ncommit cb489988ad8e19258309d05cf832d2f13aa59ac5\nMerge: 9d223ab c438351\nAuthor: oleksost \nDate: Fri Sep 8 14:42:33 2023 +0000\n\n Merge branch 'platypus' into platypus_xr\n\ncommit 9d223abae13d41dd641fcebbef0a99564c83db57\nAuthor: oleksost \nDate: Fri Sep 8 14:40:05 2023 +0000\n\n wip\n\ncommit 4ba5804a0f2327b86600013e9140e03a72eef295\nAuthor: oleksost \nDate: Thu Sep 7 20:17:45 2023 +0000\n\n softmoe with right padding\n\ncommit 046b23690bddf2601cadbec54c9fa929b82d2948\nMerge: 5c9452f a984050\nAuthor: oleksost \nDate: Thu Sep 7 20:16:25 2023 +0000\n\n Merge branch 'platypus' into platypus_xr\n\ncommit c438351fc03e63827c54f799343cfa4639981823\nMerge: db27133 087f7a9\nAuthor: Alessandro Sordoni \nDate: Thu Sep 7 19:58:48 2023 +0000\n\n Merge remote-tracking branch 'origin/platypus' into wiki-experts\n\ncommit 087f7a9809b5c994984a8610d16304ffe3459112\nAuthor: Alessandro Sordoni \nDate: Thu Sep 7 19:40:52 2023 +0000\n\n collator fix\n\ncommit 5c9452f23a5d69dec7c7fc4bdf3da08e64a23b71\nAuthor: oleksost \nDate: Thu Sep 7 19:31:57 2023 +0000\n\n wip\n\ncommit a984050cab2f4bf676ad64405faa4ffd015fd537\nAuthor: Alessandro Sordoni \nDate: Thu Sep 7 19:30:08 2023 +0000\n\n set padding side for seq2seq too\n\ncommit e12f04844f3d1f444c5bd0a5ea0f9fd7d945daca\nAuthor: Alessandro Sordoni \nDate: Thu Sep 7 19:28:52 2023 +0000\n\n padding side as an option\n\ncommit d53d017195ce63c0e1027ea324a687ee56b0c45c\nMerge: bafbe23 7ec4b32\nAuthor: oleksost \nDate: Thu Sep 7 19:05:35 2023 +0000\n\n Merge branch 'platypus' into platypus_xr\n\ncommit 5eeb501ac4487746c93a7447c8c2f7d350c91e15\nAuthor: Alessandro Sordoni \nDate: Thu Sep 7 18:55:01 2023 +0000\n\n pad right support\n\ncommit db2713371fe4b308dbdc39b64ab9a179e7e14623\nAuthor: Alessandro Sordoni \nDate: Thu Sep 7 16:43:49 2023 +0000\n\n rename\n\ncommit 8eeb0776b7500948b48dfd4fed072b62d319a15d\nMerge: ba3bf5b 7ec4b32\nAuthor: Alessandro Sordoni \nDate: Thu Sep 7 16:43:24 2023 +0000\n\n Merge remote-tracking branch 'origin/platypus' into wiki-experts\n\ncommit 7ec4b327a090681109eae692a9c56162d8ea2c2d\nAuthor: oleksost \nDate: Thu Sep 7 16:37:32 2023 +0000\n\n set float32 matmul precision\n\ncommit bafbe2390a303ab682198861e72175ee32eca0a2\nAuthor: oleksost \nDate: Thu Sep 7 16:34:47 2023 +0000\n\n wip - configs\n\ncommit 217791f64cd381f6d63e853426902b4630609002\nAuthor: oleksost \nDate: Thu Sep 7 16:03:01 2023 +0000\n\n set float matmult precision\n\ncommit ba3bf5b18f26e309adcc5dc9ed456124e60d19ea\nAuthor: Alessandro Sordoni \nDate: Thu Sep 7 15:43:00 2023 +0000\n\n fix right padding, -100 for pad tokens\n\ncommit 11fdac3956e8d3e689b8cab4992921fb71efbce0\nAuthor: oleksost \nDate: Thu Sep 7 13:34:56 2023 +0000\n\n make sure the last token is eos when trunctating\n\ncommit adeaf2ef577648bbd8aeee6feac33de1f1a6e22d\nAuthor: oleksost \nDate: Thu Sep 7 12:34:52 2023 +0000\n\n wip\n\ncommit efad5bce4e615189e2ea4fbd46d62d9cf91da118\nAuthor: Alessandro Sordoni \nDate: Thu Sep 7 03:31:03 2023 +0000\n\n fix task_names\n\ncommit 94eecd443da8a77cc63423d8bb1174802dace24e\nAuthor: Alessandro Sordoni \nDate: Wed Sep 6 22:32:55 2023 +0000\n\n sort task names for repro\n\ncommit d51f19dc2bb21472ff0347f88251844d35440226\nAuthor: Alessandro Sordoni \nDate: Wed Sep 6 22:27:59 2023 +0000\n\n only pad left for generation!\n\ncommit 430562b36f6f43ef8d6370bfdf85f2870ed89d76\nAuthor: Alessandro Sordoni \nDate: Wed Sep 6 22:17:57 2023 +0000\n\n task sampler got right\n\ncommit 5d5460b0c23de42d37c162af34e0270f76f2a373\nAuthor: Alessandro Sordoni \nDate: Wed Sep 6 22:17:29 2023 +0000\n\n remove unused method\n\ncommit 49bb48d087d233831d958d7e5142157d9c6fc5fd\nAuthor: Alessandro Sordoni \nDate: Wed Sep 6 21:03:21 2023 +0000\n\n online eval uses new datamodule\n\ncommit 04d7f077e6ceff89d5a32741138afbb4fe61c77c\nAuthor: Alessandro Sordoni \nDate: Wed Sep 6 04:09:42 2023 +0000\n\n cleanup / sampler\n\ncommit f651501e186b2a2c7b5b61614ae0c93c960b5cd7\nAuthor: Alessandro Sordoni \nDate: Wed Sep 6 04:09:18 2023 +0000\n\n private routing\n\ncommit 58aebfb793a4c81d9fb8db1a18a46b2b771874de\nAuthor: Alessandro Sordoni \nDate: Wed Sep 6 02:13:37 2023 +0000\n\n lm trainer\n\ncommit 31672781cfd457deaf39225472b2fdb4a377b79b\nAuthor: Alessandro Sordoni \nDate: Wed Sep 6 02:13:32 2023 +0000\n\n train experts\n\ncommit 8f0ec5ebeba3b08b9efb0527b5bc9b4db0e59ae9\nAuthor: Alessandro Sordoni \nDate: Wed Sep 6 02:13:14 2023 +0000\n\n mini fix\n\ncommit 8afad0034b4a0258856ace4a453ddb23e17c98b4\nAuthor: oleksost \nDate: Tue Sep 5 21:57:44 2023 +0000\n\n softmoe debug\n\ncommit 956c194c2443888ab70a091073fae5659900ef12\nAuthor: oleksost \nDate: Tue Sep 5 20:37:01 2023 +0000\n\n reproduction runs SI\n\ncommit 7cf9248c863aee642f6ee819e6fce121adcb7b49\nAuthor: oleksost \nDate: Tue Sep 5 19:00:21 2023 +0000\n\n wip\n\ncommit ebe65f4c6b4e529de897b10aac80b99908a34835\nAuthor: oleksost \nDate: Tue Sep 5 18:55:51 2023 +0000\n\n eval ni w subsample\n\ncommit bd2fa3f9a29a8c52c5f0ae98ae2455c1f82a1e7f\nMerge: 1db25b4 d86a7e8\nAuthor: oleksost \nDate: Tue Sep 5 18:52:54 2023 +0000\n\n Merge branch 'platypus' into platypus_vsmear_w_rgulaizer\n\ncommit d86a7e8b21ccc74248c9d45f2e2a5c4dce504074\nAuthor: oleksost \nDate: Tue Sep 5 18:50:45 2023 +0000\n\n selector per layer logging\n\ncommit 94044fb98fe5729c38cb4d541ded32ee9d0e82d3\nAuthor: Alessandro Sordoni \nDate: Tue Sep 5 18:48:26 2023 +0000\n\n skilled modifier\n\ncommit b181d7526b6245978bb52b4d032a8d775538faae\nAuthor: oleksost \nDate: Tue Sep 5 18:45:50 2023 +0000\n\n eval ni w subsample\n\ncommit 4e5496206aec894e8f5c256a01c24e4582c207b1\nAuthor: oleksost \nDate: Tue Sep 5 18:37:47 2023 +0000\n\n ni eval w subsample\n\ncommit 1db25b4cf04e3b5fc15dcad67cda94c3855118b4\nAuthor: oleksost \nDate: Tue Sep 5 18:34:08 2023 +0000\n\n wip\n\ncommit dc809423e6930232cd84545a0367203bcc086b7b\nAuthor: Alessandro Sordoni \nDate: Tue Sep 5 18:25:07 2023 +0000\n\n wikipedia for mmlu\n\ncommit 226d44f8afa6cd30f1ed46d7cbed6acdfdbaba79\nAuthor: oleksost \nDate: Tue Sep 5 18:03:33 2023 +0000\n\n wip\n\ncommit ebdda74e9cfecdeb9a9a81a4b9efd2655f1ef5ad\nMerge: 7da2234 c9bccdf\nAuthor: oleksost \nDate: Tue Sep 5 17:26:34 2023 +0000\n\n Merge branch 'platypus' into platypus_vsmear_w_rgulaizer\n\ncommit c9bccdf8d63a7dc26f3dd573d1fce435b4ab8aa3\nMerge: ce0fade 0429593\nAuthor: oleksost \nDate: Tue Sep 5 17:25:15 2023 +0000\n\n Merge branch 'platypus' of https://github.com/pclucas14/lucas_mttl into platypus\n\ncommit 7da2234531fe7fd28307f63f56240fc605cdc9a4\nAuthor: oleksost \nDate: Tue Sep 5 17:25:03 2023 +0000\n\n xr4\n\ncommit 04295931fc5d0b6728c07a85ee1f3d2310748bc7\nAuthor: Alessandro Sordoni \nDate: Tue Sep 5 17:07:54 2023 +0000\n\n gitignore\n\ncommit 2d0acb6d390d79ab097ce90dc6c6de54e6bea6cb\nAuthor: Alessandro Sordoni \nDate: Tue Sep 5 17:07:31 2023 +0000\n\n remove yaml\n\ncommit 027761405901b760d1377343a25b553f5b9ea4bd\nMerge: 28f1c91 ec74a54\nAuthor: Alessandro Sordoni \nDate: Tue Sep 5 13:04:34 2023 -0400\n\n Merge pull request #23 from pclucas14/platypus-clean-monitors\n\n Platypus clean monitors\n\ncommit a89718b91914da2fdbe63cdbe4e56b1683842835\nAuthor: oleksost \nDate: Tue Sep 5 16:52:03 2023 +0000\n\n per layer selector logging\n\ncommit 2906f5fa34984b2da0f812c732efc0d08385054d\nAuthor: oleksost \nDate: Tue Sep 5 16:48:11 2023 +0000\n\n merging platypus\n\ncommit 688a3d317fa55da9c135c1405ccdf09c5429265d\nMerge: 848100b ce0fade\nAuthor: oleksost \nDate: Tue Sep 5 16:47:44 2023 +0000\n\n Merge branch 'platypus' into platypus_vsmear_w_rgulaizer\n\ncommit ce0fade3a6386054afc5f9bc1164c09997a0f639\nMerge: 28f1c91 ec74a54\nAuthor: oleksost \nDate: Tue Sep 5 16:44:55 2023 +0000\n\n Merge branch 'platypus-clean-monitors-local' into platypus\n\ncommit 28f1c919b9568b83f1103863a6291b4718275bbf\nAuthor: oleksost \nDate: Mon Sep 4 22:45:51 2023 +0000\n\n softmoe\n\ncommit 335fd2f4eea317a5b0aaf43fc4c6ac6a8e782393\nAuthor: oleksost \nDate: Mon Sep 4 22:45:38 2023 +0000\n\n softmoe\n\ncommit ec74a547852c31d5c3ca87fc4120103a44dd4e53\nAuthor: Alessandro Sordoni \nDate: Mon Sep 4 22:07:23 2023 +0000\n\n subsample fix\n\ncommit bb93e9b42341bd8b35c82268997f4b4496edb4cf\nAuthor: Alessandro Sordoni \nDate: Mon Sep 4 22:03:18 2023 +0000\n\n subsample n proportion per task\n\ncommit 7eac27986375bf79c6c636b40281e291ebc690af\nAuthor: Alessandro Sordoni \nDate: Mon Sep 4 19:31:09 2023 +0000\n\n support for train_on_inputs\n\ncommit bff1cf39ffe1c217350c70774d84af758e639916\nAuthor: Alessandro Sordoni \nDate: Mon Sep 4 19:30:55 2023 +0000\n\n sigh\n\ncommit d460edce95ec483648cc72ea4d952a024bac85ad\nAuthor: Alessandro Sordoni \nDate: Mon Sep 4 16:58:06 2023 +0000\n\n fix\n\ncommit 8087975e6590d5cac5d4cc0a898263c1c3c9a377\nAuthor: Alessandro Sordoni \nDate: Mon Sep 4 03:44:04 2023 +0000\n\n switch ni to original data module\n\ncommit 16da6e5f3ca5a994c6aa5f50e1b2b0e1e0096f7a\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 21:31:34 2023 +0000\n\n ni orig data mod supports finetune_task_name\n\ncommit e440999fc5c8129adb8386b673fd1ede21f5ace2\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 21:31:15 2023 +0000\n\n move decode in fn\n\ncommit 06a7e63a9d19158ce9b4bf455eb21a19b25810d0\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 04:14:24 2023 +0000\n\n handle few shot properly in ni\n\ncommit 0f471e7a1821e69d7030934b280c6a8b9acf459b\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 04:13:42 2023 +0000\n\n cut max instances per task only on train/valid for sni, not on test\n\ncommit 35cb8b4d3b4c3d5f4048d5247fad76c5f0bd6d99\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 03:37:26 2023 +0000\n\n subsample\n\ncommit 374795547e132a129fc0a0754f108d0f68d7b5ca\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 03:36:39 2023 +0000\n\n rename to task_to_id\n\ncommit 439a7cf5b74cc92b2c4a2f4d0e716ada88748a02\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 03:36:27 2023 +0000\n\n support for finetune_task_name ...\n\ncommit 5ad7ffa94f3e4c1f08576ae89a786d57fa6ebc94\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 03:36:15 2023 +0000\n\n setup_dataset\n\ncommit 046b49725193436328d80b1acdce5ab958af81af\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 03:34:01 2023 +0000\n\n fix bug in label_smoothed_nll_loss when ignore_index is negative\n\ncommit 223b42c754a8362965df1f304ec3f7a6aba168a9\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 03:17:06 2023 +0000\n\n setup logging for mhr\n\ncommit 80a4fadd65430298d113505263d479520fa6bc76\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 03:05:21 2023 +0000\n\n cleanup\n\ncommit 835751dec0d9da04a619d9787163c09c32aa51f8\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 03:03:47 2023 +0000\n\n train_dir -> data_dir\n\ncommit 8b90ef558690b410eff187ae3e5c877d7ccf539d\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 03:02:55 2023 +0000\n\n rename method\n\ncommit 0e172e89fa655aa32a417cec2944cd076dbdc086\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 02:53:34 2023 +0000\n\n lil bit of cleaning\n\ncommit 02d68eaf6e4430dae72f27d7bf79eaee66a0eeaa\nAuthor: Alessandro Sordoni \nDate: Sun Sep 3 02:37:40 2023 +0000\n\n save stddev\n\ncommit 722ff55d41d3fcbbc6af476fe1adffd945e4328f\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 23:13:38 2023 +0000\n\n monitor modif\n\ncommit 40a194705b3e13f6031ca2b70d5ef84d76f453fd\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 23:11:42 2023 +0000\n\n finish refact\n\ncommit 15e929e5917e0611b9c8c98b9bc830b8f1a3ff23\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 21:49:37 2023 +0000\n\n delimiter\n\ncommit f702a14bcd3c9124b3ba7a319ddb425d435bf1f9\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 21:40:37 2023 +0000\n\n fix var name\n\ncommit 0668100e81f28834fa563328b31b2eecffcf107a\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 21:40:12 2023 +0000\n\n adjust for mean\n\ncommit 8abc1851c08c0e435c79af9515c25277b41fe6b9\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 21:36:03 2023 +0000\n\n setup logging accepts log_dir = None\n\ncommit 9528b39d0b965e60a9d2ecbd1ac769038b0018c7\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 21:34:44 2023 +0000\n\n use mttl logger everywhere\n\ncommit 565638386725b6c7b5871b92a255028e600bf619\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 21:32:03 2023 +0000\n\n task aggregation\n\ncommit 8ebcff37c927ddb15521191b000c9f2d5551b917\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 21:28:00 2023 +0000\n\n mean_stderr\n\ncommit 41ad3805b96d8ddc3286451bc39d83af5e676ad0\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 21:09:59 2023 +0000\n\n dumps->dump\n\ncommit 50efdb0729ee1a523950084cc6778173bdc8c4f5\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 21:02:58 2023 +0000\n\n remove min/max on monitor\n\ncommit 7f44234bd8a1e16135f4b7aee8a1c850b6a9abcc\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 21:00:42 2023 +0000\n\n move model to gpu?\n\ncommit 4278807dbf71e9c816c83c14b0e1dac3b5ea80f9\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 20:55:09 2023 +0000\n\n dist utils only eval on main process\n\ncommit d48458cf0d70eb6c5ecf026a94e3862e5cc32ae4\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 20:40:57 2023 +0000\n\n save all metrics for mmlu/ni\n\ncommit 39437af0a2ce344c48c15b2f325fb250e18003c4\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 20:40:30 2023 +0000\n\n remove metric per task\n\ncommit c53d815db668cf6fd7038ea900734249d84644ae\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 20:23:48 2023 +0000\n\n turn off evals for now\n\ncommit 41f87f5dd195ddfc60c435c20c27a50ce9596bac\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 20:21:03 2023 +0000\n\n just indents\n\ncommit 883ebb1f1e4a897c863ab55275e8bb3acad89db4\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 20:20:41 2023 +0000\n\n mean over aux losses\n\ncommit 80f0ae6ff5489c02779de1b650ac0ce2d7b7298e\nAuthor: Alessandro Sordoni \nDate: Sat Sep 2 00:35:36 2023 +0000\n\n fix ni decoding when not using gpt\n\ncommit a21142824a511544b86972dc90cb985dc751f425\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 20:31:10 2023 +0000\n\n cache inputs for generation into routing infos\n\ncommit 82874cd3e0b33d5d5b49a5ef9b1bb29b7273bf68\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 19:41:52 2023 +0000\n\n clear cache\n\ncommit 7653b4c7bd8386d88ef73fa3748fe71a6c8e1b8a\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 19:13:08 2023 +0000\n\n vsmear fix norm\n\ncommit f303f554b8c988c30918a15b63d9e82491926133\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 19:13:02 2023 +0000\n\n centering for smear helps routing mi\n\ncommit 7a0de493785d66936b4cad4e192a99cb77bb7446\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 17:13:38 2023 +0000\n\n some loggin' for smear\n\ncommit 86c1cf57ae4b9dd3b492f38749ba46ebeb8cd5b2\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 17:06:21 2023 +0000\n\n dino-v2 type centering\n\ncommit 338b554302fb5c0af40f76f18c9617b1041cbedd\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 16:35:12 2023 +0000\n\n smear kl term\n\ncommit 17d60b77dbf74c26815d82c3212b7390eeb6b84c\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 16:33:57 2023 +0000\n\n unused imports\n\ncommit b7c4e2e7d51e6508cfa2805c864feb5b89e0f51e\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 16:31:50 2023 +0000\n\n l2 weight normalization\n\ncommit ee4e250ff84456db87cc290f61cb826439354faf\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 16:21:18 2023 +0000\n\n averager don't start from 0\n\ncommit 70d45361d5dab553229d132e10932dbf70767d18\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 14:55:52 2023 +0000\n\n fix routing info bug\n\ncommit 848100b698796432b593ef4b0525e52376dc574f\nAuthor: oleksost \nDate: Fri Sep 1 14:34:53 2023 +0000\n\n wip\n\ncommit cec30f187f6d3cc1a48fbe0365625cc803f6f065\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 14:27:16 2023 +0000\n\n fix args.tensorboard missing\n\ncommit d6f3345454e5f851acebfa068731bd7c8b7fff06\nMerge: a90d42e d7146cf\nAuthor: oleksost \nDate: Fri Sep 1 13:21:01 2023 +0000\n\n Merge branch 'platypus-clean-monitors' into platypus_vsmear_w_rgulaizer\n\ncommit a90d42eefc2ca76e1d94390e4212a3261f9c85a6\nAuthor: oleksost \nDate: Fri Sep 1 13:17:06 2023 +0000\n\n wip\n\ncommit d7146cf6c214190e2420078b9ee85a1e9ae56fb6\nAuthor: Alessandro Sordoni \nDate: Fri Sep 1 03:33:31 2023 +0000\n\n correct averager\n\ncommit c1d6d824c5773dc3f61df19b1e9a04d0e8d3c4e0\nAuthor: Alessandro Sordoni \nDate: Thu Aug 31 19:36:01 2023 +0000\n\n fix eta\n\ncommit fb59c2cccd41ed1a746833c008fe7cc854a6364e\nAuthor: Alessandro Sordoni \nDate: Thu Aug 31 19:02:01 2023 +0000\n\n remove\n\ncommit 2686f1ea1d7fe473a5d4b48218267fee89f5c237\nAuthor: Alessandro Sordoni \nDate: Thu Aug 31 18:58:00 2023 +0000\n\n back-compatibility\n\ncommit d32e46265a0b3c23ed08b603fc6d49454932e747\nAuthor: Alessandro Sordoni \nDate: Thu Aug 31 18:52:59 2023 +0000\n\n eta\n\ncommit 9f41924aeb3e4de5141342bf19af8abfa4c9348c\nAuthor: Alessandro Sordoni \nDate: Thu Aug 31 16:12:21 2023 +0000\n\n need to clone torch vars\n\ncommit b5fdb00867237a4f8efd6a46c742c8871f614110\nAuthor: Alessandro Sordoni \nDate: Thu Aug 31 15:56:51 2023 +0000\n\n metric sugar\n\ncommit a366fc755e9d88076ce2e9bb2f67b44b95e30232\nAuthor: Alessandro Sordoni \nDate: Thu Aug 31 15:48:44 2023 +0000\n\n min, max, avg agg of dicts\n\ncommit c8f62aeddd0be538f2c3537e19e31d515c59e9ac\nAuthor: Alessandro Sordoni \nDate: Thu Aug 31 15:34:18 2023 +0000\n\n rename fix\n\ncommit fc76c2861630ed9024f1a071eb0fc8c0e091501d\nAuthor: Alessandro Sordoni