{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":584182682,"defaultBranch":"main","name":"language-modeling","ownerLogin":"andstor","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-01-01T18:20:10.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/21249611?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1672597211.145716","currentOid":""},"activityList":{"items":[{"before":"a24b79efe9804c8cbe3097648e8e484513f2425d","after":"fb58a4b95bfd872b179dd5e3c9f7449d02a67767","ref":"refs/heads/main","pushedAt":"2024-05-15T20:00:50.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Add (IA)^3 support","shortMessageHtmlLink":"Add (IA)^3 support"}},{"before":"02b0986ff3ec3aebf3e4dfd13e721be19cbb67e9","after":"a24b79efe9804c8cbe3097648e8e484513f2425d","ref":"refs/heads/main","pushedAt":"2024-05-02T15:03:11.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Fix compute_metrics problem","shortMessageHtmlLink":"Fix compute_metrics problem"}},{"before":"775588cf85c3603f9bab0a4b77d8e2e238965278","after":"02b0986ff3ec3aebf3e4dfd13e721be19cbb67e9","ref":"refs/heads/main","pushedAt":"2024-05-02T11:32:07.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Add scheduler auto total_num_steps to DeepSpeed configs","shortMessageHtmlLink":"Add scheduler auto total_num_steps to DeepSpeed configs"}},{"before":"9adc935d11639cc20bbcf6de15df34217220557a","after":"775588cf85c3603f9bab0a4b77d8e2e238965278","ref":"refs/heads/main","pushedAt":"2024-05-02T10:37:49.000Z","pushType":"force_push","commitsCount":0,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Fix evaluation compatibility with prompt tuning","shortMessageHtmlLink":"Fix evaluation compatibility with prompt tuning"}},{"before":"d9aa248230fd84abd13b02baedfaf731e963eb51","after":"9adc935d11639cc20bbcf6de15df34217220557a","ref":"refs/heads/main","pushedAt":"2024-05-02T10:34:08.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Fix evaluation compatibility with prompt tuning","shortMessageHtmlLink":"Fix evaluation compatibility with prompt tuning"}},{"before":"9e8c32ddd69d9be27b6137e3d008acfc91a1cc60","after":"d9aa248230fd84abd13b02baedfaf731e963eb51","ref":"refs/heads/main","pushedAt":"2024-05-02T00:15:04.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Fix pad_to_multiple_of incompatibility with prompt tuning","shortMessageHtmlLink":"Fix pad_to_multiple_of incompatibility with prompt tuning"}},{"before":"28641cd52a037026c81470fc817d9fe5e8b23997","after":"9e8c32ddd69d9be27b6137e3d008acfc91a1cc60","ref":"refs/heads/main","pushedAt":"2024-05-01T17:39:27.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Fix max input size when using prompt tuning","shortMessageHtmlLink":"Fix max input size when using prompt tuning"}},{"before":"64dca091697e4142acb2245df0f8db688e3b79b8","after":"28641cd52a037026c81470fc817d9fe5e8b23997","ref":"refs/heads/main","pushedAt":"2024-05-01T17:12:20.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Fix DeepSpeed scheduler to linear","shortMessageHtmlLink":"Fix DeepSpeed scheduler to linear"}},{"before":"736886585eb2370df01ed3129c8564978ec5c00e","after":"64dca091697e4142acb2245df0f8db688e3b79b8","ref":"refs/heads/main","pushedAt":"2024-05-01T17:05:02.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Change learning rate scheduler","shortMessageHtmlLink":"Change learning rate scheduler"}},{"before":"422fe1913f5a8190b85be735a8547aa69920148f","after":"736886585eb2370df01ed3129c8564978ec5c00e","ref":"refs/heads/main","pushedAt":"2024-05-01T16:55:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Change learning rate scheduler","shortMessageHtmlLink":"Change learning rate scheduler"}},{"before":"b80887c760407442eb45a01c8fa151b65a52d067","after":"422fe1913f5a8190b85be735a8547aa69920148f","ref":"refs/heads/main","pushedAt":"2024-04-27T18:49:52.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Allow override block_size","shortMessageHtmlLink":"Allow override block_size"}},{"before":"b66440f812e55fc27c5412d0f1f49ca22bf3c841","after":"b80887c760407442eb45a01c8fa151b65a52d067","ref":"refs/heads/main","pushedAt":"2024-03-18T23:28:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"83a07da52f12b80103fbf6940a94a80aa77bef03","after":"b66440f812e55fc27c5412d0f1f49ca22bf3c841","ref":"refs/heads/main","pushedAt":"2024-03-18T23:27:01.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Add seq2seq objective within the causal language modeling paradigm","shortMessageHtmlLink":"Add seq2seq objective within the causal language modeling paradigm"}},{"before":"9654cc651278591fbd1de787cc2f66e4dc8024db","after":"83a07da52f12b80103fbf6940a94a80aa77bef03","ref":"refs/heads/main","pushedAt":"2024-02-25T23:27:06.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Update zero configs","shortMessageHtmlLink":"Update zero configs"}},{"before":"81508f011b9997c3ba4fcf006993759f566bb96b","after":"9654cc651278591fbd1de787cc2f66e4dc8024db","ref":"refs/heads/main","pushedAt":"2024-02-25T22:13:35.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Merge branch 'main' of https://github.com/andstor/language-modeling","shortMessageHtmlLink":"Merge branch 'main' of https://github.com/andstor/language-modeling"}},{"before":"b805107fb8fc73d10ccf4f3c11bcf590d4314d5e","after":"81508f011b9997c3ba4fcf006993759f566bb96b","ref":"refs/heads/main","pushedAt":"2024-02-25T20:49:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Update requirements.txt","shortMessageHtmlLink":"Update requirements.txt"}},{"before":"a8f7f7ca735285ad3f5ff2feb894d3669b6933c6","after":"b805107fb8fc73d10ccf4f3c11bcf590d4314d5e","ref":"refs/heads/main","pushedAt":"2024-02-25T19:49:30.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Update README.md","shortMessageHtmlLink":"Update README.md"}},{"before":"114db5d9c91f41b902be5135b62c5842e99c9b5c","after":"a8f7f7ca735285ad3f5ff2feb894d3669b6933c6","ref":"refs/heads/main","pushedAt":"2024-02-25T19:29:14.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Update zero stage 3 configs","shortMessageHtmlLink":"Update zero stage 3 configs"}},{"before":"32309b64bfa1afcafee23761d2c778bf43e566e5","after":"114db5d9c91f41b902be5135b62c5842e99c9b5c","ref":"refs/heads/main","pushedAt":"2024-02-24T20:37:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Restructure and update repository","shortMessageHtmlLink":"Restructure and update repository"}},{"before":"27ff50d0013df5eae21ddf8cf85637c61122d1ed","after":"32309b64bfa1afcafee23761d2c778bf43e566e5","ref":"refs/heads/main","pushedAt":"2024-01-09T00:58:40.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Add deepspeed zero 2 config","shortMessageHtmlLink":"Add deepspeed zero 2 config"}},{"before":"11b49cf6fd062ba9e8543b8fc9d9a270c2f9d7e9","after":"27ff50d0013df5eae21ddf8cf85637c61122d1ed","ref":"refs/heads/main","pushedAt":"2024-01-05T00:11:50.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"add deepspeed config","shortMessageHtmlLink":"add deepspeed config"}},{"before":"0783d6a818d6e05054395bf4f46650aaf22f9f6d","after":"11b49cf6fd062ba9e8543b8fc9d9a270c2f9d7e9","ref":"refs/heads/main","pushedAt":"2024-01-04T19:56:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"add deepspeed config","shortMessageHtmlLink":"add deepspeed config"}},{"before":"bd0a9caa84d324340b4e92a21cc5f6db99d8ae1c","after":"0783d6a818d6e05054395bf4f46650aaf22f9f6d","ref":"refs/heads/main","pushedAt":"2024-01-02T03:13:11.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Update zero2 config","shortMessageHtmlLink":"Update zero2 config"}},{"before":"51b23904afbdfa742926d2a8c475901a94a83061","after":"bd0a9caa84d324340b4e92a21cc5f6db99d8ae1c","ref":"refs/heads/main","pushedAt":"2024-01-01T17:19:59.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Fix stalled code execution","shortMessageHtmlLink":"Fix stalled code execution"}},{"before":"27dbbcb31ac0a63a224cea1322951f99aa9cab5e","after":"51b23904afbdfa742926d2a8c475901a94a83061","ref":"refs/heads/main","pushedAt":"2024-01-01T16:59:58.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Only log predictions from main process","shortMessageHtmlLink":"Only log predictions from main process"}},{"before":"e991fd776e3b9b49d7ca76ea766993094b83d951","after":"27dbbcb31ac0a63a224cea1322951f99aa9cab5e","ref":"refs/heads/main","pushedAt":"2024-01-01T02:21:27.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Strip whitespace from text_column_names","shortMessageHtmlLink":"Strip whitespace from text_column_names"}},{"before":"f723d18a6624a43a4570f2d4fa5b6889a54a5373","after":"e991fd776e3b9b49d7ca76ea766993094b83d951","ref":"refs/heads/main","pushedAt":"2023-12-31T16:44:33.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Add slurm script","shortMessageHtmlLink":"Add slurm script"}},{"before":"f912ee3ae60488bb5a6fdd6aa34e62f256da326d","after":"f723d18a6624a43a4570f2d4fa5b6889a54a5373","ref":"refs/heads/main","pushedAt":"2023-12-31T15:36:16.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Add LoRA CLM script","shortMessageHtmlLink":"Add LoRA CLM script"}},{"before":"15078cd260ab3c06fb6ed9d408d233bfaa449cfc","after":"f912ee3ae60488bb5a6fdd6aa34e62f256da326d","ref":"refs/heads/main","pushedAt":"2023-11-07T19:14:00.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Update train.slurm","shortMessageHtmlLink":"Update train.slurm"}},{"before":"88333af5b9f46e8ef76092507b8f26df4867cd23","after":"15078cd260ab3c06fb6ed9d408d233bfaa449cfc","ref":"refs/heads/main","pushedAt":"2023-11-07T14:27:29.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"andstor","name":"André Storhaug","path":"/andstor","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/21249611?s=80&v=4"},"commit":{"message":"Update train.slurm","shortMessageHtmlLink":"Update train.slurm"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAESu8E1gA","startCursor":null,"endCursor":null}},"title":"Activity · andstor/language-modeling"}