{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":414203752,"defaultBranch":"main","name":"SwissArmyTransformer","ownerLogin":"THUDM","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2021-10-06T12:30:39.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/48590610?v=4","public":true,"private":false,"isOrgOwned":true},"refInfo":{"name":"","listCacheKey":"v0:1706775376.0","currentOid":""},"activityList":{"items":[{"before":"ba49482ec539813e8a59dd9d34ab5ab42429f5d1","after":"ca7999800fa01613ebdd698286e3f7f74ba59b74","ref":"refs/heads/main","pushedAt":"2024-06-12T06:50:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"fix deepspeed_config","shortMessageHtmlLink":"fix deepspeed_config"}},{"before":"563da31c541ad708cdad812a4e1494dff89e72db","after":"ba49482ec539813e8a59dd9d34ab5ab42429f5d1","ref":"refs/heads/main","pushedAt":"2024-05-18T17:09:42.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"wenyihong","name":"Wenyi Hong","path":"/wenyihong","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/48993524?s=80&v=4"},"commit":{"message":"add specific iteration while loading ckpt","shortMessageHtmlLink":"add specific iteration while loading ckpt"}},{"before":"889fdfced30787641a2f5e6451d1f6380ed31df1","after":"563da31c541ad708cdad812a4e1494dff89e72db","ref":"refs/heads/main","pushedAt":"2024-05-15T09:50:32.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"update init","shortMessageHtmlLink":"update init"}},{"before":"1dc7fd4f86d0d3a2fa9d0de9c8abfb3cd2878b55","after":"889fdfced30787641a2f5e6451d1f6380ed31df1","ref":"refs/heads/main","pushedAt":"2024-05-04T15:54:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"update evaclip model","shortMessageHtmlLink":"update evaclip model"}},{"before":"ecc645b018b07848ec07e3c28ce070d09b961c63","after":"1dc7fd4f86d0d3a2fa9d0de9c8abfb3cd2878b55","ref":"refs/heads/main","pushedAt":"2024-04-10T03:41:56.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"fix simple init seed","shortMessageHtmlLink":"fix simple init seed"}},{"before":"2f24192bf50c2b1866cba3f2531f548180340a56","after":"ecc645b018b07848ec07e3c28ce070d09b961c63","ref":"refs/heads/main","pushedAt":"2024-04-08T10:06:20.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"wenyihong","name":"Wenyi Hong","path":"/wenyihong","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/48993524?s=80&v=4"},"commit":{"message":"fix bug: metric log","shortMessageHtmlLink":"fix bug: metric log"}},{"before":"0da9a54cc20e581271410bfbc3be399d3d27f4d7","after":"2f24192bf50c2b1866cba3f2531f548180340a56","ref":"refs/heads/main","pushedAt":"2024-04-07T13:06:34.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"fix no_weight_decay","shortMessageHtmlLink":"fix no_weight_decay"}},{"before":"6b636367f4550c440c64bedb0399588f844b1768","after":"0da9a54cc20e581271410bfbc3be399d3d27f4d7","ref":"refs/heads/main","pushedAt":"2024-04-03T10:25:19.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"wenyihong","name":"Wenyi Hong","path":"/wenyihong","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/48993524?s=80&v=4"},"commit":{"message":"fix bug: metric report datatype","shortMessageHtmlLink":"fix bug: metric report datatype"}},{"before":"cd37f85fea7bd8e9dd29f670fd468f4dc0569b84","after":"6b636367f4550c440c64bedb0399588f844b1768","ref":"refs/heads/main","pushedAt":"2024-04-03T08:47:17.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"fix metric report","shortMessageHtmlLink":"fix metric report"}},{"before":"3f285cc17fd3717cf031d691f0c120ee79483aae","after":"cd37f85fea7bd8e9dd29f670fd468f4dc0569b84","ref":"refs/heads/main","pushedAt":"2024-04-03T06:57:12.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"fix metric report","shortMessageHtmlLink":"fix metric report"}},{"before":"d88c41adc43f31fdbc01de05a00561db4be37cee","after":"3f285cc17fd3717cf031d691f0c120ee79483aae","ref":"refs/heads/main","pushedAt":"2024-04-03T06:35:47.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"update metric report","shortMessageHtmlLink":"update metric report"}},{"before":"2c6edb41c531fb25a5e8f128b2c1a85b9342070e","after":"d88c41adc43f31fdbc01de05a00561db4be37cee","ref":"refs/heads/main","pushedAt":"2024-03-26T08:29:27.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"fix bug","shortMessageHtmlLink":"fix bug"}},{"before":"d96b271cf9bf1624a1f717594752d17b35806465","after":"2c6edb41c531fb25a5e8f128b2c1a85b9342070e","ref":"refs/heads/main","pushedAt":"2024-03-26T08:13:54.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"Merge branch 'main' of https://github.com/THUDM/SwissArmyTransformer","shortMessageHtmlLink":"Merge branch 'main' of https://github.com/THUDM/SwissArmyTransformer"}},{"before":"7f93d5c60085d1364554abd70d9e8b08615c9237","after":"d96b271cf9bf1624a1f717594752d17b35806465","ref":"refs/heads/main","pushedAt":"2024-03-22T16:53:24.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"yzy-thu","name":"yangzy_thu","path":"/yzy-thu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34501231?s=80&v=4"},"commit":{"message":"fix wandb bug","shortMessageHtmlLink":"fix wandb bug"}},{"before":"13c8f12324cac92ef8f60aad9e3c17262eda531e","after":"7f93d5c60085d1364554abd70d9e8b08615c9237","ref":"refs/heads/main","pushedAt":"2024-03-22T10:06:51.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"yzy-thu","name":"yangzy_thu","path":"/yzy-thu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34501231?s=80&v=4"},"commit":{"message":"fix wandb bug","shortMessageHtmlLink":"fix wandb bug"}},{"before":"2504032c170e6fffc56f78738df9474a1ea10941","after":"13c8f12324cac92ef8f60aad9e3c17262eda531e","ref":"refs/heads/main","pushedAt":"2024-03-15T14:31:53.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"yzy-thu","name":"yangzy_thu","path":"/yzy-thu","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/34501231?s=80&v=4"},"commit":{"message":"wandb support","shortMessageHtmlLink":"wandb support"}},{"before":"43a88b9ca11bcb63bec579c0091455e392a335fa","after":"2504032c170e6fffc56f78738df9474a1ea10941","ref":"refs/heads/main","pushedAt":"2024-03-14T07:34:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"fix data parallel wds seed","shortMessageHtmlLink":"fix data parallel wds seed"}},{"before":"dc2ad0214960cc49ffe5b01fe03365ffaf8792ec","after":"43a88b9ca11bcb63bec579c0091455e392a335fa","ref":"refs/heads/main","pushedAt":"2024-03-08T03:43:55.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"update data parallel","shortMessageHtmlLink":"update data parallel"}},{"before":"17e9b0607bb51bddd563c43a01124e347e49ce65","after":"dc2ad0214960cc49ffe5b01fe03365ffaf8792ec","ref":"refs/heads/main","pushedAt":"2024-02-29T06:11:44.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"global random seed","shortMessageHtmlLink":"global random seed"}},{"before":"99b020204f6fd722a52fd7243a0164c65f7f148d","after":"17e9b0607bb51bddd563c43a01124e347e49ce65","ref":"refs/heads/main","pushedAt":"2024-02-29T03:19:28.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"fix random seed","shortMessageHtmlLink":"fix random seed"}},{"before":"e1d846a7198410046311f549a83308bbc8ee7d75","after":"99b020204f6fd722a52fd7243a0164c65f7f148d","ref":"refs/heads/main","pushedAt":"2024-02-22T09:21:51.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"fix attn dropout","shortMessageHtmlLink":"fix attn dropout"}},{"before":"eb4fac918cc86b304840872d4dccaaaf1b477e37","after":"e1d846a7198410046311f549a83308bbc8ee7d75","ref":"refs/heads/main","pushedAt":"2024-02-22T06:45:29.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"add model_parallel_group option to split","shortMessageHtmlLink":"add model_parallel_group option to split"}},{"before":"4fa5eef487d7b31e9cb3d7e2e5160cde4d5e28b4","after":"eb4fac918cc86b304840872d4dccaaaf1b477e37","ref":"refs/heads/main","pushedAt":"2024-02-02T02:19:09.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"fix comma","shortMessageHtmlLink":"fix comma"}},{"before":"efac308cdacc96200c95f4c3429f9a029761c169","after":"4fa5eef487d7b31e9cb3d7e2e5160cde4d5e28b4","ref":"refs/heads/main","pushedAt":"2024-02-01T09:25:25.000Z","pushType":"pr_merge","commitsCount":3,"pusher":{"login":"Sleepychord","name":"Sleepy_chord","path":"/Sleepychord","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/9153807?s=80&v=4"},"commit":{"message":"Merge pull request #166 from THUDM/MoE\n\nMoE support","shortMessageHtmlLink":"Merge pull request #166 from THUDM/MoE"}},{"before":"61685a39c4ef3e9123e4a8900cf258b59f759330","after":"51062d4fbac76182da56d57aa0f4e3d72b6ad67f","ref":"refs/heads/MoE","pushedAt":"2024-02-01T08:29:07.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"fix little bug","shortMessageHtmlLink":"fix little bug"}},{"before":null,"after":"61685a39c4ef3e9123e4a8900cf258b59f759330","ref":"refs/heads/MoE","pushedAt":"2024-02-01T08:16:16.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"support MoE & Mixtral-8x7B","shortMessageHtmlLink":"support MoE & Mixtral-8x7B"}},{"before":"015743bf24bb3f352f308ad4618012bcc0889ce4","after":"28ac7de19d0fa0734ec47c0a5775c97b8881e41a","ref":"refs/heads/moe","pushedAt":"2024-02-01T08:10:05.000Z","pushType":"push","commitsCount":58,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"update moe","shortMessageHtmlLink":"update moe"}},{"before":"72ced3f56386e63582e8254955a27188e32440d2","after":"efac308cdacc96200c95f4c3429f9a029761c169","ref":"refs/heads/main","pushedAt":"2024-01-29T07:27:28.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"1049451037","name":"Qingsong Lv","path":"/1049451037","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/15194939?s=80&v=4"},"commit":{"message":"Merge pull request #165 from THUDM/fix-rotary-bug\n\nfix rotary bug when q seqlen > cos seqlen","shortMessageHtmlLink":"Merge pull request #165 from THUDM/fix-rotary-bug"}},{"before":"72ced3f56386e63582e8254955a27188e32440d2","after":"cc087ed50937bc4dceb2eb86a3b260ddb1391dbf","ref":"refs/heads/fix-rotary-bug","pushedAt":"2024-01-29T07:24:47.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"leizhao1234","name":null,"path":"/leizhao1234","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/135012196?s=80&v=4"},"commit":{"message":"fix rotary bug when q seqlen > cos seqlen","shortMessageHtmlLink":"fix rotary bug when q seqlen > cos seqlen"}},{"before":null,"after":"72ced3f56386e63582e8254955a27188e32440d2","ref":"refs/heads/fix-rotary-bug","pushedAt":"2024-01-29T06:59:04.000Z","pushType":"branch_creation","commitsCount":0,"pusher":{"login":"leizhao1234","name":null,"path":"/leizhao1234","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/135012196?s=80&v=4"},"commit":{"message":"update chatglm rotary","shortMessageHtmlLink":"update chatglm rotary"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAAEYvitZgA","startCursor":null,"endCursor":null}},"title":"Activity ยท THUDM/SwissArmyTransformer"}