{"payload":{"feedbackUrl":"https://github.com/orgs/community/discussions/53140","repo":{"id":621409961,"defaultBranch":"main","name":"llama-trl","ownerLogin":"jasonvanf","currentUserCanPush":false,"isFork":false,"isEmpty":false,"createdAt":"2023-03-30T15:50:56.000Z","ownerAvatar":"https://avatars.githubusercontent.com/u/24243477?v=4","public":true,"private":false,"isOrgOwned":false},"refInfo":{"name":"","listCacheKey":"v0:1680191457.3654249","currentOid":""},"activityList":{"items":[{"before":"1b03699d0007fa14aa560558a23f29b9735af6a2","after":"f2807551d1e663698d6f8fb32a2f7866ad986c7a","ref":"refs/heads/main","pushedAt":"2023-05-23T02:28:17.099Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Increase the flexibility of parameters in the training reward model","shortMessageHtmlLink":"Increase the flexibility of parameters in the training reward model"}},{"before":"763725fd83b73686c881cda6d3fd5450ee0f0f45","after":"1b03699d0007fa14aa560558a23f29b9735af6a2","ref":"refs/heads/main","pushedAt":"2023-05-22T09:47:12.189Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Format the model training code for better readability","shortMessageHtmlLink":"Format the model training code for better readability"}},{"before":"397e700a37e7ed7dd30140d5dc9747f5859d41a0","after":"763725fd83b73686c881cda6d3fd5450ee0f0f45","ref":"refs/heads/main","pushedAt":"2023-05-22T08:58:58.853Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Added support for `resume_from_checkpoint`","shortMessageHtmlLink":"Added support for resume_from_checkpoint"}},{"before":"34520d2bff4de2802ab048348a4b7c0988cf768d","after":"397e700a37e7ed7dd30140d5dc9747f5859d41a0","ref":"refs/heads/main","pushedAt":"2023-05-18T15:45:36.201Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Keep the maximum length consistent with 'seq_length' when setting up sft_trainer","shortMessageHtmlLink":"Keep the maximum length consistent with 'seq_length' when setting up …"}},{"before":"8ff411ad61a4eb442758387c6e924ff52ea7309b","after":"34520d2bff4de2802ab048348a4b7c0988cf768d","ref":"refs/heads/main","pushedAt":"2023-05-16T05:28:20.634Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Save model for hf trainer safely","shortMessageHtmlLink":"Save model for hf trainer safely"}},{"before":"138ba724264032c89f80121724e4137c28c80727","after":"8ff411ad61a4eb442758387c6e924ff52ea7309b","ref":"refs/heads/main","pushedAt":"2023-05-16T05:16:52.500Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Specifies the variable for the final checkpoint","shortMessageHtmlLink":"Specifies the variable for the final checkpoint"}},{"before":"ec932d75cdccd4ff2a70bbc4ef3a7a3d4cdca2b4","after":"138ba724264032c89f80121724e4137c28c80727","ref":"refs/heads/main","pushedAt":"2023-05-16T02:45:12.015Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Remove obsolete parameter layer_norm_names","shortMessageHtmlLink":"Remove obsolete parameter layer_norm_names"}},{"before":"68f61bfa2458c3f6c6e3cf3b6f47346c3bb987c9","after":"ec932d75cdccd4ff2a70bbc4ef3a7a3d4cdca2b4","ref":"refs/heads/main","pushedAt":"2023-05-16T02:38:51.583Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Full weight fine-tuning example","shortMessageHtmlLink":"Full weight fine-tuning example"}},{"before":"ea9ee750fe2dcf7ae602db0173f70c55aba3ec0c","after":"68f61bfa2458c3f6c6e3cf3b6f47346c3bb987c9","ref":"refs/heads/main","pushedAt":"2023-05-16T02:38:03.540Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Support full weight fine-tuning with DeepSpeed stage-3 (offload)","shortMessageHtmlLink":"Support full weight fine-tuning with DeepSpeed stage-3 (offload)"}},{"before":"70ab6443af792fee5bcf176f105ef4a952c12d88","after":"ea9ee750fe2dcf7ae602db0173f70c55aba3ec0c","ref":"refs/heads/main","pushedAt":"2023-05-15T08:39:58.030Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Add `warmup_ratio` and `save_total_limit` argument settings","shortMessageHtmlLink":"Add warmup_ratio and save_total_limit argument settings"}},{"before":"9ed21f3ee92001467483f687acc319e803c4f0ef","after":"70ab6443af792fee5bcf176f105ef4a952c12d88","ref":"refs/heads/main","pushedAt":"2023-05-12T08:10:14.922Z","pushType":"push","commitsCount":2,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Fix the final weights save","shortMessageHtmlLink":"Fix the final weights save"}},{"before":"937530c244ca5bc56603e5c29c8a697676ae6254","after":"9ed21f3ee92001467483f687acc319e803c4f0ef","ref":"refs/heads/main","pushedAt":"2023-05-11T15:03:00.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Separate tokenizer setting for decapoda-research","shortMessageHtmlLink":"Separate tokenizer setting for decapoda-research"}},{"before":"5da2e1747afc4aeb7f6370b950e61e5288f37d9c","after":"937530c244ca5bc56603e5c29c8a697676ae6254","ref":"refs/heads/main","pushedAt":"2023-05-10T08:38:05.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Need wandb requirement","shortMessageHtmlLink":"Need wandb requirement"}},{"before":"f6f22e0e5cc09bb435bb3944cbd5a1f83b236c0e","after":"5da2e1747afc4aeb7f6370b950e61e5288f37d9c","ref":"refs/heads/main","pushedAt":"2023-05-10T08:29:37.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Specification the argument action, existing or not existing is the opposite","shortMessageHtmlLink":"Specification the argument action, existing or not existing is the op…"}},{"before":"d1dadc42e785e540b660f3aafa672d2ae2906fd9","after":"f6f22e0e5cc09bb435bb3944cbd5a1f83b236c0e","ref":"refs/heads/main","pushedAt":"2023-05-09T01:49:45.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Add configurations for LoRA","shortMessageHtmlLink":"Add configurations for LoRA"}},{"before":"7d4dba3d1614a07c08387462c865451254c877b1","after":"d1dadc42e785e540b660f3aafa672d2ae2906fd9","ref":"refs/heads/main","pushedAt":"2023-05-06T15:18:27.000Z","pushType":"push","commitsCount":4,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Further supports incorrect LLaMATokenizer class and other AutoTokenizers at the same time.","shortMessageHtmlLink":"Further supports incorrect LLaMATokenizer class and other AutoTokeniz…"}},{"before":"b82c97cef6c1032bd7f17f8470d6ba8ed975f583","after":"7d4dba3d1614a07c08387462c865451254c877b1","ref":"refs/heads/main","pushedAt":"2023-05-06T15:09:40.000Z","pushType":"pr_merge","commitsCount":2,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Merge pull request #1 from dkqkxx/main\n\nfix: AutoTokenizer","shortMessageHtmlLink":"Merge pull request #1 from dkqkxx/main"}},{"before":"4302193719ec93396e17b190b8d3f2ba106b9236","after":"b82c97cef6c1032bd7f17f8470d6ba8ed975f583","ref":"refs/heads/main","pushedAt":"2023-05-06T15:02:15.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Support incorrect LLaMATokenizer class and other AutoTokenizers at the same time. Inspired by pull request #1","shortMessageHtmlLink":"Support incorrect LLaMATokenizer class and other AutoTokenizers at th…"}},{"before":"494e27e8342a9877caab515b39b1a72192151c64","after":"4302193719ec93396e17b190b8d3f2ba106b9236","ref":"refs/heads/main","pushedAt":"2023-05-06T14:36:11.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Change default value of `merge_lora`","shortMessageHtmlLink":"Change default value of merge_lora"}},{"before":"dab52a78027fd1c8b1ab3d5f753cefe9c7ce5f0a","after":"494e27e8342a9877caab515b39b1a72192151c64","ref":"refs/heads/main","pushedAt":"2023-05-06T07:26:21.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Custom `run_name` in training arguments","shortMessageHtmlLink":"Custom run_name in training arguments"}},{"before":"2c3a20e422ae0cd9e74f96a82dfdffc0ca5f50af","after":"dab52a78027fd1c8b1ab3d5f753cefe9c7ce5f0a","ref":"refs/heads/main","pushedAt":"2023-05-04T09:08:54.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Change the default `seq_length` setting","shortMessageHtmlLink":"Change the default seq_length setting"}},{"before":"fc4a72a1ff9e60cdfcee6b3c34a5fbdec24cfba1","after":"2c3a20e422ae0cd9e74f96a82dfdffc0ca5f50af","ref":"refs/heads/main","pushedAt":"2023-05-04T08:52:39.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Downgrade `transformers` to solve the torchrun error","shortMessageHtmlLink":"Downgrade transformers to solve the torchrun error"}},{"before":"484699f729c8b72f7d0d1eb18885bd5c7fcaa6fe","after":"fc4a72a1ff9e60cdfcee6b3c34a5fbdec24cfba1","ref":"refs/heads/main","pushedAt":"2023-05-04T08:47:43.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Specify the tokenizer for the llama model","shortMessageHtmlLink":"Specify the tokenizer for the llama model"}},{"before":"a7249f9f808de77ca0e6ef19a30fa2f408943478","after":"484699f729c8b72f7d0d1eb18885bd5c7fcaa6fe","ref":"refs/heads/main","pushedAt":"2023-05-04T07:27:20.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Specify the tokenizer for the llama model","shortMessageHtmlLink":"Specify the tokenizer for the llama model"}},{"before":"e72bc50fe2eaec35177e1caffe10d457644125cc","after":"a7249f9f808de77ca0e6ef19a30fa2f408943478","ref":"refs/heads/main","pushedAt":"2023-05-04T07:09:32.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Adapts to trl's official support for supervised finetuning","shortMessageHtmlLink":"Adapts to trl's official support for supervised finetuning"}},{"before":"46fc3a3ef1f6163ce6e9c5e7942eafb6d69492ec","after":"e72bc50fe2eaec35177e1caffe10d457644125cc","ref":"refs/heads/main","pushedAt":"2023-04-28T02:24:42.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Modify `device_map` parameter to support CPU/Single GPU/Multiple GPUs","shortMessageHtmlLink":"Modify device_map parameter to support CPU/Single GPU/Multiple GPUs"}},{"before":"d936fcda2ae1960d9416bdc3da4a1c140d493d76","after":"46fc3a3ef1f6163ce6e9c5e7942eafb6d69492ec","ref":"refs/heads/main","pushedAt":"2023-04-28T02:16:51.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Optimize training parameters (HF TrainingArguments)","shortMessageHtmlLink":"Optimize training parameters (HF TrainingArguments)"}},{"before":"f3ddca825e888d9e67eab076e7b5a6dd8d66ba8e","after":"d936fcda2ae1960d9416bdc3da4a1c140d493d76","ref":"refs/heads/main","pushedAt":"2023-04-28T02:00:37.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Optimize training parameters (HF TrainingArguments)","shortMessageHtmlLink":"Optimize training parameters (HF TrainingArguments)"}},{"before":"2d93f3de9e562076ed5ebbc98e58e1c52bba551d","after":"f3ddca825e888d9e67eab076e7b5a6dd8d66ba8e","ref":"refs/heads/main","pushedAt":"2023-04-27T14:37:10.000Z","pushType":"push","commitsCount":1,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"Optimize training parameters (HF TrainingArguments)","shortMessageHtmlLink":"Optimize training parameters (HF TrainingArguments)"}},{"before":"282499e9204d343a7b0550ec6b03f93f7f19ea98","after":"2d93f3de9e562076ed5ebbc98e58e1c52bba551d","ref":"refs/heads/main","pushedAt":"2023-04-27T09:51:30.000Z","pushType":"push","commitsCount":2,"pusher":{"login":"jasonvanf","name":"Jason Van","path":"/jasonvanf","primaryAvatarUrl":"https://avatars.githubusercontent.com/u/24243477?s=80&v=4"},"commit":{"message":"allows to load a dataset from a local directory or a dataset repository on the Hugging Face Hub","shortMessageHtmlLink":"allows to load a dataset from a local directory or a dataset reposito…"}}],"hasNextPage":true,"hasPreviousPage":false,"activityType":"all","actor":null,"timePeriod":"all","sort":"DESC","perPage":30,"cursor":"djE6ks8AAAADMgrk4gA","startCursor":null,"endCursor":null}},"title":"Activity · jasonvanf/llama-trl"}