From 5c130e0c45f52e489cc5be7747f4ce32614b16c6 Mon Sep 17 00:00:00 2001 From: Hamel Husain Date: Mon, 1 Jan 2024 21:15:56 -0800 Subject: [PATCH 1/3] Update README.md --- README.md | 6 +----- 1 file changed, 1 insertion(+), 5 deletions(-) diff --git a/README.md b/README.md index 4dd80339a..ce0174245 100644 --- a/README.md +++ b/README.md @@ -643,7 +643,7 @@ max_memory: # If you want to use 'lora' or 'qlora' or leave blank to train all parameters in original model adapter: lora # If you already have a lora model trained that you want to load, put that here. -# This means after training, if you want to test the model, you should set this to the value of `lora_out_dir`. +# This means after training, if you want to test the model, you should set this to the value of `output_dir`. lora_model_dir: # LoRA hyperparameters @@ -670,10 +670,6 @@ lora_modules_to_save: # - embed_tokens # - lm_head -# Once you complete training, the model will be saved to the following directory. -# If you merge the adapter to the base model, a subdirectory `merged` will be created under this directory. -# Make sure `lora_model_dir` points to this directory if you want to use the trained model. -lora_out_dir: lora_fan_in_fan_out: false # ReLoRA configuration From 57f0f01aa5ab9f613b137e992b59774e6f6812db Mon Sep 17 00:00:00 2001 From: Hamel Husain Date: Mon, 1 Jan 2024 21:21:39 -0800 Subject: [PATCH 2/3] Update README.md --- README.md | 1 + 1 file changed, 1 insertion(+) diff --git a/README.md b/README.md index ce0174245..0b9499343 100644 --- a/README.md +++ b/README.md @@ -644,6 +644,7 @@ max_memory: adapter: lora # If you already have a lora model trained that you want to load, put that here. # This means after training, if you want to test the model, you should set this to the value of `output_dir`. +# Note that if you merge an adapter to the base model, a new subdirectory `merged` will be created under the original directory, which you will want to use instead. lora_model_dir: # LoRA hyperparameters From 0e1bd13057577a61a516f7bcd8a04ea3dfb20dfb Mon Sep 17 00:00:00 2001 From: Hamel Husain Date: Mon, 1 Jan 2024 22:51:17 -0800 Subject: [PATCH 3/3] Update README.md Co-authored-by: NanoCode012 --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 0b9499343..21653d027 100644 --- a/README.md +++ b/README.md @@ -644,7 +644,7 @@ max_memory: adapter: lora # If you already have a lora model trained that you want to load, put that here. # This means after training, if you want to test the model, you should set this to the value of `output_dir`. -# Note that if you merge an adapter to the base model, a new subdirectory `merged` will be created under the original directory, which you will want to use instead. +# Note that if you merge an adapter to the base model, a new subdirectory `merged` will be created under the `output_dir`. lora_model_dir: # LoRA hyperparameters