diff --git a/src/finetuning/config/model_loading_params.yaml b/src/finetuning/config/model_loading_params.yaml
new file mode 100644
index 0000000..5dde489
--- /dev/null
+++ b/src/finetuning/config/model_loading_params.yaml
@@ -0,0 +1,4 @@
+model_loading_params:
+  max_seq_length: 2048
+  dtype: null  # Auto detection of dtype
+  load_in_4bit: true  # Reduce memory usage with 4-bit quantization