diff --git a/custom_components/requirements-dev.txt b/custom_components/requirements-dev.txt new file mode 100644 index 0000000..e2fc874 --- /dev/null +++ b/custom_components/requirements-dev.txt @@ -0,0 +1,9 @@ +# types from Home Assistant +homeassistant>=2024.6.1 +hassil +home-assistant-intents + +# testing requirements +pytest +pytest-asyncio +pytest-homeassistant-custom-component diff --git a/custom_components/requirements.txt b/custom_components/requirements.txt new file mode 100644 index 0000000..c902bbc --- /dev/null +++ b/custom_components/requirements.txt @@ -0,0 +1,2 @@ +huggingface-hub>=0.23.0 +webcolors>=24.8.0 diff --git a/data/requirements.txt b/data/requirements.txt new file mode 100644 index 0000000..876e171 --- /dev/null +++ b/data/requirements.txt @@ -0,0 +1,6 @@ +datasets>=3.2.0 +webcolors>=1.13 +pandas>=2.2.3 +deep-translator>=1.11.4 +langcodes>=3.5.0 +babel==2.15.0 \ No newline at end of file diff --git a/docs/Training.md b/docs/Training.md index c70cb04..fc51478 100644 --- a/docs/Training.md +++ b/docs/Training.md @@ -230,6 +230,22 @@ python3 train.py \ --save_steps 50 --save_total_limit 10 --eval_steps 100 --logging_steps 2 ``` +#### Llama 3.2 3B Instruct +``` +python3 generate_home_assistant_data.py --train --test --large --sharegpt --language english german french spanish + +python3 train.py \ + --run_name Home-Llama-3.2-3B-rev1 \ + --base_model meta-llama/Llama-3.2-3B-Instruct \ + --bf16 \ + --train_dataset data/home_assistant_train.jsonl \ + --test_dataset data/home_assistant_test.jsonl \ + --learning_rate 1e-5 --learning_rate_warmup 0.03 --batch_size 64 --epochs 1 \ + --micro_batch_size 2 \ + --ctx_size 2048 \ + --save_steps 200 --save_total_limit 3 --eval_steps 100 --logging_steps 2 +``` + ### Problems Training a model is not an easy thing. Therefore, we are not able to cover all the problems encountered during training. Here we will try to add known problems and solutions on how to deal with them. diff --git a/requirements.txt b/requirements.txt index db89333..e08a97f 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,28 +1,13 @@ -# training + dataset requirements -transformers -tensorboard -datasets -peft -bitsandbytes -trl -webcolors -pandas +transformers>=4.48.3 +tensorboard>=2.18.0 +datasets>=3.2.0 +peft>=0.14.0 +bitsandbytes>=0.45.2 +trl>=0.14.0 +webcolors>=1.13 +pandas>=2.2.3 # flash-attn -sentencepiece -deep-translator -langcodes -babel==2.15.0 - -# integration requirements -huggingface-hub>=0.23.0 -webcolors>=24.8.0 - -# types from Home Assistant -homeassistant>=2024.6.1 -hassil -home-assistant-intents - -# testing requirements -pytest -pytest-asyncio -pytest-homeassistant-custom-component +sentencepiece>=0.2.0 +deep-translator>=1.11.4 +langcodes>=3.5.0 +babel>=2.15.0