Skip to content

Commit

Permalink
Update default config to ultravox_v0.3 (#84)
Browse files Browse the repository at this point in the history
Add a release configuration to train `ultravox-v0_3` (https://huggingface.co/fixie-ai/ultravox-v0_3).
To start training, follow the setup instructions in README.md and then run `mcli run -f mcloud.yaml --follow`.
  • Loading branch information
zqhuang211 authored Aug 16, 2024
1 parent af8b459 commit b4a4fc5
Show file tree
Hide file tree
Showing 3 changed files with 47 additions and 2 deletions.
2 changes: 1 addition & 1 deletion mcloud.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -14,4 +14,4 @@ command: >-
env_variables:
MLFLOW_TRACKING_URI: databricks
UV_BRANCH: main
TRAIN_ARGS: --config_path ultravox/training/configs/llama3_whisper_kd.yaml
TRAIN_ARGS: --config_path ultravox/training/configs/release_config.yaml
2 changes: 1 addition & 1 deletion ultravox/training/configs/meta_config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@ audio_model: "facebook/wav2vec2-base-960h"

data_sets: ["gigaspeech"]
val_sets: ["heysquad_human", "anyinstruct", "soda", "peoplespeech"]
stop_strategy: "last_exhausted"
stop_strategy: "LAST_EXHAUSTED"

train_on_inputs: False
shuffle_data: True
Expand Down
45 changes: 45 additions & 0 deletions ultravox/training/configs/release_config.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,45 @@
# Release configuration for training ultravox-v0_3: an SLM built with ultravox
# and llama3.1, trained with knowledge distillation.
exp_name: "ultravox-v0_3"

# Make sure to accept the license agreement on the Hugging Face Hub.
text_model: "meta-llama/Meta-Llama-3.1-8B-Instruct"
audio_model: "openai/whisper-small"

loss_config:
  # Choose from ["KL_Divergence", "CrossEntropy"]; default is "KL_Divergence".
  loss_function: "KL_Divergence"

# Temporarily remove heysquad_human from val_sets as it causes the training
# to fail.
val_sets: ["anyinstruct", "soda", "peoplespeech"]

batch_size: 24
max_steps: 7200  # x8x24 = 1,382,400 samples

# data_sets is left empty; the training data is listed under data_dicts.
data_sets: []
data_dicts:
  # LibriSpeech "clean" subset.
  - path: "fixie-ai/librispeech_asr"
    name: "clean"
    splits:
      - "train.100"  # 28_539 samples
      - "train.360"  # 104_014 samples
    user_template: "Continue the following text using less than 50 words:\n\n<|audio|>"
    assistant_template: "{{ continuation }}"
    transcript_template: "{{ text }}"
    weight: 1
  # LibriSpeech "other" subset.
  - path: "fixie-ai/librispeech_asr"
    name: "other"
    splits:
      - "train.500"  # 148_688 samples
    user_template: "Continue the following text using less than 50 words:\n\n<|audio|>"
    assistant_template: "{{ continuation }}"
    transcript_template: "{{ text }}"
    weight: 1
  # Common Voice 17.0, English. The transcript is read from the `sentence`
  # field and passed through text_proc.format_asr_text.
  - path: "fixie-ai/common_voice_17_0"
    name: "en"
    splits:
      - "train"  # 1_101_170 samples
    user_template: "Continue the following text using less than 50 words:\n\n<|audio|>"
    assistant_template: "{{ continuation }}"
    transcript_template: "{{ text_proc.format_asr_text(sentence) }}"
    # NOTE(review): presumably a relative sampling weight versus the
    # LibriSpeech entries (weight 1) -- confirm against the data loader.
    weight: 8

0 comments on commit b4a4fc5

Please sign in to comment.