Skip to content

Commit

Permalink
Fix bugs
Browse files Browse the repository at this point in the history
  • Loading branch information
juberti committed Oct 17, 2024
1 parent 9bd8e4b commit e29f0d1
Show file tree
Hide file tree
Showing 3 changed files with 5 additions and 5 deletions.
4 changes: 2 additions & 2 deletions ultravox/data/datasets.py
Original file line number Diff line number Diff line change
Expand Up @@ -401,11 +401,11 @@ def __iter__(self):
actual_length += 1
if actual_length == len(self) + 1:
warnings.warn(
- f"The presumed length {self._length} has been exceeded for split {self._dataset.split}. Make sure to update."
+ f"The presumed length {self._length} has been exceeded for {self._config.name}:{self._args.split}. Make sure to update."
)
if actual_length != len(self):
warnings.warn(
- f"Mismatch between presumed length ({self._length}) and actual length ({actual_length}) for split {self._dataset.split}. Make sure to update."
+ f"Mismatch between presumed length ({self._length}) and actual length ({actual_length}) for {self._config.name}:{self._args.split}. Make sure to update."
)

@abc.abstractmethod
Expand Down
2 changes: 1 addition & 1 deletion ultravox/training/configs/meta_config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@ train_sets:
- name: gigaspeech
val_sets:
- name: gigaspeech
- - weight: 0.1
+ - weight: 0.01
stop_strategy: "LAST_EXHAUSTED"

train_on_inputs: False
Expand Down
4 changes: 2 additions & 2 deletions ultravox/training/configs/release_config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@ loss_config:
train_sets:
- name: librispeech-clean-continuation
- name: librispeech-other-continuation
- - name: peoplespeech-continuation
+ - name: peoplespeech-clean-continuation
weight: 8
- name: common-voice-en-continuation
weight: 8
Expand Down Expand Up @@ -56,7 +56,7 @@ train_sets:
weight: 0.02

# Temporarily remove heysquad_human from val_sets as it causes the training to fail.
- val_sets: ["peoplespeech"]
+ val_sets: ["peoplespeech-clean"]

batch_size: 24
max_steps: 14400 # x8x24 = 2,764,800

0 comments on commit e29f0d1

Please sign in to comment.