Skip to content

Commit

Permalink
Update LLM trainer defaults (#3840)
Browse files Browse the repository at this point in the history
  • Loading branch information
arnavgarg1 authored Dec 18, 2023
1 parent 52f124f commit aa17e08
Showing 1 changed file with 4 additions and 4 deletions.
8 changes: 4 additions & 4 deletions ludwig/schema/trainer.py
Original file line number Diff line number Diff line change
Expand Up @@ -815,7 +815,7 @@ class LLMTrainerConfig(BaseTrainerConfig):
"""Base class for all LLM trainer configs."""

learning_rate: Union[float, str] = schema_utils.OneOfOptionsField(
-default=0.0001
+default=0.0002
allow_none=False,
description=(
"Controls how much to change the model in response to the estimated error each time the model weights are "
Expand All @@ -830,7 +830,7 @@ class LLMTrainerConfig(BaseTrainerConfig):
)

batch_size: int = schema_utils.PositiveInteger(
-default=2,
+default=1,
description="Batch size used for training in the LLM trainer.",
)

Expand All @@ -845,7 +845,7 @@ class LLMTrainerConfig(BaseTrainerConfig):
)

epochs: int = schema_utils.PositiveInteger(
-default=1,
+default=3,
description="Number of epochs to train in the LLM trainer.",
)

Expand Down Expand Up @@ -881,7 +881,7 @@ class LLMTrainerConfig(BaseTrainerConfig):
)

eval_batch_size: int = schema_utils.PositiveInteger(
-default=1,
+default=2,
description="Batch size used for evaluation in the LLM trainer.",
)

Expand Down

0 comments on commit aa17e08

Please sign in to comment.