Skip to content

Commit 6af01e4

Browse files
committed
Update config names and descriptions.
1 parent 80584e7 commit 6af01e4

File tree

1 file changed

+6
-6
lines changed

1 file changed

+6
-6
lines changed

fast_llm/data/preparator/gpt_memmap/config.py

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -112,21 +112,21 @@ def _validate(self) -> None:
112112
@config_class
113113
class LossMaskSpansConfig(Config):
114114
masking_column: str = Field(
115-
default=None,
116-
desc="Field containing character spans to mask for loss computation",
117-
hint=FieldHint.optional,
115+
default="",
116+
desc="Field containing (input) character spans for loss masking",
117+
hint=FieldHint.core,
118118
)
119119
loss_masking_spans: str = Field(
120120
default="fast_llm_loss_masking_spans",
121-
desc="Field containing character spans to mask for loss computation",
121+
desc="Column name of field that would contain the masked spans.",
122122
hint=FieldHint.optional,
123123
)
124124
def _validate(self) -> None:
125125
assert isinstance(self.loss_masking_spans, str), "loss_masking_spans col name must be a string."
126126
super()._validate()
127127

128128
@config_class
129-
class FieldCombinePreparatorConfig(Config):
129+
class CombineFieldsConfig(Config):
130130
col_names: typing.List[str] = Field(
131131
default_factory=list,
132132
desc="Fields of the dataset to combine.",
@@ -205,7 +205,7 @@ class GPTMemmapDatasetPreparatorConfig(DatasetPreparatorConfig):
205205
" Does not shuffle samples.",
206206
hint=FieldHint.optional,
207207
)
208-
combine_fields: FieldCombinePreparatorConfig = Field(
208+
combine_fields: CombineFieldsConfig = Field(
209209
default=None,
210210
desc="Combine all files into a single file.",
211211
hint=FieldHint.optional,

0 commit comments

Comments
 (0)