# File: DS-LLM-TEMPLATE-FINETUNING/configs/completion/text_generation.yaml
# Viewer metadata: 30 lines, 468 B, YAML
# Timestamp shown by the repository viewer: 2025-08-06 22:45:37 +01:00
---
# Fine-tuning configuration for the "completion" task (text generation).
# Settings are grouped by section. `name`, `max_length` and `batch_size`
# each appear in more than one section, so the nesting is required to keep
# them distinct (un-nested they would be duplicate keys).

task:
  name: "completion"
  type: "text_generation"

data:
  source: "huggingface"
  # NOTE(review): on the Hugging Face Hub "wikitext-2-raw-v1" is a config of
  # the "wikitext" dataset - confirm the loader resolves this name.
  dataset_name: "wikitext-2-raw-v1"
  input_field: "text"
  max_length: 512  # same value as model.max_length
  # Split fractions; the three values sum to 1.0.
  train_split: 0.8
  validation_split: 0.1
  test_split: 0.1

model:
  name: "gpt2"
  max_length: 512  # same value as data.max_length

training:
  num_epochs: 3
  batch_size: 8
  # Written with a decimal point on purpose: YAML 1.1 loaders such as PyYAML
  # read a bare `5e-5` as the string "5e-5" rather than a float.
  learning_rate: 5.0e-5
  weight_decay: 0.01
  warmup_ratio: 0.1
  lr_scheduler_type: "linear"

inference:
  batch_size: 16  # separate from training.batch_size (8)
  max_new_tokens: 100
  temperature: 0.7