from seekrai.types.finetune import FineTuneType
from seekrai.types import TrainingConfig, InfrastructureConfig
from seekrai import SeekrFlow
client = SeekrFlow()
training_config = TrainingConfig(
training_files=["<your-preference-fine-tuning-file-id>"],
model="meta-llama/Llama-3.2-1B",
n_epochs=1,
n_checkpoints=1,
batch_size=8,
learning_rate=1e-5,
experiment_name="dpo-fine-tune-job",
fine_tune_type=FineTuneType.PREFERENCE,
beta=0.5,
)
infrastructure_config = InfrastructureConfig(
accel_type="MI300X",
n_accel=8,
)
fine_tune = client.fine_tuning.create(
training_config=training_config,
infrastructure_config=infrastructure_config,
project_id=123,
)
print(fine_tune.id)