# Source: CompanionGuard-RL/code/configs/data_generation.yaml

# Settings for data generation, annotation, and dataset splitting.
# NOTE(review): the nesting below was reconstructed from key grouping; in the
# flat form `output_file` and `delay` were duplicated within one mapping.
# Confirm the layout against the code that loads this file.

# API backend and model name.
api:
  type: "qwen"  # "qwen" or "openai"
  model: "qwen-max"

# Sample-generation parameters.
generation:
  total_samples: 3000
  safe_ratio: 0.25  # 25% safe (y_risk=0) samples
  delay: 0.5  # seconds between API calls
  max_retries: 3  # retry attempts per failed generation

# Output locations (presumably relative to the working directory; confirm).
output:
  raw_dir: "data/raw"
  output_file: "data/raw/generated.jsonl"

# Annotation parameters.
annotation:
  judge_model: "qwen-max"
  output_file: "data/processed/annotated.jsonl"
  delay: 0.3  # presumably seconds between calls, like generation.delay

# Train/validation/test fractions; the three values sum to 1.0.
split:
  train: 0.8
  val: 0.1
  test: 0.1

# NOTE(review): presumably a random seed; kept top-level rather than under
# `split` -- confirm against the consumer.
seed: 42