---
# Curriculum learning configuration
#
# Flat top-level settings grouped by the section comments below. Only
# `split_ratios` and `reward_weights` are nested mappings.

# Model settings
model_name: "facebook/wav2vec2-base"
device: "cuda"
# Explicit null: no checkpoint is configured here.
# NOTE(review): presumably a path to resume from -- confirm against the loader.
checkpoint: null

# Data settings
data_path: "data/raw"
# The three ratios sum to 1.0.
split_ratios:
  train: 0.7
  val: 0.15
  test: 0.15

# RL algorithm settings
algorithm: "ppo"
learning_rate: 0.0003
gamma: 0.99

# Reward function settings
# The three weights sum to 1.0.
reward_weights:
  clarity: 0.33
  naturalness: 0.33
  accuracy: 0.34

# Curriculum learning settings
use_curriculum: true
difficulty_levels: 5
# NOTE(review): presumably the scores that trigger moving up / down a
# difficulty level -- confirm the comparison and metric in the consumer.
advancement_threshold: 0.8
regression_threshold: 0.5

# Training settings
num_episodes: 1000
batch_size: 32
# NOTE(review): unit (steps per episode?) is not stated here -- confirm.
episode_length: 15

# Checkpointing
# NOTE(review): interval unit (episodes?) is not stated here -- confirm.
checkpoint_interval: 100
checkpoint_dir: "checkpoints"
max_checkpoints: 10

# Logging and monitoring
log_interval: 20
log_dir: "logs"

# Reproducibility
random_seed: 42