FQiao's picture
Upload 70 files
3324de2 verified
raw
history blame contribute delete
684 Bytes
# Absolute paths for different resources
paths:
train_file: "data/train.json"
val_file: "data/val.json"
test_file: "data/val.json"
resume_from_checkpoint: ""
output_dir: "outputs/"
# Training-related parameters
training:
per_device_batch_size: 4
learning_rate: 5e-4
gradient_accumulation_steps: 1
num_train_epochs: 80
num_warmup_steps: 1000
max_audio_duration: 30
# Model and optimizer parameters,
model:
num_layers: 6
num_single_layers: 18
in_channels: 64
attention_head_dim: 128
joint_attention_dim: 1024
num_attention_heads: 8
audio_seq_len: 645
max_duration: 30
uncondition: false
text_encoder_name: "google/flan-t5-large"