Fork of https://github.com/alokprasad/fastspeech_squeezewave to also fix denoising in squeezewave
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

52 lines
953 B

  1. from text import symbols
  2. # Text
  3. text_cleaners = ['english_cleaners']
  4. # Mel
  5. n_mel_channels = 80
  6. num_mels = 80
  7. # FastSpeech
  8. vocab_size = 1024
  9. N = 6
  10. Head = 2
  11. d_model = 384
  12. duration_predictor_filter_size = 256
  13. duration_predictor_kernel_size = 3
  14. dropout = 0.1
  15. word_vec_dim = 384
  16. encoder_n_layer = 6
  17. encoder_head = 2
  18. encoder_conv1d_filter_size = 1536
  19. max_sep_len = 2048
  20. encoder_output_size = 384
  21. decoder_n_layer = 6
  22. decoder_head = 2
  23. decoder_conv1d_filter_size = 1536
  24. decoder_output_size = 384
  25. fft_conv1d_kernel = 3
  26. fft_conv1d_padding = 1
  27. duration_predictor_filter_size = 256
  28. duration_predictor_kernel_size = 3
  29. dropout = 0.1
  30. # Train
  31. alignment_path = "./alignments"
  32. checkpoint_path = "./model_new"
  33. logger_path = "./logger"
  34. mel_ground_truth = "./mels"
  35. batch_size = 64
  36. epochs = 1000
  37. n_warm_up_step = 4000
  38. learning_rate = 1e-3
  39. weight_decay = 1e-6
  40. grad_clip_thresh = 1.0
  41. decay_step = [500000, 1000000, 2000000]
  42. save_step = 1000
  43. log_step = 5
  44. clear_Time = 20