pitch_utils.py 1.3 KB

12345678910111213141516171819202122232425262728293031323334353637
  1. import numpy as np
  2. import torch
  3. f0_bin = 256
  4. f0_max = 1100.0
  5. f0_min = 50.0
  6. f0_mel_min = 1127 * np.log(1 + f0_min / 700)
  7. f0_mel_max = 1127 * np.log(1 + f0_max / 700)
  8. def coarse_to_f0(coarse):
  9. uv = coarse == 1
  10. f0_mel = (coarse - 1) * (f0_mel_max - f0_mel_min) / (f0_bin - 2) + f0_mel_min
  11. f0 = ((f0_mel / 1127).exp() - 1) * 700
  12. f0[uv] = 0
  13. return f0
  14. def f0_to_coarse(f0):
  15. is_torch = isinstance(f0, torch.Tensor)
  16. f0_mel = 1127 * (1 + f0 / 700).log() if is_torch else 1127 * np.log(1 + f0 / 700)
  17. f0_mel[f0_mel > 0] = (f0_mel[f0_mel > 0] - f0_mel_min) * (f0_bin - 2) / (f0_mel_max - f0_mel_min) + 1
  18. f0_mel[f0_mel <= 1] = 1
  19. f0_mel[f0_mel > f0_bin - 1] = f0_bin - 1
  20. f0_coarse = (f0_mel + 0.5).long() if is_torch else np.rint(f0_mel).astype(np.int_)
  21. assert f0_coarse.max() <= 255 and f0_coarse.min() >= 1, (f0_coarse.max(), f0_coarse.min(), f0.min(), f0.max())
  22. return f0_coarse
  23. def norm_f0(f0, uv, hparams):
  24. is_torch = isinstance(f0, torch.Tensor)
  25. if hparams['pitch_norm'] == 'standard':
  26. f0 = (f0 - hparams['f0_mean']) / hparams['f0_std']
  27. if hparams['pitch_norm'] == 'log':
  28. f0 = torch.log2(f0 + 1e-8) if is_torch else np.log2(f0 + 1e-8)
  29. if uv is not None and hparams['use_uv']:
  30. f0[uv > 0] = 0
  31. return f0