faster_whisper_stt_arguments.py 2.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960
  1. from dataclasses import dataclass, field
  2. @dataclass
  3. class FasterWhisperSTTHandlerArguments:
  4. faster_whisper_stt_model_name: str = field(
  5. default="tiny.en",
  6. metadata={
  7. "help": """The pretrained Faster Whisper model to use.
  8. One of ('tiny', 'tiny.en', 'base', 'base.en', 'small', 'small.en', 'distil-small.en', 'medium', 'medium.en', 'distil-medium.en', 'large-v1', 'large-v2', 'large-v3', 'large', 'distil-large-v2', 'distil-large-v3').
  9. Default is 'small'."""
  10. },
  11. )
  12. faster_whisper_stt_device: str = field(
  13. default="auto",
  14. metadata={
  15. "help": """The device type on which the model will run.
  16. One of ('cpu', 'cuda', 'auto').
  17. Default is 'auto'."""
  18. },
  19. )
  20. faster_whisper_stt_compute_type: str = field(
  21. default="auto",
  22. metadata={
  23. "help": """The data type to use for computation.
  24. One of ('default', 'auto', 'int8', 'int8_float32', 'int8_float16', 'int8_bfloat16', 'int16', 'float16', 'float32', 'bfloat16')
  25. Default is 'auto'.
  26. Refer to 'https://opennmt.net/CTranslate2/quantization.html#quantize-on-model-loading'"""
  27. },
  28. )
  29. faster_whisper_stt_gen_max_new_tokens: int = field(
  30. default=128,
  31. metadata={
  32. "help": "The maximum number of new tokens to generate. Default is 128."
  33. },
  34. )
  35. faster_whisper_stt_gen_beam_size: int = field(
  36. default=1,
  37. metadata={
  38. "help": "The number of beams for beam search. Default is 1, implying greedy decoding."
  39. },
  40. )
  41. faster_whisper_stt_gen_return_timestamps: bool = field(
  42. default=False,
  43. metadata={
  44. "help": "Whether to return timestamps with transcriptions. Default is False."
  45. },
  46. )
  47. faster_whisper_stt_gen_task: str = field(
  48. default="transcribe",
  49. metadata={
  50. "help": "The task to perform, typically 'transcribe' for transcription. Default is 'transcribe'."
  51. },
  52. )
  53. faster_whisper_stt_gen_language: str = field(
  54. default="en",
  55. metadata={
  56. "help": "The language of the speech to transcribe. Default is 'en' for English."
  57. },
  58. )