"""Transcribe a test WAV file with pywhispercpp and print timestamped segments.

The script reads the audio with ``soundfile``, runs it through a whisper.cpp
model configured from the local ``config`` module, and prints one line per
returned segment: start timestamp, end timestamp, text.
"""
import warnings

from pywhispercpp.model import Model
import config
import soundfile
from pywhispercpp.utils import to_timestamp

# Audio file transcribed by this script.
AUDIO_PATH = "test/6_before_cut_56640.wav"

# whisper.cpp interprets its input as 16 kHz mono samples (WHISPER_SAMPLE_RATE).
EXPECTED_SAMPLE_RATE = 16000


def main():
    """Load the test audio, transcribe it, and print each segment."""
    samples, sample_rate = soundfile.read(AUDIO_PATH)

    # The samples are handed to the model as-is, with no resampling or
    # down-mixing here, so flag input that does not match what whisper.cpp
    # expects instead of silently producing a skewed transcription.
    if sample_rate != EXPECTED_SAMPLE_RATE or samples.ndim != 1:
        warnings.warn(
            f"{AUDIO_PATH}: got sample rate {sample_rate} Hz and shape "
            f"{samples.shape}; whisper.cpp expects {EXPECTED_SAMPLE_RATE} Hz "
            "mono audio, so the transcription and timestamps may be wrong."
        )

    models_dir = config.MODEL_DIR.as_posix()
    model = Model(
        model=config.WHISPER_MODEL,
        models_dir=models_dir,
        n_threads=4,
        print_realtime=False,
        print_progress=False,
        print_timestamps=False,
        translate=False,
        temperature=0.0,
        no_context=True,
    )

    # Debug aid: show what is actually being fed to the model.
    print(samples.shape, samples.dtype)

    # NOTE(review): token_timestamps + max_len=1 presumably requests the
    # finest-grained segmentation whisper.cpp offers — confirm against the
    # whisper.cpp parameter documentation.
    segments = model.transcribe(
        samples,
        language="en",
        token_timestamps=True,
        max_len=1,
    )

    for segment in segments:
        print(to_timestamp(segment.t0), to_timestamp(segment.t1), segment.text)


if __name__ == "__main__":
    main()