Ar4ikov committed on
Commit
6b4e503
1 Parent(s): 7b02c92

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -1
app.py CHANGED
@@ -9,6 +9,7 @@ import torchaudio
9
  from transformers import AutoConfig, AutoModel, Wav2Vec2FeatureExtractor
10
  import librosa
11
  import numpy as np
 
12
 
13
 
14
  def speech_file_to_array_fn(path, sampling_rate):
@@ -42,7 +43,9 @@ model.to(device)
42
 
43
 
44
  def transcribe(audio):
45
- return predict(audio, 16000)
 
 
46
 
47
 
48
  def get_asr_interface():
 
9
  from transformers import AutoConfig, AutoModel, Wav2Vec2FeatureExtractor
10
  import librosa
11
  import numpy as np
12
+ import subprocess
13
 
14
 
15
  def speech_file_to_array_fn(path, sampling_rate):
 
43
 
44
 
45
  def transcribe(audio):
46
+ command = f"sox -t wav {audio} -r 16000 -b 16 c_{audio} channels 1"
47
+ subprocess.call(command, shell=False)
48
+ return predict(f"c_{audio}", 16000)
49
 
50
 
51
  def get_asr_interface():