You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
default=False, help="Use Whisper instead of Wav2Vec for English (defaults for Whisper for non-English)")
110
112
@click.option("--pauses", type=bool, default=False, help="Should we try to bullet each word or should we try to add pauses in between words by grouping them? Default: no pauses.", is_flag=True)
# check that the document has a media path to align to
28
28
assert doc.media != None and doc.media.url != None, f"We cannot forced-align something that doesn't have a media path! Provided media tier='{doc.media}'"
29
29
30
+
if doc.langs[0] != "eng":
31
+
warnings.warn("Looks like you are not aligning English with wav2vec; this works for a lot of Roman languages, but outside of that your milage may vary.")
32
+
30
33
# load the audio file
31
34
L.debug(f"Wave2Vec FA is loading url {doc.media.url}...")
32
35
f=self.__wav2vec.load(doc.media.url)
33
-
L.debug(f"Wave2Vec FA finished loading media.")
36
+
L.debug(f"Wav2Vec FA finished loading media.")
34
37
35
38
# collect utterances into roughly 30-second segments to be aligned for whisper
36
39
# we have to do this because whisper does poorly with very short segments
0 commit comments