speechbrain
/

m-ctc-t-large

Automatic Speech Recognition

Inference Endpoints

Model card Files Files and versions Community

patrickvonplaten committed on May 27, 2022

Commit

2fd6ccd

·

1 Parent(s): 426e0f2

Update README.md

Files changed (1) hide show

README.md +4 -3

README.md CHANGED Viewed

@@ -56,11 +56,12 @@ processor = MCTCTProcessor.from_pretrained("speechbrain/mctct-large")
  # load dummy dataset and read soundfiles
 ds = load_dataset("patrickvonplaten/librispeech_asr_dummy", "clean", split="validation")
-# tokenize
-input_features = processor(ds[0]["audio"]["array"], return_tensors="pt").input_features
 # retrieve logits
-logits = model(input_features).logits
 # take argmax and decode
 predicted_ids = torch.argmax(logits, dim=-1)

  # load dummy dataset and read soundfiles
 ds = load_dataset("patrickvonplaten/librispeech_asr_dummy", "clean", split="validation")
+# feature extraction
+input_features = processor(ds[0]["audio"]["array"], sampling_rate=ds[0]["audio"]["sampling_rate"], return_tensors="pt").input_features
 # retrieve logits
+with torch.no_grad():
+    logits = model(input_features).logits
 # take argmax and decode
 predicted_ids = torch.argmax(logits, dim=-1)