Skip to content
Snippets Groups Projects
Commit 7f25f137 authored by Solene Tarride's avatar Solene Tarride
Browse files

Improve documentation

parent e9aa1084
No related branches found
No related tags found
No related merge requests found
......@@ -503,10 +503,9 @@ class CTCLanguageDecoder:
nbest=1,
)
self.temperature = temperature
self.tokens_to_idx = read_txt(tokens_path).split("\n")
self.ctc_id = self.tokens_to_idx.index(blank_token)
self.space_token = sil_token
self.tokens_to_idx = read_txt(tokens_path).split("\n")
self.blank_id = self.tokens_to_idx.index(blank_token)
def add_ctc_frames(self, batch_features):
"""
......@@ -514,16 +513,19 @@ class CTCLanguageDecoder:
"""
batch_size, n_frames, n_tokens = batch_features.shape
# column with 1 probability on CTC token
# Create tensor with high probability CTC token
high_prob = 0.99
low_prob = 0.01
ctc_probs = (
torch.ones((batch_size, 1, n_tokens), dtype=torch.float32)
* 0.01
* low_prob
/ (n_tokens - 1)
)
ctc_probs[:, :, self.ctc_id] = 0.99
ctc_probs[:, :, self.blank_id] = high_prob
ctc_probs = ctc_probs.log()
for i in range(n_frames - 1):
# Insert CTC tensor between frames
for i in range(n_frames):
batch_features = torch.cat(
[
batch_features[:, : 2 * i + 1, :],
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment