Skip to content
Snippets Groups Projects
Commit cbce455c authored by Solene Tarride
Browse files

Improve documentation

parent cc906400
No related branches found
No related tags found
No related merge requests found
......@@ -503,10 +503,9 @@ class CTCLanguageDecoder:
nbest=1,
)
self.temperature = temperature
self.tokens_to_idx = read_txt(tokens_path).split("\n")
self.ctc_id = self.tokens_to_idx.index(blank_token)
self.space_token = sil_token
self.tokens_to_idx = read_txt(tokens_path).split("\n")
self.blank_id = self.tokens_to_idx.index(blank_token)
def add_ctc_frames(self, batch_features):
"""
......@@ -514,16 +513,19 @@ class CTCLanguageDecoder:
"""
batch_size, n_frames, n_tokens = batch_features.shape
# column with 1 probability on CTC token
# Create tensor with high probability CTC token
high_prob = 0.99
low_prob = 0.01
ctc_probs = (
torch.ones((batch_size, 1, n_tokens), dtype=torch.float32)
* 0.01
* low_prob
/ (n_tokens - 1)
)
ctc_probs[:, :, self.ctc_id] = 0.99
ctc_probs[:, :, self.blank_id] = high_prob
ctc_probs = ctc_probs.log()
for i in range(n_frames - 1):
# Insert CTC tensor between frames
for i in range(n_frames):
batch_features = torch.cat(
[
batch_features[:, : 2 * i + 1, :],
......
0% Loading. Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment