|
| | accuracy | bits | clip | dataset | method | model | params | peak_mem_alloc_mb | peak_mem_reserv_mb | perplexity | time_ms | wer | |
|
|---:|-----------:|-------:|-------:|:------------|:---------|:--------|:-----------------|--------------------:|---------------------:|-------------:|----------:|-------:| |
|
| 0 | 0 | 4 | 0 | librispeech | comb_18 | wav2vec | rnd_search_t_lin | 534.743 | 1692.4 | 0 | 18.0211 | 1 | |
|
| 1 | 0 | 5 | 0 | librispeech | comb_18 | wav2vec | rnd_search_t_lin | 534.743 | 1692.4 | 0 | 18.0211 | 1 | |
|
| 2 | 0 | 6 | 0 | librispeech | comb_18 | wav2vec | rnd_search_t_lin | 534.743 | 1692.4 | 0 | 18.0211 | 1 | |
|
| 3 | 0 | 7 | 0 | librispeech | comb_18 | wav2vec | rnd_search_t_lin | 534.743 | 1692.4 | 0 | 18.0211 | 1 | |
|
| 4 | 0 | 8 | 0 | librispeech | comb_18 | wav2vec | rnd_search_t_lin | 534.743 | 1692.4 | 0 | 18.0211 | 1 | |
|
| 5 | 0 | 4 | 0 | librispeech | comb_9 | wav2vec | rnd_search_t_lin | 534.743 | 1692.4 | 0 | 21.512 | 1 | |
|
| 6 | 0 | 5 | 0 | librispeech | comb_9 | wav2vec | rnd_search_t_lin | 534.743 | 1692.4 | 0 | 21.512 | 1 | |
|
| 7 | 0 | 6 | 0 | librispeech | comb_9 | wav2vec | rnd_search_t_lin | 534.743 | 1692.4 | 0 | 21.512 | 1 | |
|
| 8 | 0 | 7 | 0 | librispeech | comb_9 | wav2vec | rnd_search_t_lin | 534.743 | 1692.4 | 0 | 21.512 | 1 | |
|
| 9 | 0 | 8 | 0 | librispeech | comb_9 | wav2vec | rnd_search_t_lin | 534.743 | 1692.4 | 0 | 21.512 | 1 | |
|
| 10 | 0 | 4 | 0 | librispeech | comb_11 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 23.967 | 1 | |
|
| 11 | 0 | 5 | 0 | librispeech | comb_11 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 23.967 | 1 | |
|
| 12 | 0 | 6 | 0 | librispeech | comb_11 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 23.967 | 1 | |
|
| 13 | 0 | 4 | 0 | librispeech | comb_3 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 24.5325 | 1 | |
|
| 14 | 0 | 5 | 0 | librispeech | comb_3 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 24.5325 | 1 | |
|
| 15 | 0 | 6 | 0 | librispeech | comb_3 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 24.5325 | 1 | |
|
| 16 | 0 | 7 | 0 | librispeech | comb_3 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 24.5325 | 1 | |
|
| 17 | 0 | 8 | 0 | librispeech | comb_3 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 24.5325 | 1 | |
|
| 18 | 0 | 4 | 0 | librispeech | comb_7 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 24.6512 | 1 | |
|
| 19 | 0 | 5 | 0 | librispeech | comb_7 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 24.6512 | 1 | |
|
| 20 | 0 | 6 | 0 | librispeech | comb_7 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 24.6512 | 1 | |
|
| 21 | 0 | 7 | 0 | librispeech | comb_7 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 24.6512 | 1 | |
|
| 22 | 0 | 8 | 0 | librispeech | comb_7 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 24.6512 | 1 | |
|
| 23 | 0 | 4 | 0 | librispeech | comb_10 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 28.4174 | 1 | |
|
| 24 | 0 | 5 | 0 | librispeech | comb_10 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 28.4174 | 1 | |
|
| 25 | 0 | 6 | 0 | librispeech | comb_10 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 28.4174 | 1 | |
|
| 26 | 0 | 7 | 0 | librispeech | comb_10 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 28.4174 | 1 | |
|
| 27 | 0 | 8 | 0 | librispeech | comb_10 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 28.4174 | 1 | |
|
| 28 | 0 | 4 | 0 | librispeech | comb_0 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 47.0386 | 1 | |
|
| 29 | 0 | 5 | 0 | librispeech | comb_0 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 47.0386 | 1 | |
|
| 30 | 0 | 6 | 0 | librispeech | comb_0 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 47.0386 | 1 | |
|
| 31 | 0 | 7 | 0 | librispeech | comb_0 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 47.0386 | 1 | |
|
| 32 | 0 | 8 | 0 | librispeech | comb_0 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 47.0386 | 1 | |
|
| 33 | 0 | 4 | 0 | librispeech | comb_4 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 72.3838 | 1 | |
|
| 34 | 0 | 5 | 0 | librispeech | comb_4 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 72.3838 | 1 | |
|
| 35 | 0 | 6 | 0 | librispeech | comb_4 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 72.3838 | 1 | |
|
| 36 | 0 | 7 | 0 | librispeech | comb_4 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 72.3838 | 1 | |
|
| 37 | 0 | 8 | 0 | librispeech | comb_4 | wav2vec | rnd_search_t_lin | 535.632 | 1692.4 | 0 | 72.3838 | 1 | |
|
| 38 | 0 | 4 | 0 | librispeech | comb_5 | wav2vec | rnd_search_t_lin | 368.001 | 1700.79 | 0 | 0.0343 | 1 | |
|
| 39 | 0 | 5 | 0 | librispeech | comb_5 | wav2vec | rnd_search_t_lin | 368.001 | 1700.79 | 0 | 0.0343 | 1 | |
|
| 40 | 0 | 6 | 0 | librispeech | comb_5 | wav2vec | rnd_search_t_lin | 368.001 | 1700.79 | 0 | 0.0343 | 1 | |
|
| 41 | 0 | 7 | 0 | librispeech | comb_5 | wav2vec | rnd_search_t_lin | 368.001 | 1700.79 | 0 | 0.0343 | 1 | |
|
| 42 | 0 | 8 | 0 | librispeech | comb_5 | wav2vec | rnd_search_t_lin | 368.001 | 1700.79 | 0 | 0.0343 | 1 | |
|
| 43 | 0 | 4 | 0 | librispeech | comb_15 | wav2vec | rnd_search_t_lin | 368.001 | 1700.79 | 0 | 0.0354 | 1 | |
|
| 44 | 0 | 5 | 0 | librispeech | comb_15 | wav2vec | rnd_search_t_lin | 368.001 | 1700.79 | 0 | 0.0354 | 1 | |
|
| 45 | 0 | 6 | 0 | librispeech | comb_15 | wav2vec | rnd_search_t_lin | 368.001 | 1700.79 | 0 | 0.0354 | 1 | |
|
| 46 | 0 | 7 | 0 | librispeech | comb_15 | wav2vec | rnd_search_t_lin | 368.001 | 1700.79 | 0 | 0.0354 | 1 | |
|
| 47 | 0 | 8 | 0 | librispeech | comb_15 | wav2vec | rnd_search_t_lin | 368.001 | 1700.79 | 0 | 0.0354 | 1 | |
|
| 48 | 0 | 7 | 0 | librispeech | comb_16 | wav2vec | rnd_search_t_lin | 658.018 | 4888.46 | 0 | 19.4757 | 0.024 | |
|
| 49 | 0 | 5 | 0 | librispeech | comb_16 | wav2vec | rnd_search_t_lin | 658.018 | 4888.46 | 0 | 19.8348 | 0.0235 | |
|
| 50 | 0 | 4 | 0 | librispeech | comb_16 | wav2vec | rnd_search_t_lin | 658.018 | 4888.46 | 0 | 20.94 | 0.0262 | |
|
| 51 | 0 | 8 | 0 | librispeech | comb_16 | wav2vec | rnd_search_t_lin | 658.018 | 4888.46 | 0 | 46.4522 | 0.0239 | |
|
| 52 | 0 | 6 | 0 | librispeech | comb_16 | wav2vec | rnd_search_t_lin | 658.018 | 4888.46 | 0 | 71.1464 | 0.0235 | |
|
| 53 | 0 | 8 | 0 | librispeech | ao_woq | wav2vec | fixed | 658.018 | 4890.56 | 0 | 22.0491 | 0.024 | |
|
| 54 | 0 | 6 | 0 | librispeech | woq | wav2vec | fixed | 658.092 | 4890.56 | 0 | 20.8031 | 0.0234 | |
|
| 55 | 0 | 8 | 0 | librispeech | woq | wav2vec | fixed | 658.092 | 4890.56 | 0 | 21.4152 | 0.0239 | |
|
| 56 | 0 | 4 | 0 | librispeech | woq | wav2vec | fixed | 658.092 | 4890.56 | 0 | 21.5442 | 0.0269 | |
|
| 57 | 0 | 7 | 0 | librispeech | woq | wav2vec | fixed | 658.092 | 4890.56 | 0 | 21.6689 | 0.0236 | |
|
| 58 | 0 | 5 | 0 | librispeech | woq | wav2vec | fixed | 658.092 | 4890.56 | 0 | 22.4333 | 0.0237 | |
|
| 59 | 0 | 7 | 0 | librispeech | comb_13 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 26.8275 | 0.0243 | |
|
| 60 | 0 | 5 | 0 | librispeech | comb_13 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 26.8548 | 0.0269 | |
|
| 61 | 0 | 8 | 0 | librispeech | comb_2 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 27.128 | 0.0245 | |
|
| 62 | 0 | 7 | 0 | librispeech | comb_8 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 27.2829 | 0.024 | |
|
| 63 | 0 | 4 | 0 | librispeech | comb_8 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 27.3838 | 0.0255 | |
|
| 64 | 0 | 6 | 0 | librispeech | comb_8 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 27.517 | 0.0235 | |
|
| 65 | 0 | 6 | 0 | librispeech | comb_13 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 27.5689 | 0.0248 | |
|
| 66 | 0 | 8 | 0 | librispeech | comb_8 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 27.6606 | 0.0241 | |
|
| 67 | 0 | 5 | 0 | librispeech | comb_8 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 27.7394 | 0.0233 | |
|
| 68 | 0 | 4 | 0 | librispeech | comb_2 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 28.0362 | 0.0263 | |
|
| 69 | 0 | 7 | 0 | librispeech | comb_2 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 28.0703 | 0.0241 | |
|
| 70 | 0 | 8 | 0 | librispeech | comb_11 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 28.1962 | 0.1471 | |
|
| 71 | 0 | 4 | 0 | librispeech | comb_13 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 28.3553 | 0.0382 | |
|
| 72 | 0 | 5 | 0 | librispeech | comb_2 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 28.4327 | 0.0243 | |
|
| 73 | 0 | 6 | 0 | librispeech | comb_2 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 28.5917 | 0.0247 | |
|
| 74 | 0 | 8 | 0 | librispeech | comb_1 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 29.079 | 0.0239 | |
|
| 75 | 0 | 6 | 0 | librispeech | comb_1 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 29.0882 | 0.0235 | |
|
| 76 | 0 | 7 | 0 | librispeech | comb_1 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 29.2758 | 0.0235 | |
|
| 77 | 0 | 4 | 0 | librispeech | comb_1 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 29.5703 | 0.0251 | |
|
| 78 | 0 | 5 | 0 | librispeech | comb_1 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 29.6607 | 0.0238 | |
|
| 79 | 0 | 5 | 0 | librispeech | comb_6 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 31.6555 | 0.0233 | |
|
| 80 | 0 | 6 | 0 | librispeech | comb_6 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 32.0734 | 0.0242 | |
|
| 81 | 0 | 4 | 0 | librispeech | comb_6 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 32.2841 | 0.0242 | |
|
| 82 | 0 | 8 | 0 | librispeech | comb_6 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 32.3467 | 0.0246 | |
|
| 83 | 0 | 7 | 0 | librispeech | comb_6 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 32.5395 | 0.0244 | |
|
| 84 | 0 | 7 | 0 | librispeech | comb_11 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 100.575 | 0.0268 | |
|
| 85 | 0 | 8 | 0 | librispeech | comb_13 | wav2vec | rnd_search_t_lin | 658.907 | 4890.56 | 0 | 101.573 | 0.0238 | |
|
| 86 | 0 | 32 | 0 | librispeech | base | wav2vec | ---- | 1564.77 | 5620.37 | 0 | 15.8763 | 0.0239 | |