diff --git a/users/zeyer/experiments/exp2024_04_23_baselines/ctc_recog_ext.py b/users/zeyer/experiments/exp2024_04_23_baselines/ctc_recog_ext.py index b9b1f351b..0f6804d6d 100644 --- a/users/zeyer/experiments/exp2024_04_23_baselines/ctc_recog_ext.py +++ b/users/zeyer/experiments/exp2024_04_23_baselines/ctc_recog_ext.py @@ -129,6 +129,29 @@ def py(): "lm_state_lru_initial_cache_size": 2**16, }, ), + ( + "beam4-beamToken16-cache1024", + { + "n_best": 16, + "beam_size": 4, + "beam_size_token": 16, + "beam_threshold": 14, + "batch_size": 5_000 * ctc_model.definition.batch_size_factor, + "torch_amp": {"dtype": "bfloat16"}, + "lm_state_lru_initial_cache_size": 1024, + }, + ), + ( + "beam4-beamToken16-cache1024-f32", + { + "n_best": 16, + "beam_size": 4, + "beam_size_token": 16, + "beam_threshold": 14, + "batch_size": 5_000 * ctc_model.definition.batch_size_factor, + "lm_state_lru_initial_cache_size": 1024, + }, + ), ]: res = recog_model( task=task,