# Runtime settings, written as one KEY=value assignment per line so that a
# `#` comment can only disable the line it appears on.
DEFAULT_DEVICE_ID=0
MEMORY_FRACTION=0.2
XLA_TARGET=cpu
BATCH_SIZE=3
# NOTE(review): the unit is not stated here — presumably milliseconds; confirm
# against whatever consumes this value.
BATCH_TIMEOUT=3000
CLIENT=host
# Alternative model, currently disabled; swap with the active MODEL line below
# to use it.
# MODEL=openai/whisper-large-v3
MODEL=openai/whisper-tiny
PORT=4000