{ "max_single_segment_time": 20000, "threshold": 0.7, "min_duration": 500, "speech_pad": 300 }