% RFC 4313: requirements for a protocol to control distributed speech
% processing (ASR, SI/SV, TTS) resources. Only the acronyms in the title are
% brace-protected, so bibliography styles remain free to recase the other words.
@misc{rfc4313,
  author       = {Oran, David R.},
  title        = {Requirements for Distributed Control of Automatic Speech Recognition ({ASR}), Speaker Identification/Speaker Verification ({SI/SV}), and Text-to-Speech ({TTS}) Resources},
  howpublished = {RFC 4313},
  series       = {Request for Comments},
  number       = {4313},
  publisher    = {RFC Editor},
  year         = {2005},
  month        = dec,
  pagetotal    = {20},
  doi          = {10.17487/RFC4313},
  url          = {https://www.rfc-editor.org/info/rfc4313},
  abstract     = {This document outlines the needs and requirements for a protocol to control distributed speech processing of audio streams. By speech processing, this document specifically means automatic speech recognition (ASR), speaker recognition -- which includes both speaker identification (SI) and speaker verification (SV) -- and text-to-speech (TTS). Other IETF protocols, such as SIP and Real Time Streaming Protocol (RTSP), address rendezvous and control for generalized media streams. However, speech processing presents additional requirements that none of the extant IETF protocols address. This memo provides information for the Internet community.},
}