1# The ID of the speaker who is uttering the text.
2# If the speaker is the system, the ID is SPEAKER_ID_SYSTEM.
3# An empty speaker_id is equivalent to setting it to SPEAKER_ID_UNKNOWN.
4string speaker_id
5
6string SPEAKER_ID_SYSTEM = "__system__"
7string SPEAKER_ID_UNKNOWN = "__unknown__"
8
9# The text that is being spoken.
10string text
11
12# The locale of the caption, using the following format:
13# the [ISO 639-1 language code](https://en.wikipedia.org/wiki/List_of_ISO_639-1_codes),
14# in lower case, followed by an underscore,
15# followed by the [ISO 3166-1 alpha-2 region code](https://en.wikipedia.org/wiki/ISO_3166-1_alpha-2),
16# in upper case.
17#
18# For example, 'en_GB' specifies British English.
19string locale