|
19 | 19 | speaker: "speaker1" | "speaker2"; |
20 | 20 | content: string; |
21 | 21 | type: "narrative" | "reaction" | "question"; |
22 | | - blank_duration?: number; // Time in seconds (0.1, 0.2, 0.3, or 0.5) for silence after speaking |
| 22 | + blank_duration?: number; // Time in seconds (0.1, 0.2, or 0.5) for silence after speaking |
23 | 23 | }>; |
24 | 24 | } |
25 | 25 | ]]> |
|
33 | 33 | Supporting role. Asks questions, reacts to speaker1's statements and helps clarify points. |
34 | 34 | </speaker2> |
35 | 35 | </speaker-roles> |
36 | | - <guidelines> |
37 | | - - Follow the PlannerAgent's instructions for each section. |
38 | | - - Use colloquial language and occasional filler words for natural dialogue. |
39 | | - - Start each section with a natural transition from the previous one. |
40 | | - - Don't say "let's start" or "let's continue". Avoid saying things like "On the next section, we |
41 | | - will..." |
42 | | - - Avoid formal introductions or conclusions for sections/segments. |
43 | | - - Allow speakers to ask and answer questions naturally. |
44 | | - - Create ${min_segments}-${max_segments} segments per section, with a mix of short and long segments. |
45 | | - - Include some very short segments (1-2 words) for quick interactions and expressing emotions or |
46 | | - reactions. For example: "Yeah.", "Right?", "So cool." |
47 | | - - Use pauses (blank_duration) where appropriate. |
48 | | - - Don't use emojis in the script. |
49 | | - - Don't add any metadata about emotions or laughter in the script. |
50 | | - </guidelines> |
| 36 | + <instructions> |
| 37 | + <instruction>Follow the PlannerAgent's instructions for each section.</instruction> |
| 38 | + <instruction>Use colloquial language and occasional filler words for natural dialogue.</instruction> |
| 39 | + <instruction>Start each section with a natural transition from the previous one.</instruction> |
| 40 | + <instruction>Don't say "let's start" or "let's continue". Avoid saying things like "On the next |
| 41 | + section, we will..."</instruction> |
| 42 | + <instruction>Avoid formal introductions or conclusions for sections/segments.</instruction> |
| 43 | + <instruction>Allow speakers to ask and answer questions naturally.</instruction> |
| 44 | + <instruction>Create ${min_segments}-${max_segments} segments per section, with a mix of short |
| 45 | + and |
| 46 | + long segments.</instruction> |
| 47 | + <instruction>Include some very short segments (1-2 words) for quick interactions and expressing |
| 48 | + emotions or reactions. For example: "Yeah.", "Right?", "So cool."</instruction> |
| 49 | + <instruction>Use pauses (blank_duration) where appropriate.</instruction> |
| 50 | + <instruction>Introduce the topics slowly; don't talk about the last topic in the introductions.</instruction> |
| 51 | + <instruction>Don't use emojis in the script.</instruction> |
| 52 | + <instruction>Don't add any metadata about emotions or laughter in the script.</instruction> |
| 53 | + </instructions> |
51 | 54 | <conversation-example> |
52 | 55 | <![CDATA[ |
53 | 56 | { |
|
64 | 67 | "speaker": "speaker2", |
65 | 68 | "content": "Hold on tight, because...", |
66 | 69 | "type": "reaction", |
67 | | - "blank_duration": 0.3 |
| 70 | + "blank_duration": 0.2 |
68 | 71 | }, |
69 | 72 | { |
70 | 73 | "speaker": "speaker1", |
|
76 | 79 | "speaker": "speaker2", |
77 | 80 | "content": "That's right.", |
78 | 81 | "type": "reaction", |
79 | | - "blank_duration": 0.3 |
| 82 | + "blank_duration": 0.2 |
80 | 83 | }, |
81 | 84 | { |
82 | 85 | "speaker": "speaker1", |
83 | 86 | "content": "And it's awesome. There are a lot of cheating accusations, so this is going to be fun.", |
84 | 87 | "type": "narrative", |
85 | | - "blank_duration": 0.3 |
| 88 | + "blank_duration": 0.2 |
86 | 89 | }, |
87 | 90 | { |
88 | 91 | "speaker": "speaker2", |
89 | 92 | "content": "It always is, isn't it?", |
90 | 93 | "type": "question", |
91 | | - "blank_duration": 0.3 |
| 94 | + "blank_duration": 0.2 |
92 | 95 | }, |
93 | 96 | { |
94 | 97 | "speaker": "speaker1", |
|
112 | 115 | "speaker": "speaker2", |
113 | 116 | "content": "Exactly, it's part of the fun. We're trying to figure out what's going on in real-time.", |
114 | 117 | "type": "narrative", |
115 | | - "blank_duration": 0.3 |
| 118 | + "blank_duration": 0.2 |
116 | 119 | }, |
117 | 120 | { |
118 | 121 | "speaker": "speaker1", |
119 | 122 | "content": "So the first line that caught my attention was... It seems to say \"look, they taught it from the CBA\". Well, I'm not sure what all that means, but...", |
120 | 123 | "type": "narrative", |
121 | | - "blank_duration": 0.3 |
| 124 | + "blank_duration": 0.2 |
122 | 125 | }, |
123 | 126 | { |
124 | 127 | "speaker": "speaker2", |
125 | 128 | "content": "Yeah, CBA could be some kind of game or maybe a particular version of the game, a map, or a custom game mode. It gives us a bit more context.", |
126 | 129 | "type": "narrative", |
127 | | - "blank_duration": 0.3 |
| 130 | + "blank_duration": 0.2 |
128 | 131 | }, |
129 | 132 | { |
130 | 133 | "speaker": "speaker1", |
|
136 | 139 | "speaker": "speaker2", |
137 | 140 | "content": "Totally. We need more information to be our guide in this chat.", |
138 | 141 | "type": "narrative", |
139 | | - "blank_duration": 0.3 |
| 142 | + "blank_duration": 0.2 |
140 | 143 | }, |
141 | 144 | { |
142 | 145 | "speaker": "speaker1", |
|
154 | 157 | "speaker": "speaker1", |
155 | 158 | "content": "Yeah.", |
156 | 159 | "type": "reaction", |
157 | | - "blank_duration": 0.3 |
| 160 | + "blank_duration": 0.2 |
158 | 161 | }, |
159 | 162 | { |
160 | 163 | "speaker": "speaker2", |
|
0 commit comments