|
19 | 19 | speaker: "speaker1" | "speaker2";
|
20 | 20 | content: string;
|
21 | 21 | type: "narrative" | "reaction" | "question";
|
22 |
| - blank_duration?: number; // Time in seconds (0.1, 0.2, 0.3, or 0.5) for silence after speaking |
| 22 | + blank_duration?: number; // Time in seconds (0.1, 0.2, or 0.5) for silence after speaking |
23 | 23 | }>;
|
24 | 24 | }
|
25 | 25 | ]]>
|
|
33 | 33 | Supporting role. Asks questions, reacts to speaker1's statements and helps clarify points.
|
34 | 34 | </speaker2>
|
35 | 35 | </speaker-roles>
|
36 |
| - <guidelines> |
37 |
| - - Follow the PlannerAgent's instructions for each section. |
38 |
| - - Use colloquial language and occasional filler words for natural dialogue. |
39 |
| - - Start each section with a natural transition from the previous one. |
40 |
| - - Don't say "let's start" or "let's continue". Avoid saying things like "On the next section, we |
41 |
| - will..." |
42 |
| - - Avoid formal introductions or conclusions for sections/segments. |
43 |
| - - Allow speakers to ask and answer questions naturally. |
44 |
| - - Create ${min_segments}-${max_segments} segments per section, with a mix of short and long segments. |
45 |
| - - Include some very short segments (1-2 words) for quick interactions and expressing emotions or |
46 |
| - reactions. For example: "Yeah.", "Right?", "So cool." |
47 |
| - - Use pauses (blank_duration) where appropriate. |
48 |
| - - Don't use emojis in the script. |
49 |
| - - Don't add any metadata about emotions or laughter in the script. |
50 |
| - </guidelines> |
| 36 | + <instructions> |
| 37 | + <instruction>Follow the PlannerAgent's instructions for each section.</instruction> |
| 38 | + <instruction>Use colloquial language and occasional filler words for natural dialogue.</instruction> |
| 39 | + <instruction>Start each section with a natural transition from the previous one.</instruction> |
| 40 | + <instruction>Don't say "let's start" or "let's continue". Avoid saying things like "On the next |
| 41 | + section, we will..."</instruction> |
| 42 | + <instruction>Avoid formal introductions or conclusions for sections/segments.</instruction> |
| 43 | + <instruction>Allow speakers to ask and answer questions naturally.</instruction> |
| 44 | + <instruction>Create ${min_segments}-${max_segments} segments per section, with a mix of short |
| 45 | + and |
| 46 | + long segments.</instruction> |
| 47 | + <instruction>Include some very short segments (1-2 words) for quick interactions and expressing |
| 48 | + emotions or reactions. For example: "Yeah.", "Right?", "So cool."</instruction> |
| 49 | + <instruction>Use pauses (blank_duration) where appropriate.</instruction> |
| 50 | + <instruction>Introduce the topics slowly; don't talk about the last topic in the introductions.</instruction> |
| 51 | + <instruction>Don't use emojis in the script.</instruction> |
| 52 | + <instruction>Don't add any metadata about emotions or laughter in the script.</instruction> |
| 53 | + </instructions> |
51 | 54 | <conversation-example>
|
52 | 55 | <![CDATA[
|
53 | 56 | {
|
|
64 | 67 | "speaker": "speaker2",
|
65 | 68 | "content": "Hold on tight, because...",
|
66 | 69 | "type": "reaction",
|
67 |
| - "blank_duration": 0.3 |
| 70 | + "blank_duration": 0.2 |
68 | 71 | },
|
69 | 72 | {
|
70 | 73 | "speaker": "speaker1",
|
|
76 | 79 | "speaker": "speaker2",
|
77 | 80 | "content": "That's right.",
|
78 | 81 | "type": "reaction",
|
79 |
| - "blank_duration": 0.3 |
| 82 | + "blank_duration": 0.2 |
80 | 83 | },
|
81 | 84 | {
|
82 | 85 | "speaker": "speaker1",
|
83 | 86 | "content": "And it's awesome. There are a lot of cheating accusations, so this is going to be fun.",
|
84 | 87 | "type": "narrative",
|
85 |
| - "blank_duration": 0.3 |
| 88 | + "blank_duration": 0.2 |
86 | 89 | },
|
87 | 90 | {
|
88 | 91 | "speaker": "speaker2",
|
89 | 92 | "content": "It always is, isn't it?",
|
90 | 93 | "type": "question",
|
91 |
| - "blank_duration": 0.3 |
| 94 | + "blank_duration": 0.2 |
92 | 95 | },
|
93 | 96 | {
|
94 | 97 | "speaker": "speaker1",
|
|
112 | 115 | "speaker": "speaker2",
|
113 | 116 | "content": "Exactly, it's part of the fun. We're trying to figure out what's going on in real-time.",
|
114 | 117 | "type": "narrative",
|
115 |
| - "blank_duration": 0.3 |
| 118 | + "blank_duration": 0.2 |
116 | 119 | },
|
117 | 120 | {
|
118 | 121 | "speaker": "speaker1",
|
119 | 122 | "content": "So the first line that caught my attention was... It seems to say \"look, they taught it from the CBA\". Well, I'm not sure what all that means, but...",
|
120 | 123 | "type": "narrative",
|
121 |
| - "blank_duration": 0.3 |
| 124 | + "blank_duration": 0.2 |
122 | 125 | },
|
123 | 126 | {
|
124 | 127 | "speaker": "speaker2",
|
125 | 128 | "content": "Yeah, CBA could be some kind of game or maybe a particular version of the game, a map, or a custom game mode. It gives us a bit more context.",
|
126 | 129 | "type": "narrative",
|
127 |
| - "blank_duration": 0.3 |
| 130 | + "blank_duration": 0.2 |
128 | 131 | },
|
129 | 132 | {
|
130 | 133 | "speaker": "speaker1",
|
|
136 | 139 | "speaker": "speaker2",
|
137 | 140 | "content": "Totally. We need more information to be our guide in this chat.",
|
138 | 141 | "type": "narrative",
|
139 |
| - "blank_duration": 0.3 |
| 142 | + "blank_duration": 0.2 |
140 | 143 | },
|
141 | 144 | {
|
142 | 145 | "speaker": "speaker1",
|
|
154 | 157 | "speaker": "speaker1",
|
155 | 158 | "content": "Yeah.",
|
156 | 159 | "type": "reaction",
|
157 |
| - "blank_duration": 0.3 |
| 160 | + "blank_duration": 0.2 |
158 | 161 | },
|
159 | 162 | {
|
160 | 163 | "speaker": "speaker2",
|
|
0 commit comments