File size: 4,801 Bytes
f50ece4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
<svg xmlns="http://www.w3.org/2000/svg" width="800" height="460" viewBox="0 0 800 460" role="img" aria-labelledby="tenTurnTitle tenTurnDesc">
  <!--
    Flow diagram: Human, then TEN Turn Detection (three states), then AI behavior.
    The canvas is 800x460 user units; all coordinates below are absolute.
  -->
  <title id="tenTurnTitle">TEN Turn Detection in Full-Duplex Dialogue</title>
  <desc id="tenTurnDesc">Human speech flows into TEN Turn Detection, which classifies it as Finished, Wait, or Unfinished. Finished leads to the AI starting to speak; Wait and Unfinished lead to the AI continuing to listen.</desc>

  <!--
    Arrowhead markers, declared before the paths that reference them.
    Each is a 9x6 triangle whose tip (refX=9, refY=3) is pinned to the path end;
    markerUnits="strokeWidth" scales the head with the stroke width of the path.
    One marker per color because the marker fill is fixed in the marker itself.
  -->
  <defs>
    <marker id="arrow1" markerWidth="12" markerHeight="12" refX="9" refY="3" orient="auto" markerUnits="strokeWidth">
      <path d="M0,0 L0,6 L9,3 z" fill="#ffffff"/>
    </marker>
    <marker id="arrow2" markerWidth="12" markerHeight="12" refX="9" refY="3" orient="auto" markerUnits="strokeWidth">
      <path d="M0,0 L0,6 L9,3 z" fill="#ffffff"/>
    </marker>
    <marker id="arrowBlue" markerWidth="12" markerHeight="12" refX="9" refY="3" orient="auto" markerUnits="strokeWidth">
      <path d="M0,0 L0,6 L9,3 z" fill="#3949ab"/>
    </marker>
    <marker id="arrowPink" markerWidth="12" markerHeight="12" refX="9" refY="3" orient="auto" markerUnits="strokeWidth">
      <path d="M0,0 L0,6 L9,3 z" fill="#d81b60"/>
    </marker>
    <marker id="arrowPurple" markerWidth="12" markerHeight="12" refX="9" refY="3" orient="auto" markerUnits="strokeWidth">
      <path d="M0,0 L0,6 L9,3 z" fill="#8e24aa"/>
    </marker>
  </defs>

  <!-- Background: full-canvas dark panel with rounded corners -->
  <rect width="800" height="460" fill="#1e2430" rx="10" ry="10"/>

  <!-- Title, centered horizontally on the canvas (x=400) -->
  <text x="400" y="50" font-family="Arial, sans-serif" font-size="26" font-weight="bold" text-anchor="middle" fill="#ffffff">TEN Turn Detection in Full-Duplex Dialogue</text>

  <!-- Human node -->
  <circle cx="140" cy="230" r="50" fill="#4a90e2" opacity="0.9"/>
  <text x="140" y="235" font-family="Arial, sans-serif" font-size="20" font-weight="bold" text-anchor="middle" fill="white">Human</text>

  <!-- Human to TEN Turn Detection: starts at the circle's right edge (x=190), ends just left of the container (x=270) -->
  <path d="M190 230 C 215 230, 240 230, 265 230" stroke="#ffffff" stroke-width="3" fill="none" marker-end="url(#arrow1)"/>

  <!--
    TEN Turn Detection container.
    Height is 240 (y=120..360) so the last state box, which ends at y=340,
    keeps a 20-unit gap from the bottom border instead of sitting on it.
  -->
  <rect x="270" y="120" width="280" height="240" rx="15" ry="15" fill="#283446" stroke="#3a4a61" stroke-width="3"/>
  <text x="410" y="150" font-family="Arial, sans-serif" font-size="22" font-weight="bold" text-anchor="middle" fill="#f1c40f">TEN Turn Detection</text>

  <!-- Detection states inside the container: three 220x50 boxes stacked at 60-unit intervals -->
  <rect x="300" y="170" width="220" height="50" rx="8" ry="8" fill="#3949ab" opacity="0.8" stroke="#5465bd" stroke-width="2"/>
  <text x="410" y="200" font-family="Arial, sans-serif" font-size="18" font-weight="bold" text-anchor="middle" fill="#ffffff">Finished</text>

  <rect x="300" y="230" width="220" height="50" rx="8" ry="8" fill="#d81b60" opacity="0.8" stroke="#e63980" stroke-width="2"/>
  <text x="410" y="260" font-family="Arial, sans-serif" font-size="18" font-weight="bold" text-anchor="middle" fill="#ffffff">Wait</text>

  <rect x="300" y="290" width="220" height="50" rx="8" ry="8" fill="#8e24aa" opacity="0.8" stroke="#a040c5" stroke-width="2"/>
  <text x="410" y="320" font-family="Arial, sans-serif" font-size="18" font-weight="bold" text-anchor="middle" fill="#ffffff">Unfinished</text>

  <!-- TEN Turn Detection to AI: generic flow arrow leaving the container's right edge (x=550) -->
  <path d="M550 230 C 575 230, 600 230, 625 230" stroke="#ffffff" stroke-width="3" fill="none" marker-end="url(#arrow2)"/>

  <!-- AI node "Start Speaking": filled disc plus a separate full-opacity outline ring -->
  <circle cx="670" cy="170" r="40" fill="#9b59b6" opacity="0.9"/>
  <circle cx="670" cy="170" r="40" fill="none" stroke="#b67ad2" stroke-width="2"/>
  <text x="670" y="165" font-family="Arial, sans-serif" font-size="16" font-weight="bold" text-anchor="middle" fill="white">AI</text>
  <text x="670" y="185" font-family="Arial, sans-serif" font-size="14" text-anchor="middle" fill="white">Start Speaking</text>

  <!-- AI node "Keep Listening": same construction as the node above -->
  <circle cx="670" cy="290" r="40" fill="#9b59b6" opacity="0.9"/>
  <circle cx="670" cy="290" r="40" fill="none" stroke="#b67ad2" stroke-width="2"/>
  <text x="670" y="285" font-family="Arial, sans-serif" font-size="16" font-weight="bold" text-anchor="middle" fill="white">AI</text>
  <text x="670" y="305" font-family="Arial, sans-serif" font-size="14" text-anchor="middle" fill="white">Keep Listening</text>

  <!--
    State to AI behavior links. Each starts at the right edge (x=520) and vertical
    center of its state box and is colored to match that box:
    Finished ends at Start Speaking; Wait and Unfinished both end at Keep Listening.
  -->
  <path d="M520 195 C 555 195, 590 195, 625 170" stroke="#3949ab" stroke-width="2.5" fill="none" marker-end="url(#arrowBlue)"/>
  <path d="M520 255 C 555 255, 590 255, 625 290" stroke="#d81b60" stroke-width="2.5" fill="none" marker-end="url(#arrowPink)"/>
  <path d="M520 315 C 555 315, 590 315, 625 290" stroke="#8e24aa" stroke-width="2.5" fill="none" marker-end="url(#arrowPurple)"/>

  <!-- Caption below the diagram -->
  <text x="400" y="385" font-family="Arial, sans-serif" font-size="16" font-weight="bold" text-anchor="middle" fill="#f1c40f">Speech State Analysis</text>
  <text x="400" y="415" font-family="Arial, sans-serif" font-size="14" text-anchor="middle" fill="#ffffff">Real-time classification of human speech patterns</text>
</svg>