1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
|
using System.Globalization;
using Whisper;
namespace MicrophoneCS
{
/// <summary>Implementation of Callbacks abstract class, to print these segments as soon as they’re produced by the library.</summary>
sealed class TranscribeCallbacks: Callbacks
{
readonly CommandLineArgs args;
readonly eResultFlags resultFlags;
public TranscribeCallbacks( CommandLineArgs args )
{
this.args = args;
resultFlags = args.resultFlags();
Console.OutputEncoding = System.Text.Encoding.UTF8;
}
// Terminal color map. 10 colors grouped in ranges [0.0, 0.1, ..., 0.9]
// Lowest is red, middle is yellow, highest is green.
readonly string[] k_colors = new string[]
{
"\x1B[38;5;196m", "\x1B[38;5;202m", "\x1B[38;5;208m", "\x1B[38;5;214m", "\x1B[38;5;220m",
"\x1B[38;5;226m", "\x1B[38;5;190m", "\x1B[38;5;154m", "\x1B[38;5;118m", "\x1B[38;5;82m"
};
int colorIndex( in sToken tok )
{
float p = tok.probability;
float p3 = p * p * p;
int col = (int)( p3 * k_colors.Length );
col = Math.Clamp( col, 0, k_colors.Length - 1 );
return col;
}
public static string printTime( TimeSpan ts ) =>
ts.ToString( "hh':'mm':'ss'.'fff", CultureInfo.InvariantCulture );
public static string printTimeWithComma( TimeSpan ts ) =>
ts.ToString( "hh':'mm':'ss','fff", CultureInfo.InvariantCulture );
protected override void onNewSegment( Context sender, int countNew )
{
TranscribeResult res = sender.results( resultFlags );
ReadOnlySpan<sToken> tokens = res.tokens;
int s0 = res.segments.Length - countNew;
if( s0 == 0 )
Console.WriteLine();
for( int i = s0; i < res.segments.Length; i++ )
{
sSegment seg = res.segments[ i ];
if( args.no_timestamps )
{
if( args.print_colors && AnsiCodes.enabled )
{
foreach( sToken tok in res.getTokens( seg ) )
{
if( !args.print_special && tok.hasFlag( eTokenFlags.Special ) )
continue;
Console.Write( "{0}{1}{2}", k_colors[ colorIndex( tok ) ], tok.text, "\x1B[0m" );
}
}
else
Console.Write( seg.text );
Console.Out.Flush();
continue;
}
string speaker = "";
if( args.diarize )
{
speaker = sender.detectSpeaker( seg.time ) switch
{
eSpeakerChannel.Unsure => "(speaker ?)",
eSpeakerChannel.Left => "(speaker 0)",
eSpeakerChannel.Right => "(speaker 1)",
_ => ""
};
}
if( args.print_colors && AnsiCodes.enabled )
{
Console.Write( "[{0} --> {1}] {2} ", printTime( seg.time.begin ), printTime( seg.time.end ), speaker );
foreach( sToken tok in res.getTokens( seg ) )
{
if( !args.print_special && tok.hasFlag( eTokenFlags.Special ) )
continue;
Console.Write( "{0}{1}{2}", k_colors[ colorIndex( tok ) ], tok.text, "\x1B[0m" );
}
Console.WriteLine();
}
else
Console.WriteLine( "[{0} --> {1}] {2} {3}", printTime( seg.time.begin ), printTime( seg.time.end ), speaker, seg.text );
}
}
}
}
|