-
-
Notifications
You must be signed in to change notification settings - Fork 98
/
Copy pathProgram.cs
61 lines (51 loc) · 2.86 KB
/
Program.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
// Licensed under the MIT license: https://opensource.org/licenses/MIT
using System;
using System.IO;
using System.Threading.Tasks;
using NAudio.Wave.SampleProviders;
using NAudio.Wave;
using Whisper.net;
using Whisper.net.Ggml;
public class Program
{
// This example shows how to use the NAudio library to convert a wav file to a wav file with 16Khz sample rate and then use the Whisper library to process the wav file.
// The converstion is needed because the Whisper library only supports wav files with 16Khz sample rate, other sample rates are not supported and NotSupportedWaveException will be thrown.
public static async Task Main(string[] args)
{
// We declare three variables which we will use later, ggmlType, modelFileName and inputFileName
var ggmlType = GgmlType.Base;
var modelFileName = "ggml-base.bin";
var inputFileName = "kennedy44100.wav";
// This section detects whether the "ggml-base.bin" file exists in our project disk. If it doesn't, it downloads it from the internet
if (!File.Exists(modelFileName))
{
await DownloadModel(modelFileName, ggmlType);
}
// This section creates the whisperFactory object which is used to create the processor object.
using var whisperFactory = WhisperFactory.FromPath("ggml-base.bin");
// This section creates the processor object which is used to process the audio file, it uses language `auto` to detect the language of the audio file.
using var processor = whisperFactory.CreateBuilder()
.WithLanguage("auto")
.Build();
// This section opens the audio file and converts it to a wav file with 16Khz sample rate.
using var fileStream = File.OpenRead(inputFileName);
using var wavStream = new MemoryStream();
using var reader = new WaveFileReader(fileStream);
var resampler = new WdlResamplingSampleProvider(reader.ToSampleProvider(), 16000);
WaveFileWriter.WriteWavFileToStream(wavStream, resampler.ToWaveProvider16());
// This section sets the wavStream to the beginning of the stream. (This is required because the wavStream was written to in the previous section)
wavStream.Seek(0, SeekOrigin.Begin);
// This section processes the audio file and prints the results (start time, end time and text) to the console.
await foreach (var result in processor.ProcessAsync(wavStream))
{
Console.WriteLine($"{result.Start}->{result.End}: {result.Text}");
}
}
private static async Task DownloadModel(string fileName, GgmlType ggmlType)
{
Console.WriteLine($"Downloading Model {fileName}");
using var modelStream = await WhisperGgmlDownloader.GetGgmlModelAsync(ggmlType);
using var fileWriter = File.OpenWrite(fileName);
await modelStream.CopyToAsync(fileWriter);
}
}