forked from sandrohanea/whisper.net
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Fixed sandrohanea#57 Using WhisperProcessor.ProcessAsync more than on…
…ce (sandrohanea#58) * Fixed sandrohanea#57 Using WhisperProcessor.ProcessAsync more than once * Passed cancellationToken to processingSemaphore Wait and called WaitAsync * Simplified the initialization for ProcessInternalAsync
- Loading branch information
1 parent
51113a8
commit 9b627f0
Showing
3 changed files
with
186 additions
and
87 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,154 @@ | ||
// Licensed under the MIT license: https://opensource.org/licenses/MIT | ||
|
||
using FluentAssertions; | ||
using NUnit.Framework; | ||
using Whisper.net.Ggml; | ||
|
||
namespace Whisper.net.Tests; | ||
|
||
public class ProcessFunctionalTests | ||
{ | ||
private string ggmlModelPath = string.Empty; | ||
|
||
[OneTimeSetUp] | ||
public async Task SetupAsync() | ||
{ | ||
ggmlModelPath = Path.GetTempFileName(); | ||
var model = await WhisperGgmlDownloader.GetGgmlModelAsync(GgmlType.Tiny); | ||
using var fileWriter = File.OpenWrite(ggmlModelPath); | ||
await model.CopyToAsync(fileWriter); | ||
} | ||
|
||
[OneTimeTearDown] | ||
public void TearDown() | ||
{ | ||
File.Delete(ggmlModelPath); | ||
} | ||
|
||
[Test] | ||
public void TestHappyFlow() | ||
{ | ||
var segments = new List<SegmentData>(); | ||
var progress = new List<int>(); | ||
var encoderBegins = new List<EncoderBeginData>(); | ||
using var factory = WhisperFactory.FromPath(ggmlModelPath); | ||
using var processor = factory.CreateBuilder() | ||
.WithLanguage("en") | ||
.WithEncoderBeginHandler((e) => | ||
{ | ||
encoderBegins.Add(e); | ||
return true; | ||
}) | ||
.WithPrompt("I am Kennedy") | ||
.WithProgressHandler(progress.Add) | ||
.WithSegmentEventHandler(segments.Add) | ||
.Build(); | ||
|
||
using var fileReader = File.OpenRead("kennedy.wav"); | ||
processor.Process(fileReader); | ||
|
||
segments.Should().HaveCountGreaterThan(0); | ||
encoderBegins.Should().HaveCount(1); | ||
progress.Should().BeInAscendingOrder().And.HaveCountGreaterThan(1); | ||
|
||
segments.Should().Contain(segmentData => segmentData.Text.Contains("nation should commit")); | ||
} | ||
|
||
[Test] | ||
public void TestCancelEncoder() | ||
{ | ||
var segments = new List<SegmentData>(); | ||
var encoderBegins = new List<EncoderBeginData>(); | ||
using var factory = WhisperFactory.FromPath(ggmlModelPath); | ||
using var processor = factory.CreateBuilder() | ||
.WithLanguage("en") | ||
.WithEncoderBeginHandler((e) => | ||
{ | ||
encoderBegins.Add(e); | ||
return false; | ||
}) | ||
.WithSegmentEventHandler(segments.Add) | ||
.Build(); | ||
|
||
using var fileReader = File.OpenRead("kennedy.wav"); | ||
processor.Process(fileReader); | ||
|
||
segments.Should().HaveCount(0); | ||
encoderBegins.Should().HaveCount(1); | ||
} | ||
|
||
[Test] | ||
public async Task TestAutoDetectLanguageWithRomanian() | ||
{ | ||
var segments = new List<SegmentData>(); | ||
var encoderBegins = new List<EncoderBeginData>(); | ||
using var factory = WhisperFactory.FromPath(ggmlModelPath); | ||
using var processor = factory.CreateBuilder() | ||
.WithLanguageDetection() | ||
.WithEncoderBeginHandler((e) => | ||
{ | ||
encoderBegins.Add(e); | ||
return true; | ||
}) | ||
.Build(); | ||
using var fileReader = File.OpenRead("romana.wav"); | ||
await foreach (var segment in processor.ProcessAsync(fileReader)) | ||
{ | ||
segments.Add(segment); | ||
} | ||
segments.Should().HaveCountGreaterThan(0); | ||
encoderBegins.Should().HaveCount(1); | ||
segments.Should().AllSatisfy(s => s.Language.Should().Be("ro")); | ||
segments.Should().Contain(segmentData => segmentData.Text.Contains("efectua")); | ||
} | ||
|
||
[Test] | ||
public async Task Process_WhenMultichannel_ProcessCorrectly() | ||
{ | ||
var segments = new List<SegmentData>(); | ||
|
||
using var factory = WhisperFactory.FromPath(ggmlModelPath); | ||
await using var processor = factory.CreateBuilder() | ||
.WithLanguage("en") | ||
.WithSegmentEventHandler(segments.Add) | ||
.Build(); | ||
|
||
using var fileReader = File.OpenRead("multichannel.wav"); | ||
processor.Process(fileReader); | ||
|
||
segments.Should().HaveCountGreaterThanOrEqualTo(1); | ||
} | ||
|
||
[Test] | ||
public async Task Process_CalledMultipleTimes_Serially_WillCompleteEverytime() | ||
{ | ||
|
||
var segments1 = new List<SegmentData>(); | ||
var segments2 = new List<SegmentData>(); | ||
var segments3 = new List<SegmentData>(); | ||
|
||
OnSegmentEventHandler onNewSegment = segments1.Add; | ||
|
||
using var factory = WhisperFactory.FromPath(ggmlModelPath); | ||
await using var processor = factory.CreateBuilder() | ||
.WithLanguage("en") | ||
.WithSegmentEventHandler((s) => onNewSegment(s)) | ||
.Build(); | ||
|
||
using var fileReader1 = File.OpenRead("kennedy.wav"); | ||
processor.Process(fileReader1); | ||
|
||
onNewSegment = segments2.Add; | ||
|
||
using var fileReader2 = File.OpenRead("kennedy.wav"); | ||
processor.Process(fileReader2); | ||
|
||
onNewSegment = segments3.Add; | ||
|
||
using var fileReader3 = File.OpenRead("kennedy.wav"); | ||
processor.Process(fileReader3); | ||
|
||
segments1.Should().BeEquivalentTo(segments2); | ||
segments2.Should().BeEquivalentTo(segments3); | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters