more hey jibo and word of the day changes

This commit is contained in:
Jacob Dubin
2026-04-18 21:41:21 -05:00
parent d4b33a1635
commit 16768a0c80
13 changed files with 5994 additions and 0 deletions

View File

@@ -39,6 +39,11 @@ public sealed class WebSocketTurnFinalizationService(
CancellationToken cancellationToken = default)
{
var turnState = session.TurnState;
if (ShouldIgnoreLateAudio(session))
{
return [];
}
session.LastMessageType = "BINARY_AUDIO";
turnState.FirstAudioReceivedUtc ??= DateTimeOffset.UtcNow;
turnState.BufferedAudioChunkCount += 1;
@@ -312,6 +317,7 @@ public sealed class WebSocketTurnFinalizationService(
turnState.SawContext = false;
turnState.ListenHotphrase = false;
turnState.HotphraseEmptyTurnCount = 0;
turnState.IgnoreAdditionalAudioUntilUtc = null;
turnState.ListenRules = [];
turnState.ListenAsrHints = [];
}
@@ -359,6 +365,11 @@ public sealed class WebSocketTurnFinalizationService(
}
var turnState = session.TurnState;
if (ShouldTreatBufferedHotphraseAsGreeting(finalizedTurn, turnState, allowFallbackOnMissingTranscript))
{
finalizedTurn = WithSyntheticTranscript(finalizedTurn, "hello");
}
if (ShouldIgnoreCompletedWordOfDayTurn(finalizedTurn))
{
turnState.AwaitingTurnCompletion = false;
@@ -459,6 +470,9 @@ public sealed class WebSocketTurnFinalizationService(
? DateTimeOffset.UtcNow.Add(plan.FollowUp.Timeout)
: null;
turnState.AwaitingTurnCompletion = false;
turnState.IgnoreAdditionalAudioUntilUtc = plan.FollowUp.KeepMicOpen
? null
: DateTimeOffset.UtcNow.Add(WebSocketTurnState.DefaultLateAudioIgnoreWindow);
var emitSkillActions = messageType != "CLIENT_NLU" &&
!string.Equals(plan.IntentName, "word_of_the_day", StringComparison.OrdinalIgnoreCase) &&
@@ -488,6 +502,15 @@ public sealed class WebSocketTurnFinalizationService(
turnAge >= AutoFinalizeMinTurnAge;
}
private static bool ShouldIgnoreLateAudio(CloudSession session)
{
var ignoreUntilUtc = session.TurnState.IgnoreAdditionalAudioUntilUtc;
return !session.TurnState.AwaitingTurnCompletion &&
!session.FollowUpOpen &&
ignoreUntilUtc.HasValue &&
ignoreUntilUtc.Value > DateTimeOffset.UtcNow;
}
private static string? ExtractDataPayload(string? text)
{
if (string.IsNullOrWhiteSpace(text))
@@ -701,6 +724,31 @@ public sealed class WebSocketTurnFinalizationService(
.Any(static rule => string.Equals(rule, "word-of-the-day/right_word", StringComparison.OrdinalIgnoreCase));
}
private static bool ShouldTreatBufferedHotphraseAsGreeting(
TurnContext turn,
WebSocketTurnState turnState,
bool allowFallbackOnMissingTranscript)
{
if (!allowFallbackOnMissingTranscript || !ReadBoolAttribute(turn, "listenHotphrase"))
{
return false;
}
if (!ReadRules(turn, "listenRules")
.Any(static rule => string.Equals(rule, "launch", StringComparison.OrdinalIgnoreCase)))
{
return false;
}
if (!string.IsNullOrWhiteSpace(turn.NormalizedTranscript) || !string.IsNullOrWhiteSpace(turn.RawTranscript))
{
return false;
}
return turnState.BufferedAudioBytes >= AutoFinalizeMinBufferedAudioBytes &&
(turnState.FinalizeAttemptCount > 0 || !string.IsNullOrWhiteSpace(turnState.LastSttError));
}
private static bool ShouldTreatEmptyHotphraseTurnAsGreeting(TurnContext turn)
{
if (!string.IsNullOrWhiteSpace(turn.NormalizedTranscript) || !string.IsNullOrWhiteSpace(turn.RawTranscript))

View File

@@ -2,10 +2,13 @@ namespace Jibo.Cloud.Domain.Models;
public sealed class WebSocketTurnState
{
public static readonly TimeSpan DefaultLateAudioIgnoreWindow = TimeSpan.FromSeconds(2);
public string? TransId { get; set; }
public string? ContextPayload { get; set; }
public bool ListenHotphrase { get; set; }
public int HotphraseEmptyTurnCount { get; set; }
public DateTimeOffset? IgnoreAdditionalAudioUntilUtc { get; set; }
public string? AudioTranscriptHint { get; set; }
public string? LastSttError { get; set; }
public DateTimeOffset? LastSttErrorUtc { get; set; }