<!DOCTYPE html>
<html lang="en">
<title>SpeechRecognition Phrases</title>

<script src="/resources/testharness.js"></script>
<script src="/resources/testharnessreport.js"></script>

<script>
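// Decodes an audio fixture with the Web Audio API and routes it through a
// MediaStreamAudioDestinationNode, yielding a live MediaStreamTrack that can
// stand in for microphone input when passed to SpeechRecognition.start().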
async function getAudioTrackFromFile(filePath) {
  const audioContext = new AudioContext();
  const response = await fetch(filePath);
  const arrayBuffer = await response.arrayBuffer();
  const audioBuffer = await audioContext.decodeAudioData(arrayBuffer);
  const source = audioContext.createBufferSource();
  source.buffer = audioBuffer;

  const destination = audioContext.createMediaStreamDestination();
  source.connect(destination);
  source.start();

  return destination.stream.getAudioTracks()[0];
}

promise_test(async (t) => {
  // Verify the audio track for recognition context exists.
  const audioTrack = await getAudioTrackFromFile("/media/recognition_context.mp3");
  assert_true(
    audioTrack instanceof MediaStreamTrack,
    "Audio track should be a valid MediaStreamTrack"
  );

  // Create the first speech recognition with a mode that does not support contextual biasing.
  // Note that this may vary between browsers in the future.
  window.SpeechRecognition = window.SpeechRecognition || window.webkitSpeechRecognition;
  const recognition1 = new SpeechRecognition();
  recognition1.mode = "cloud-only";
  recognition1.lang = "en-US";

  recognition1.onerror = function(event) {
    assert_equals(
      event.error,
      "phrases-not-supported",
      "First speech recognition should throw a phrases-not-supported error"
    );
  };
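
  // Assigning a phrase list in a mode without biasing support is expected to
  // surface the "phrases-not-supported" error handled above; the exact timing
  // (on assignment vs. on start()) may vary under the draft contextual-biasing
  // proposal.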
  recognition1.phrases = new SpeechRecognitionPhraseList([
    new SpeechRecognitionPhrase("test", 1.0)
  ]);

  // Create the second speech recognition with a mode that supports contextual biasing.
  const recognition2 = new SpeechRecognition();
  recognition2.mode = "ondevice-only";
  recognition2.lang = "en-US";

  recognition2.onerror = function(event) {
    // Currently WPT may not be able to detect whether SODA (Chrome's on-device
    // speech recognition) is available and may report a "language-not-supported"
    // error here.
    assert_unreached("Caught an error: " + event.error);
  };
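
  // Bias recognition toward "ASIC" and "FPGA", which are easily misheard as
  // common words. A boost of 1.0 is used here; per the draft proposal the
  // boost is a float weight, with larger values biasing more strongly.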
  recognition2.phrases = new SpeechRecognitionPhraseList([
    new SpeechRecognitionPhrase("ASIC", 1.0),
    new SpeechRecognitionPhrase("FPGA", 1.0)
  ]);
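
  // Wrap the first recognition result in a Promise so the test can await the
  // transcript below.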
  const recognitionPromise = new Promise((resolve) => {
    recognition2.onresult = (event) => {
      const transcript = event.results[0][0].transcript;
      resolve(transcript);
    };
  });
  recognition2.start(audioTrack);

  const transcript = await recognitionPromise;
  assert_equals(
    transcript.toLowerCase(),
    "the report confirmed that the asic's throughput and " +
    "the fpga's latency were both below expectations",
    "Second speech recognition should correctly recognize the phrases"
  );
}, "SpeechRecognition should recognize speech with the given contextual information.");
</script>
</html>