How to Create Speech to Text in a WPF C# Application

Question

I need a WPF C# application that takes live speech as input and converts it into text.

Accepted Answer

As Castorix31 said, you could use SpeechRecognitionEngine. Here is an example that you can refer to.

Add a reference to System.Speech to the project.

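MainWindow.xaml (the original markup was stripped from this page; the listing below is a reconstruction based on the control names used by the code-behind):

    <Window x:Class="SpeechToTextDemo.MainWindow"
            xmlns="http://schemas.microsoft.com/winfx/2006/xaml/presentation"
            xmlns:x="http://schemas.microsoft.com/winfx/2006/xaml"
            Title="MainWindow" Height="350" Width="525">
        <Grid>
            <Grid.RowDefinitions>
                <RowDefinition Height="Auto"/>
                <RowDefinition Height="*"/>
                <RowDefinition Height="Auto"/>
            </Grid.RowDefinitions>
            <Grid.ColumnDefinitions>
                <ColumnDefinition Width="Auto"/>
                <ColumnDefinition Width="*"/>
                <ColumnDefinition Width="*"/>
                <ColumnDefinition Width="Auto"/>
            </Grid.ColumnDefinitions>
            <Button x:Name="btnStart" Grid.Row="0" Grid.Column="0" Margin="5" Content="Start" IsEnabled="False" Click="btnStart_Click"/>
            <TextBlock x:Name="tHypothesized" Grid.Row="0" Grid.Column="1" Margin="5">Hypothesized</TextBlock>
            <TextBlock x:Name="tRecognized" Grid.Row="0" Grid.Column="2" Margin="5">Recognized</TextBlock>
            <TextBox x:Name="TextBox1" Grid.Row="1" Grid.Column="0" Grid.ColumnSpan="4" Margin="5" TextWrapping="Wrap" AcceptsReturn="True" VerticalScrollBarVisibility="Auto"/>
            <TextBlock Grid.Row="2" Grid.Column="0" Margin="5" VerticalAlignment="Center">Status:</TextBlock>
            <Label x:Name="lStatus" Grid.Row="2" Grid.Column="1" Margin="5"/>
            <TextBlock Grid.Row="2" Grid.Column="2" Grid.ColumnSpan="2" Margin="5" VerticalAlignment="Center">Speak "End Dictate" to stop.</TextBlock>
        </Grid>
    </Window>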

MainWindow.xaml.cs:

using System;  
using System.Linq;  
using System.Windows;  
using System.Speech.Recognition;  
using System.Threading;  
using System.Speech.Synthesis;  
  
namespace SpeechToTextDemo  
{  
    /// <summary>
    /// Code-behind for the dictation demo window. It drives a
    /// <see cref="SpeechRecognitionEngine"/> loaded with a dictation grammar plus an
    /// "End Dictate" command grammar, appends recognized phrases to <c>TextBox1</c>,
    /// and uses a <see cref="SpeechSynthesizer"/> to speak short status messages.
    /// </summary>
    public partial class MainWindow : Window
    {
        private enum State
        {
            Idle = 0,
            Accepting = 1,
            Off = 2,
        }

        // Spoken command that ends a dictation session; also loaded as its own grammar.
        private const string EndDictationCommand = "End Dictate";

        private State RecogState = State.Off;
        private SpeechRecognitionEngine srecog;
        private SpeechSynthesizer synth = null;
        private int Hypothesized = 0;
        private int Recognized = 0;

        /// <summary>
        /// Builds the window and defers speech setup until the window has loaded.
        /// </summary>
        public MainWindow()
        {
            InitializeComponent();
            this.Loaded += MainWindow_Loaded;
        }

        /// <summary>
        /// Creates the recognizer and synthesizer, binds the audio input and, when
        /// that succeeds, loads the grammars and enables the Start button.
        /// </summary>
        private void MainWindow_Loaded(object sender, RoutedEventArgs e)
        {
            InitializeRecognizerSynthesizer();

            if (SelectInputDevice())
            {
                LoadDictationGrammar();
                btnStart.IsEnabled = true;
                ReadAloud("Speech Engine Ready for Input");
            }
        }

        /// <summary>
        /// Creates the recognition engine and the synthesizer and wires the
        /// recognizer events to this window's handlers.
        /// </summary>
        private void InitializeRecognizerSynthesizer()
        {
            RecognizerInfo selectedRecognizer = SpeechRecognitionEngine.InstalledRecognizers()
                .FirstOrDefault(r => r.Culture.Equals(Thread.CurrentThread.CurrentCulture));

            // No installed recognizer may match the current culture. Passing null to the
            // RecognizerInfo constructor throws, so fall back to the system default recognizer.
            srecog = selectedRecognizer != null
                ? new SpeechRecognitionEngine(selectedRecognizer)
                : new SpeechRecognitionEngine();

            // Method-group subscriptions: the events are EventHandler<TEventArgs>, so the
            // non-generic EventHandler delegate cannot wrap these handlers.
            srecog.AudioStateChanged += recognizer_AudioStateChanged;
            srecog.SpeechHypothesized += recognizer_SpeechHypothesized;
            srecog.SpeechRecognized += recognizer_SpeechRecognized;

            synth = new SpeechSynthesizer();
        }

        /// <summary>
        /// Binds the recognizer to the default audio input device.
        /// </summary>
        /// <returns>
        /// <c>false</c> when binding fails on the direct path; otherwise <c>true</c>.
        /// On the thread-pool path the binding is only queued, so <c>true</c> is
        /// returned without waiting for it to complete.
        /// </returns>
        private bool SelectInputDevice()
        {
            if (!IsOscompatible())
            {
                ThreadPool.QueueUserWorkItem(InitSpeechRecogniser);
                return true;
            }

            try
            {
                srecog.SetInputToDefaultAudioDevice();
                return true;
            }
            catch (Exception ex)
            {
                // Leave the Start button disabled, but tell the user and the trace log why.
                System.Diagnostics.Trace.WriteLine("SetInputToDefaultAudioDevice failed: " + ex);
                lStatus.Content = "Audio input unavailable";
                return false;
            }
        }

        /// <summary>
        /// Reports whether <see cref="Environment.OSVersion"/> is greater than version 6.0.
        /// </summary>
        private bool IsOscompatible()
        {
            return Environment.OSVersion.Version > new Version("6.0");
        }

        /// <summary>
        /// Thread-pool callback that binds the recognizer to the default audio device.
        /// </summary>
        /// <param name="o">Unused work-item state.</param>
        private void InitSpeechRecogniser(object o)
        {
            try
            {
                srecog.SetInputToDefaultAudioDevice();
            }
            catch (Exception ex)
            {
                // An unhandled exception on a thread-pool thread would terminate the process.
                System.Diagnostics.Trace.WriteLine("SetInputToDefaultAudioDevice failed: " + ex);
            }
        }

        /// <summary>
        /// Loads the "End Dictate" command grammar and the free-text dictation grammar.
        /// </summary>
        private void LoadDictationGrammar()
        {
            GrammarBuilder commandBuilder = new GrammarBuilder();
            commandBuilder.Append(new Choices(EndDictationCommand));
            Grammar commandGrammar = new Grammar(commandBuilder) { Name = "main command grammar" };
            srecog.LoadGrammar(commandGrammar);

            DictationGrammar dictationGrammar = new DictationGrammar { Name = "dictation" };
            srecog.LoadGrammar(dictationGrammar);
        }

        /// <summary>
        /// Mirrors the recognizer's audio state in the status label.
        /// </summary>
        private void recognizer_AudioStateChanged(object sender, AudioStateChangedEventArgs e)
        {
            switch (e.AudioState)
            {
                case AudioState.Speech:
                    lStatus.Content = "Listening";
                    break;
                case AudioState.Silence:
                    lStatus.Content = "Idle";
                    break;
                case AudioState.Stopped:
                    lStatus.Content = "Stopped";
                    break;
            }
        }

        /// <summary>
        /// Counts hypothesis events and shows the running total.
        /// </summary>
        private void recognizer_SpeechHypothesized(object sender, SpeechHypothesizedEventArgs e)
        {
            Hypothesized++;
            tHypothesized.Text = "Hypothesized: " + Hypothesized.ToString();
        }

        /// <summary>
        /// Counts recognition events and, while dictation is active, either appends
        /// the recognized phrase to the text box or ends the session when the phrase
        /// is the "End Dictate" command.
        /// </summary>
        private void recognizer_SpeechRecognized(object sender, SpeechRecognizedEventArgs e)
        {
            Recognized++;
            tRecognized.Text = "Recognized: " + Recognized.ToString();

            if (RecogState == State.Off)
            {
                return;
            }

            string phrase = e.Result.Text;

            // Case-insensitive so the command still matches if the result text is cased differently.
            if (string.Equals(phrase, EndDictationCommand, StringComparison.OrdinalIgnoreCase))
            {
                RecogState = State.Off;
                // Keep the button caption in sync with the state, as btnStart_Click does.
                btnStart.Content = "Start";
                srecog.RecognizeAsyncStop();
                ReadAloud("Dictation Ended");
                return;
            }

            TextBox1.AppendText(" " + phrase);
        }

        /// <summary>
        /// Cancels any running recognition and speaks <paramref name="speakText"/>
        /// asynchronously. Failures are traced and otherwise ignored (best effort).
        /// </summary>
        /// <param name="speakText">Text to speak.</param>
        public void ReadAloud(string speakText)
        {
            try
            {
                srecog.RecognizeAsyncCancel();
                synth.SpeakAsync(speakText);
            }
            catch (Exception ex)
            {
                System.Diagnostics.Trace.WriteLine("ReadAloud failed: " + ex);
            }
        }

        /// <summary>
        /// Toggles dictation: starts continuous recognition when off, stops it when accepting.
        /// </summary>
        private void btnStart_Click(object sender, RoutedEventArgs e)
        {
            switch (RecogState)
            {
                case State.Off:
                    RecogState = State.Accepting;
                    btnStart.Content = "Stop";
                    srecog.RecognizeAsync(RecognizeMode.Multiple);
                    break;
                case State.Accepting:
                    RecogState = State.Off;
                    btnStart.Content = "Start";
                    srecog.RecognizeAsyncStop();
                    break;
            }
        }

        /// <summary>
        /// Disposes the speech engine and synthesizer when the window closes.
        /// </summary>
        protected override void OnClosed(EventArgs e)
        {
            if (srecog != null)
            {
                srecog.Dispose();
            }

            if (synth != null)
            {
                synth.Dispose();
            }

            base.OnClosed(e);
        }
    }
}

----------------------------------------------------------------------------

If the response is helpful, please click "Accept Answer" and upvote it.
Note: Please follow the steps in our documentation to enable e-mail notifications if you want to receive the related email notification for this thread.

Answer

Speech to Text
speech and convert into text

Which one now, Speech to text or text to speech?
Search the internet; you will find examples and solutions for both.

Answer

There should be SpeechRecognitionEngine,
but I cannot make it work on my French OS (although I configured Speech Recognition in Control Panel)

Answer

Open Visual Studio and create a new Console Application project.

Add a reference to the System.Speech assembly. Right-click on the project in Solution Explorer, select Add Reference, and then choose System.Speech from the list of assemblies.

In the Program.cs file

Answer

Create WPF window as below


    
        
            
                
                
                
            
            
                
                
                
                
            
            
            Hypothesized
            Recognized
            
            Status:
            Speak "End Dictate" to stop.

Share via

How to Create Speech to Text in wpf c# application

4 additional answers