2017-07-26 160 views
10

我试图录制音频并立即将其发送到IBM Watson Speech-To-Text进行转录。我已经测试了Watson从磁盘加载的WAV文件,并且工作。另一方面,我也测试了从麦克风录制并存储到磁盘,也很好。将WAV录制到IBM Watson语音转文本

但是,当我尝试使用NAudio WaveIn录制音频时,来自Watson的结果是空的,就好像没有音频一样。

任何人都可以照亮这一点,或有人有一些想法?

private async void StartHere() 
{ 
    var ws = new ClientWebSocket(); 
    ws.Options.Credentials = new NetworkCredential("*****", "*****"); 

    await ws.ConnectAsync(new Uri("wss://stream.watsonplatform.net/speech-to-text/api/v1/recognize?model=en-US_NarrowbandModel"), CancellationToken.None); 

    Task.WaitAll(ws.SendAsync(openingMessage, WebSocketMessageType.Text, true, CancellationToken.None), HandleResults(ws)); 

    Record(); 
} 

public void Record() 
{ 
    var waveIn = new WaveInEvent 
    { 
     BufferMilliseconds = 50, 
     DeviceNumber  = 0, 
     WaveFormat   = format 
    }; 

    waveIn.DataAvailable += new EventHandler(WaveIn_DataAvailable); 
    waveIn.RecordingStopped += new EventHandler(WaveIn_RecordingStopped); 
    waveIn.StartRecording(); 
} 

public void Stop() 
{ 
    await ws.SendAsync(closingMessage, WebSocketMessageType.Text, true, CancellationToken.None); 
} 

public void Close() 
{ 
    ws.CloseAsync(WebSocketCloseStatus.NormalClosure, "Close", CancellationToken.None).Wait(); 
} 

private void WaveIn_DataAvailable(object sender, WaveInEventArgs e) 
{ 
    await ws.SendAsync(new ArraySegment(e.Buffer), WebSocketMessageType.Binary, true, CancellationToken.None); 
} 

private async Task HandleResults(ClientWebSocket ws) 
{ 
    var buffer = new byte[1024]; 

    while (true) 
    { 
     var segment = new ArraySegment(buffer); 
     var result = await ws.ReceiveAsync(segment, CancellationToken.None); 

     if (result.MessageType == WebSocketMessageType.Close) 
     { 
      return; 
     } 

     int count = result.Count; 
     while (!result.EndOfMessage) 
     { 
      if (count >= buffer.Length) 
      { 
       await ws.CloseAsync(WebSocketCloseStatus.InvalidPayloadData, "That's too long", CancellationToken.None); 
       return; 
      } 

      segment = new ArraySegment(buffer, count, buffer.Length - count); 
      result = await ws.ReceiveAsync(segment, CancellationToken.None); 
      count += result.Count; 
     } 

     var message = Encoding.UTF8.GetString(buffer, 0, count); 

     // you'll probably want to parse the JSON into a useful object here, 
     // see ServiceState and IsDelimeter for a light-weight example of that. 
     Console.WriteLine(message); 

     if (IsDelimeter(message)) 
     { 
      return; 
     } 
    } 
} 

private bool IsDelimeter(String json) 
{ 
    MemoryStream stream = new MemoryStream(Encoding.UTF8.GetBytes(json)); 
    DataContractJsonSerializer ser = new DataContractJsonSerializer(typeof(ServiceState)); 
    ServiceState obj = (ServiceState) ser.ReadObject(stream); 

    return obj.state == "listening"; 
} 

[DataContract] 
internal class ServiceState 
{ 
    [DataMember] 
    public string state = ""; 
} 


编辑:我也尝试之前发送WAV“标题”来的StartRecording,这样

waveIn.DataAvailable += new EventHandler(WaveIn_DataAvailable); 
    waveIn.RecordingStopped += new EventHandler(WaveIn_RecordingStopped); 

    /* Send WAV "header" first */ 
    using (var stream = new MemoryStream()) 
    { 
     using (var writer = new BinaryWriter(stream, Encoding.UTF8)) 
     { 
      writer.Write(Encoding.UTF8.GetBytes("RIFF")); 
      writer.Write(0); // placeholder 
      writer.Write(Encoding.UTF8.GetBytes("WAVE")); 
      writer.Write(Encoding.UTF8.GetBytes("fmt ")); 

      format.Serialize(writer); 

      if (format.Encoding != WaveFormatEncoding.Pcm && format.BitsPerSample != 0) 
      { 
       writer.Write(Encoding.UTF8.GetBytes("fact")); 
       writer.Write(4); 
       writer.Write(0); 
      } 

      writer.Write(Encoding.UTF8.GetBytes("data")); 
      writer.Write(0); 
      writer.Flush(); 
     } 

     byte[] header = stream.ToArray(); 

     await ws.SendAsync(new ArraySegment(header), WebSocketMessageType.Binary, true, CancellationToken.None); 
    } 
    /* End WAV header */ 

    waveIn.StartRecording(); 

回答

相关问题