1

这是我用于录制音频并将音频剪辑(AudioClip)保存为 wav 文件的代码:

 /// <summary>
 /// Starts a microphone recording and keeps the resulting clip in <c>aud</c>.
 /// </summary>
 public void startRec()
     {
         // Recording parameters: one non-looping take of at most 10 seconds at 16 kHz.
         const bool loopRecording = false;
         const int maxLengthSeconds = 10;
         const int sampleRateHz = 16000;

         // The device name is passed as null (Unity documents this as "use the default
         // microphone" -- see the Microphone.Start reference).
         aud = Microphone.Start(null, loopRecording, maxLengthSeconds, sampleRateHz);
     }
 /// <summary>
 /// Stops the microphone and saves the clip held in <c>aud</c> through
 /// <c>Save("test", aud)</c>, which appends the ".wav" extension.
 /// </summary>
 public void stopRec()
     {
         Microphone.End(null);

         // Guard against being called while no clip has been assigned to `aud`;
         // passing null on to Save would fail while reading the clip's samples.
         if (aud == null)
         {
             Debug.LogWarning("stopRec: no recorded clip is available, nothing was saved.");
             return;
         }

         Save("test", aud);
     }
 /// <summary>
 /// Writes <paramref name="clip"/> as a WAV file under <c>Application.dataPath</c>.
 /// </summary>
 /// <param name="filename">
 /// File name relative to <c>Application.dataPath</c>; ".wav" is appended when missing
 /// (the check ignores case). May contain sub-directories, which are created on demand.
 /// </param>
 /// <param name="clip">The audio clip whose samples are written.</param>
 /// <returns>
 /// <c>true</c> when the file was written; <c>false</c> when an argument is missing or
 /// the file could not be written (the reason is logged).
 /// </returns>
 public static bool Save(string filename, AudioClip clip) {
         if (string.IsNullOrEmpty(filename) || clip == null) {
             Debug.LogError("Save: a file name and an AudioClip are required.");
             return false;
         }

         // Ordinal, case-insensitive comparison: a file extension is not linguistic text,
         // so the current culture must not influence the result.
         if (!filename.EndsWith(".wav", System.StringComparison.OrdinalIgnoreCase)) {
             filename += ".wav";
         }

         var filepath = Application.dataPath + "/" + filename;

         Debug.Log(filepath);

         try {
             // Make sure directory exists if user is saving to sub dir.
             Directory.CreateDirectory(Path.GetDirectoryName(filepath));

             using (var fileStream = CreateEmpty(filepath)) {
                 // Sample data goes first; the header is written last because it seeks
                 // back to offset 0 and needs the final stream length for its size fields.
                 ConvertAndWrite(fileStream, clip);
                 WriteHeader(fileStream, clip);
             }
         }
         catch (IOException e) {
             Debug.LogError("Save: could not write '" + filepath + "': " + e.Message);
             return false;
         }
         catch (System.UnauthorizedAccessException e) {
             Debug.LogError("Save: access denied for '" + filepath + "': " + e.Message);
             return false;
         }

         return true;
     }

 /// <summary>
 /// Converts the clip's float samples to 16-bit little-endian PCM and writes them to
 /// <paramref name="fileStream"/> at its current position.
 /// </summary>
 /// <param name="fileStream">Destination stream, positioned where sample data should start.</param>
 /// <param name="clip">Clip whose samples are read with <c>GetData</c> starting at offset 0.</param>
 static void ConvertAndWrite(FileStream fileStream, AudioClip clip) {

         // One float per sample per channel. Sizing the buffer with clip.samples alone
         // would drop part of a multi-channel clip and disagree with the data size
         // (samples * channels * 2) that the WAV header declares.
         var samples = new float[clip.samples * clip.channels];

         clip.GetData(samples, 0);

         // Each float becomes one Int16, i.e. two bytes.
         var bytesData = new Byte[samples.Length * 2];

         const float rescaleFactor = 32767; //to convert float to Int16

         for (int i = 0; i < samples.Length; i++) {
             float scaled = samples[i] * rescaleFactor;

             // Clamp before casting: an out-of-range float would otherwise wrap around
             // in the (short) cast and produce a loud click instead of clipping.
             if (scaled > Int16.MaxValue) {
                 scaled = Int16.MaxValue;
             } else if (scaled < Int16.MinValue) {
                 scaled = Int16.MinValue;
             }

             short value = (short) scaled;

             // WAV PCM is little-endian; write the low byte first explicitly rather than
             // relying on the host byte order used by BitConverter.
             bytesData[i * 2] = (byte) (value & 0xFF);
             bytesData[i * 2 + 1] = (byte) ((value >> 8) & 0xFF);
         }

         fileStream.Write(bytesData, 0, bytesData.Length);
     }

     /// <summary>
     /// Writes a 44-byte 16-bit PCM WAV header at the start of <paramref name="fileStream"/>
     /// and then closes the stream.
     /// </summary>
     /// <param name="fileStream">
     /// Stream that already contains the sample data after the first 44 bytes; the header
     /// overwrites bytes 0-43.
     /// </param>
     /// <param name="clip">Source of the sample rate and channel count stored in the header.</param>
     static void WriteHeader(FileStream fileStream, AudioClip clip) {

         const int headerSize = 44;        // total bytes written by this method
         const ushort pcmFormat = 1;       // audio format field
         const ushort bitsPerSample = 16;
         const int bytesPerSample = bitsPerSample / 8;

         int hz = clip.frequency;
         ushort channels = (ushort) clip.channels;

         // Size fields are derived from what is actually in the stream, so the header
         // always matches the file even if the amount of sample data written differs
         // from what the clip metadata suggests.
         long totalLength = System.Math.Max(fileStream.Length, (long) headerSize);
         uint riffChunkSize = (uint) (totalLength - 8);
         uint dataChunkSize = (uint) (totalLength - headerSize);

         int fmtChunkSize = 16;
         int byteRate = hz * channels * bytesPerSample;
         ushort blockAlign = (ushort) (channels * bytesPerSample);

         fileStream.Seek(0, SeekOrigin.Begin);

         // BinaryWriter emits integers in little-endian order on every platform, which
         // is what the RIFF/WAVE format requires.
         var writer = new BinaryWriter(fileStream);

         writer.Write(System.Text.Encoding.ASCII.GetBytes("RIFF"));
         writer.Write(riffChunkSize);
         writer.Write(System.Text.Encoding.ASCII.GetBytes("WAVE"));

         writer.Write(System.Text.Encoding.ASCII.GetBytes("fmt "));
         writer.Write(fmtChunkSize);
         writer.Write(pcmFormat);
         writer.Write(channels);
         writer.Write(hz);
         writer.Write(byteRate);
         writer.Write(blockAlign);
         writer.Write(bitsPerSample);

         writer.Write(System.Text.Encoding.ASCII.GetBytes("data"));
         writer.Write(dataChunkSize);

         writer.Flush();

         // Kept from the original contract: the stream is closed once the header is written.
         fileStream.Close();
     }

我使用了此链接 https://gist.github.com/darktable/2317063 中的脚本来保存音频文件。上面的代码可以录制并保存 wav 文件,播放时也能听到录制的声音,但音频质量和调制(modulation)与原始声音相比发生了变化。

我需要将此 wav 文件转换为 Base64 并传递给 iSpeech API,但 API 提示音频数据错误。于是我们联系了 iSpeech 的支持团队,他们建议我们使用以下设置:采样率 = 16 kHz,比特率(位深)= 16 位,声道 = 单声道。

我尝试过设置这些值,但不知道如何在这段代码中进行设置。我是 Unity 和 C# 的新手,提前感谢任何能帮助解决这个问题的人。

4

0 回答 0