使用jacob+SAPI5.1实现将将文字转换为语音播放并可存储到.wav文件
2009-11-27 17:16
971 查看
运行此代码需要Microsoft Speech SDK 5.1和jacob-1.14.3
1、MSTTSSpeech.java
2、SoundUtil.java-将.wav文件转换成.pcm格式文件
1、MSTTSSpeech.java
package com.longtop.core.speech; import com.jacob.activeX.ActiveXComponent; import com.jacob.com.ComThread; import com.jacob.com.Dispatch; import com.jacob.com.Variant; import com.longtop.core.util.sound.SoundUtil; /** * 调用MSTTS将字符串转换成语音信息 * * @author liqiang4j */ public class MSTTSSpeech{ private int volume = 100;// 声音:1到100 private int rate = 0;// 频率:-10到10 private int voice = 0;// 语音库序号 private int audio = 0;// 输出设备序号 private ActiveXComponent ax = null; private Dispatch spVoice = null;// 声音对象 private Dispatch spFileStream = null;// 音频文件输出流对象,在读取或保存音频文件时使用 private Dispatch spAudioFormat = null;// 音频格式对象 private Dispatch spMMAudioOut = null;// 音频输出对象 private int formatType = 22;// 音频的输出格式,默认为:SAFT22kHz16BitMono public MSTTSSpeech() { ComThread.InitSTA(); if(ax == null){ ax = new ActiveXComponent("Sapi.SpVoice"); spVoice = ax.getObject(); } } /** * 改变语音库 * * @param voice * 语音库序号 */ public void changeVoice(int voice){ if(this.voice != voice){ this.voice = voice; } try{ Dispatch voiceItems = Dispatch.call(spVoice, "GetVoices").toDispatch(); int count = Integer.valueOf(Dispatch.call(voiceItems, "Count").toString()); if(count > 0){ Dispatch voiceItem = Dispatch.call(voiceItems, "Item", new Variant(this.voice)).toDispatch(); Dispatch.put(spVoice, "Voice", voiceItem); } } catch (Exception e){ e.printStackTrace(); } } /** * 改变音频输出设备 * * @param audio * 音频设备序号 */ public void changeAudioOutput(int audio){ if(this.audio != audio){ this.audio = audio; } try{ Dispatch audioOutputs = Dispatch.call(spVoice, "GetAudioOutputs").toDispatch(); int count = Integer.valueOf(Dispatch.call(audioOutputs, "Count").toString()); if(count > 0){ Dispatch audioOutput = Dispatch.call(audioOutputs, "Item", new Variant(this.audio)).toDispatch(); Dispatch.put(spVoice, "AudioOutput", audioOutput); } } catch (Exception e){ e.printStackTrace(); } } /** * 播放语音 * * @param text * 要转换成语音的文本 */ public void speak(String text){ this.speak(text, 0); } /** * 停止播放语音 */ public void stop(){ // this.speak("", 1); Dispatch.call(spVoice, "Pause"); } /** * 播放语音 * * @param text * 要转换成语音的文本 * @param type * 类型0:播放,1:停止 */ private void speak(String text,int type){ switch (type) { case 0: try{ // 调整音量和读的速度 Dispatch.put(spVoice, "Volume", new Variant(this.volume));// 设置音量 Dispatch.put(spVoice, "Rate", new Variant(this.rate));// 设置速率 // 设置音频格式类型 if(spAudioFormat == null){ ax = new ActiveXComponent("Sapi.SpAudioFormat"); spAudioFormat = ax.getObject(); ax = new ActiveXComponent("Sapi.SpMMAudioOut"); spMMAudioOut = ax.getObject(); } Dispatch.put(spAudioFormat, "Type", new Variant(this.formatType)); Dispatch.putRef(spMMAudioOut, "Format", spAudioFormat); Dispatch.put(spVoice, "AllowAudioOutputFormatChangesOnNextSet", new Variant(false)); Dispatch.putRef(spVoice, "AudioOutputStream", spMMAudioOut); // 开始朗读 Dispatch.call(spVoice, "Speak", new Variant(text)); } catch (Exception e){ e.printStackTrace(); } break; case 1: try{ Dispatch.call(spVoice, "Speak", new Variant(text), new Variant(2)); } catch (Exception e){ e.printStackTrace(); } break; default: break; } } /** * 获取系统中所有的语音库名称数组 * * @return String[] */ public String[] getVoices(){ String[] voices = null; try{ Dispatch voiceItems = Dispatch.call(spVoice, "GetVoices").toDispatch(); int count = Integer.valueOf(Dispatch.call(voiceItems, "Count").toString()); if(count > 0){ voices = new String[count]; for(int i = 0;i < count;i++){ Dispatch voiceItem = Dispatch.call(voiceItems, "Item", new Variant(i)).toDispatch(); String voice = Dispatch.call(voiceItem, "GetDescription").toString(); voices[i] = voice; } } } catch (Exception e){ e.printStackTrace(); } return voices; } /** * 获取音频输出设备名称数组 * * @return String[] */ public String[] getAudioOutputs(){ String[] result = null; try{ Dispatch audioOutputs = Dispatch.call(spVoice, "GetAudioOutputs").toDispatch(); int count = Integer.valueOf(Dispatch.call(audioOutputs, "Count").toString()); if(count > 0){ result = new String[count]; for(int i = 0;i < count;i++){ Dispatch voiceItem = Dispatch.call(audioOutputs, "Item", new Variant(i)).toDispatch(); String voice = Dispatch.call(voiceItem, "GetDescription").toString(); result[i] = voice; } } } catch (Exception e){ e.printStackTrace(); } return result; } /** * 将文字转换成音频信号,然后输出到.WAV文件 * * @param text * 文本字符串 * @param filePath * 输出文件路径 */ public void saveToWav(String text,String filePath){ // 创建输出文件流对象 ax = new ActiveXComponent("Sapi.SpFileStream"); spFileStream = ax.getObject(); // 创建音频流格式对象 if(spAudioFormat == null){ ax = new ActiveXComponent("Sapi.SpAudioFormat"); spAudioFormat = ax.getObject(); } // 设置音频流格式类型 Dispatch.put(spAudioFormat, "Type", new Variant(this.formatType)); // 设置文件输出流的格式 Dispatch.putRef(spFileStream, "Format", spAudioFormat); // 调用输出文件流对象的打开方法,创建一个.wav文件 Dispatch.call(spFileStream, "Open", new Variant(filePath), new Variant(3), new Variant(true)); // 设置声音对象的音频输出流为输出文件流对象 Dispatch.putRef(spVoice, "AudioOutputStream", spFileStream); // 调整音量和读的速度 Dispatch.put(spVoice, "Volume", new Variant(this.volume));// 设置音量 Dispatch.put(spVoice, "Rate", new Variant(this.rate));// 设置速率 // 开始朗读 Dispatch.call(spVoice, "Speak", new Variant(text)); // 关闭输出文件流对象,释放资源 Dispatch.call(spFileStream, "Close"); Dispatch.putRef(spVoice, "AudioOutputStream", null); } /** * @return the volume */ public int getVolume(){ return volume; } /** * @param volume * the volume to set */ public void setVolume(int volume){ this.volume = volume; } /** * @return the rate */ public int getRate(){ return rate; } /** * @param rate * the rate to set */ public void setRate(int rate){ this.rate = rate; } /** * @return the voice */ public int getVoice(){ return voice; } /** * @param voice * the voice to set */ public void setVoice(int voice){ this.voice = voice; } /** * @return the audio */ public int getAudio(){ return audio; } /** * @param audio * the audio to set */ public void setAudio(int audio){ this.audio = audio; } /** * @return the ax */ public ActiveXComponent getAx(){ return ax; } /** * @param ax * the ax to set */ public void setAx(ActiveXComponent ax){ this.ax = ax; } /** * @return the formatType */ public int getFormatType(){ return formatType; } /** * 设置音频输出格式类型<br> * SAFTDefault = -1<br> * SAFTNoAssignedFormat = 0<br> * SAFTText = 1<br> * SAFTNonStandardFormat = 2<br> * SAFTExtendedAudioFormat = 3<br> * // Standard PCM wave formats<br> * SAFT8kHz8BitMono = 4<br> * SAFT8kHz8BitStereo = 5<br> * SAFT8kHz16BitMono = 6<br> * SAFT8kHz16BitStereo = 7<br> * SAFT11kHz8BitMono = 8<br> * SAFT11kHz8BitStereo = 9<br> * SAFT11kHz16BitMono = 10<br> * SAFT11kHz16BitStereo = 11<br> * SAFT12kHz8BitMono = 12<br> * SAFT12kHz8BitStereo = 13<br> * SAFT12kHz16BitMono = 14<br> * SAFT12kHz16BitStereo = 15<br> * SAFT16kHz8BitMono = 16<br> * SAFT16kHz8BitStereo = 17<br> * SAFT16kHz16BitMono = 18<br> * SAFT16kHz16BitStereo = 19<br> * SAFT22kHz8BitMono = 20<br> * SAFT22kHz8BitStereo = 21<br> * SAFT22kHz16BitMono = 22<br> * SAFT22kHz16BitStereo = 23<br> * SAFT24kHz8BitMono = 24<br> * SAFT24kHz8BitStereo = 25<br> * SAFT24kHz16BitMono = 26<br> * SAFT24kHz16BitStereo = 27<br> * SAFT32kHz8BitMono = 28<br> * SAFT32kHz8BitStereo = 29<br> * SAFT32kHz16BitMono = 30<br> * SAFT32kHz16BitStereo = 31<br> * SAFT44kHz8BitMono = 32<br> * SAFT44kHz8BitStereo = 33<br> * SAFT44kHz16BitMono = 34<br> * SAFT44kHz16BitStereo = 35<br> * SAFT48kHz8BitMono = 36<br> * SAFT48kHz8BitStereo = 37<br> * SAFT48kHz16BitMono = 38<br> * SAFT48kHz16BitStereo = 39<br> * <br> * // TrueSpeech format<br> * SAFTTrueSpeech_8kHz1BitMono = 40<br> * // A-Law formats<br> * SAFTCCITT_ALaw_8kHzMono = 41<br> * SAFTCCITT_ALaw_8kHzStereo = 42<br> * SAFTCCITT_ALaw_11kHzMono = 43<br> * SAFTCCITT_ALaw_11kHzStereo = 4<br> * SAFTCCITT_ALaw_22kHzMono = 44<br> * SAFTCCITT_ALaw_22kHzStereo = 45<br> * SAFTCCITT_ALaw_44kHzMono = 46<br> * SAFTCCITT_ALaw_44kHzStereo = 47<br> * <br> * // u-Law formats<br> * SAFTCCITT_uLaw_8kHzMono = 48<br> * SAFTCCITT_uLaw_8kHzStereo = 49<br> * SAFTCCITT_uLaw_11kHzMono = 50<br> * SAFTCCITT_uLaw_11kHzStereo = 51<br> * SAFTCCITT_uLaw_22kHzMono = 52<br> * SAFTCCITT_uLaw_22kHzStereo = 53<br> * SAFTCCITT_uLaw_44kHzMono = 54<br> * SAFTCCITT_uLaw_44kHzStereo = 55<br> * SAFTADPCM_8kHzMono = 56<br> * SAFTADPCM_8kHzStereo = 57<br> * SAFTADPCM_11kHzMono = 58<br> * SAFTADPCM_11kHzStereo = 59<br> * SAFTADPCM_22kHzMono = 60<br> * SAFTADPCM_22kHzStereo = 61<br> * SAFTADPCM_44kHzMono = 62<br> * SAFTADPCM_44kHzStereo = 63<br> * <br> * // GSM 6.10 formats<br> * SAFTGSM610_8kHzMono = 64<br> * SAFTGSM610_11kHzMono = 65<br> * SAFTGSM610_22kHzMono = 66<br> * SAFTGSM610_44kHzMono = 67<br> * // Other formats<br> * SAFTNUM_FORMATS = 68<br> * * @param formatType * 音频输出格式类型 */ public void setFormatType(int formatType){ this.formatType = formatType; } public static void main(String[] args){ MSTTSSpeech speech = new MSTTSSpeech(); String text = "这是我的测试,物理内存至少需要512MB,建议2GB以上,虚拟内存是主机物理内存的两倍,不要设到系统盘,硬盘空闲空间大于4.77GB."; speech.setFormatType(4); //speech.speak(text); // speech.setRate(-1); speech.saveToWav(text, "e://test.wav"); SoundUtil.wavToPcm("e://test.wav"); } }
2、SoundUtil.java-将.wav文件转换成.pcm格式文件
package com.longtop.core.util.sound; import java.io.File; import java.io.IOException; import javax.sound.sampled.AudioFileFormat; import javax.sound.sampled.AudioFormat; import javax.sound.sampled.AudioInputStream; import javax.sound.sampled.AudioSystem; import javax.sound.sampled.UnsupportedAudioFileException; /** * 与声音有关的工具类 * * @author liqiang4j */ public class SoundUtil{ /** * 将WAV格式的音频文件转换为PCM格式的文件 * * @param wavFilePath * WAV文件路径 * @throws UnsupportedAudioFileException * @throws IOException */ public static void wavToPcm(String wavFilePath){ try{ File wavFile = new File(wavFilePath); AudioInputStream sourceAudioInputStream = AudioSystem.getAudioInputStream(wavFile); // 此处的转换必需是16bit的音频文件 AudioInputStream targetAudioInputStream = AudioSystem.getAudioInputStream(AudioFormat.Encoding.ULAW, sourceAudioInputStream); String newFilePath = wavFilePath.substring(0, wavFilePath.lastIndexOf(".") + 1) + "pcm"; AudioSystem.write(targetAudioInputStream, AudioFileFormat.Type.WAVE, new File(newFilePath)); } catch (UnsupportedAudioFileException e){ e.printStackTrace(); } catch (IOException e){ e.printStackTrace(); } } /** * 获取音频文件的编码格式 * * @param wavFilePath * 音频文件格式 * @return String */ public static String getWavFormat(String wavFilePath){ File wavFile = new File(wavFilePath); AudioInputStream ais; String result = ""; try{ ais = AudioSystem.getAudioInputStream(wavFile); AudioFormat af = ais.getFormat(); result = af.toString(); } catch (UnsupportedAudioFileException e){ e.printStackTrace(); } catch (IOException e){ e.printStackTrace(); } return result; } public static void main(String[] args){ System.out.println(SoundUtil.getWavFormat("e://test.wav")); SoundUtil.wavToPcm("e://test.wav"); } }
相关文章推荐
- JAVA 使用Jacob调用windows的Sapi实现文本转语音文件
- JAVA 使用Jacob调用windows的Sapi实现文本转语音文件
- 如何将语音文件转换为Asterisk可以播放的音频格式文件(.wav)
- C++ builder TTS5.1实现语音播放 生成wav文件
- 使用jacob调用Windows的com对象,转换Office文件为pdf、html等
- Wave 文件(12): 使用 waveOut...重复播放 wav 文件
- linux 基于alsa 使用libmad 解码库实现MP3文件的播放
- 使用aplay播放一个PCM?PCM和WAV文件的区别?
- C#使用XmlEDocument实现数据文件安全存储功能
- Ubuntu下使用ISCSI+OCFS2实现网络存储及文件共享
- 使用文件实现通讯录的存储
- 使用python来访问Hadoop HDFS存储实现文件的操作
- 使用讯飞SDK,实现文字在线合成语音
- 文字转换为语音VB.NEt实现
- C# 使用FileUpload控件上传图片,将文件转换成二进制进行存储与读取
- 使用UltraEdit 替换解决---文字中含有逗号的文件,如何把逗号自动转换成为:回车换行呢?
- 使用FlashWavRecorder实现浏览器录制wav音频和上传音频文件,兼容IE8以上浏览器
- C#使用SoundPlayer播放WAV音频文件
- 使用DirectX播放wav声音文件
- 实现KTV效果:播放歌曲,录音(存储录音文件),并同步播放录音 & 解释4.3以上audio与media资源冲突问题