Javascript 如何使用web音频api获取原始pcm音频?
如何在 Chrome 中通过 getUserMedia 使用麦克风,然后从媒体流中获得原始音频?我需要得到 16 位线性 PCM(LINEAR16)格式的音频。(标签:javascript, audio, web-audio-api, mediastream)您应该查看 getUserMedia API 的 sampleSize 属性。使用
`sampleSize` 约束,如果音频硬件允许,可以将采样大小设置为 16 位。
就具体实现而言,可以参考相关链接或自行搜索……
不幸的是,MediaRecorder 不支持原始 PCM 捕获。(在我看来,这是一个可悲的疏忽。)因此,您需要自己获取原始样本并缓冲/保存它们。您可以使用 ScriptProcessorNode 来做到这一点。通常,此节点用于以编程方式修改音频数据,以实现自定义效果等;但是,没有理由不能将其用作捕获点。以下代码未经测试,但可以尝试:
// Tap the audio graph with a ScriptProcessorNode (8192-frame buffer, 1 input
// channel, 1 output channel) and read the raw samples of every processed block.
// NOTE(review): the node still has to be wired into the graph (a source
// connected to it, and presumably the node connected onwards to the
// destination) before 'audioprocess' fires - confirm against your setup.
const captureNode = audioContext.createScriptProcessor(8192, 1, 1);
captureNode.addEventListener('audioprocess', (e) => {
  // The samples arrive on the event object; `inputBuffer` is not a free variable.
  const rawLeftChannelData = e.inputBuffer.getChannelData(0);
  // rawLeftChannelData is now a typed array with floating point samples
});
(您可以在上找到更完整的示例。)
这些浮点样本以 `0` 为中心,理想情况下会限定在 `-1` 到 `1` 之间。当转换为整数范围时,您需要将值钳制到此范围内,截掉超出该范围的部分。(如果浏览器中混入了响亮的声音,这些值有时可能会超出 `-1` 和 `1`。理论上,浏览器还可以从外部声音设备录制 32 位浮点样本,这些样本也可能超出该范围,但我不知道有哪个浏览器/平台会这样做。)
转换为整数时,值是有符号还是无符号很重要。如果是有符号的 16 位整数,范围为 `-32768` 到 `32767`;如果是无符号的,则为 `0` 到 `65535`。先确定要使用的格式,然后将 `-1` 到 `1` 之间的值缩放到相应的范围。
关于此转换的最后一点说明……字节序(endianness)可能很重要。另请参见:下面是一段 Web Audio API 示例,它使用麦克风捕获并播放原始音频(在运行此页面之前请调低音量)……要查看 PCM 格式的原始音频片段,请查看浏览器控制台……顺便一提,它还会把这些 PCM 数据送入 FFT 调用,以获得音频曲线的频域和时域数据。
<html><head><meta http-equiv="Content-Type" content="text/html; charset=ISO-8859-1">
<title>capture microphone then show time & frequency domain output</title>
<script type="text/javascript">
/**
 * Capture the microphone, play it back through a volume-controlled gain node
 * and log a few frequency-domain and time-domain values per analysis block.
 *
 * This is a plain function meant to be called from the page's
 * "start audio" button: it is NOT invoked at definition time, so the
 * AudioContext is only created once the user asks for it. Every call builds
 * a new AudioContext and a new audio graph.
 *
 * Expects an element with id "volume" (the range slider) to exist in the page.
 */
var webaudio_tooling_obj = function () {

    var audioContext = new AudioContext();

    console.log("audio is starting up ...");

    var BUFF_SIZE_RENDERER = 16384;
    var SIZE_SHOW = 3; // number of array elements to show in console output

    var microphone_stream = null,
        gain_node = null,
        script_processor_node = null,
        script_processor_analysis_node = null,
        analyser_node = null;

    request_microphone();

    // ---

    /**
     * Ask the browser for an audio-only stream and hand it to start_microphone.
     * Uses the promise-based navigator.mediaDevices.getUserMedia when present
     * and falls back to the legacy (prefixed) callback API otherwise.
     */
    function request_microphone() {
        if (navigator.mediaDevices && navigator.mediaDevices.getUserMedia) {
            // Two-argument then(): on_capture_error only sees capture failures,
            // not exceptions raised while building the audio graph.
            navigator.mediaDevices.getUserMedia({audio: true})
                .then(start_microphone, on_capture_error);
            return;
        }

        var legacy_get_user_media = navigator.getUserMedia || navigator.webkitGetUserMedia ||
                                    navigator.mozGetUserMedia || navigator.msGetUserMedia;

        if (legacy_get_user_media) {
            // The legacy function must be invoked with navigator as its receiver.
            legacy_get_user_media.call(navigator, {audio: true}, start_microphone, on_capture_error);
        } else {
            alert('getUserMedia not supported in this browser.');
        }
    }

    /**
     * Report a failed capture request; the underlying error is logged so the
     * cause (e.g. permission denied) is not lost.
     */
    function on_capture_error(error) {
        console.error(error);
        alert('Error capturing audio.');
    }

    /**
     * Log the first few entries of an analyser byte array.
     *
     * @param {Uint8Array} given_typed_array - data filled in by the analyser node
     * @param {number} num_row_to_display - maximum number of entries to log
     * @param {string} label - "time" or "frequency"
     * @throws {Error} when label is neither "time" nor "frequency"
     */
    function show_some_data(given_typed_array, num_row_to_display, label) {

        var size_buffer = given_typed_array.length;
        var index = 0;

        console.log("__________ " + label);

        if (label === "time") {

            for (; index < num_row_to_display && index < size_buffer; index += 1) {
                // Re-centre the byte value around zero: 0 -> -1.0, 128 -> 0.0
                var curr_value_time = (given_typed_array[index] / 128) - 1.0;
                console.log(curr_value_time);
            }

        } else if (label === "frequency") {

            for (; index < num_row_to_display && index < size_buffer; index += 1) {
                console.log(given_typed_array[index]);
            }

        } else {
            throw new Error("ERROR - must pass time or frequency");
        }
    }

    /**
     * 'audioprocess' handler of the microphone script processor node.
     * Intentionally empty: the basic feature set does not consume the buffer.
     * To capture raw samples, read event.inputBuffer.getChannelData(0) here
     * (mono - one channel).
     */
    function process_microphone_buffer(event) {
    }

    /**
     * Build the audio graph for a freshly obtained microphone stream.
     *
     * @param {MediaStream} stream - stream delivered by getUserMedia
     */
    function start_microphone(stream) {

        var volume_slider = document.getElementById('volume');

        gain_node = audioContext.createGain();
        // A new gain node does not know about the slider, so start from the
        // slider's current position instead of playing the microphone at the
        // node's default gain until the slider is first moved.
        gain_node.gain.value = Number(volume_slider.value);
        gain_node.connect(audioContext.destination);

        microphone_stream = audioContext.createMediaStreamSource(stream);
        microphone_stream.connect(gain_node);

        // NOTE(review): this node has no outgoing connection; some browsers may
        // only fire 'audioprocess' for nodes routed towards the destination -
        // confirm before relying on process_microphone_buffer being called.
        script_processor_node = audioContext.createScriptProcessor(BUFF_SIZE_RENDERER, 1, 1);
        script_processor_node.onaudioprocess = process_microphone_buffer;
        microphone_stream.connect(script_processor_node);

        // --- enable volume control for output speakers

        volume_slider.addEventListener('change', function () {
            var curr_volume = Number(volume_slider.value);
            gain_node.gain.value = curr_volume;
            console.log("curr_volume ", curr_volume);
        });

        // --- setup FFT

        script_processor_analysis_node = audioContext.createScriptProcessor(2048, 1, 1);
        script_processor_analysis_node.connect(gain_node);

        analyser_node = audioContext.createAnalyser();
        analyser_node.smoothingTimeConstant = 0;
        analyser_node.fftSize = 2048;

        microphone_stream.connect(analyser_node);
        analyser_node.connect(script_processor_analysis_node);

        var buffer_length = analyser_node.frequencyBinCount;

        var array_freq_domain = new Uint8Array(buffer_length);
        var array_time_domain = new Uint8Array(buffer_length);

        console.log("buffer_length " + buffer_length);

        script_processor_analysis_node.onaudioprocess = function () {

            // refresh both views of the current analysis block
            analyser_node.getByteFrequencyData(array_freq_domain);
            analyser_node.getByteTimeDomainData(array_time_domain);

            show_some_data(array_freq_domain, SIZE_SHOW, "frequency");
            show_some_data(array_time_domain, SIZE_SHOW, "time"); // store this to record to aggregate buffer/file
        };
    }

}; // webaudio_tooling_obj = function()
</script>
</head>
<body>
<p>Volume</p>
<input id="volume" type="range" min="0" max="1" step="0.1" value="0.0"/>
<p> </p>
<button onclick="webaudio_tooling_obj()">start audio</button>
</body>
</html>
捕获麦克风,然后显示时域和频域输出
var webaudio_工具_obj=函数(){
var audioContext=新的audioContext();
log(“音频正在启动…”);
var BUFF_SIZE_渲染器=16384;
var SIZE_SHOW=3;//要在控制台输出中显示的数组元素数
var audioInput=null,
麦克风\u流=空,
增益节点=空,
脚本\处理器\节点=null,
脚本\处理器\分析\节点=空,
分析器_节点=空;
如果(!navigator.getUserMedia)
navigator.getUserMedia=navigator.getUserMedia | | navigator.webkitGetUserMedia||
navigator.mozGetUserMedia | | navigator.msGetUserMedia;
if(navigator.getUserMedia){
getUserMedia({audio:true},
功能(流){
启动麦克风(流);
},
职能(e){
警报(“捕获音频时出错”);
}
);
}else{alert('getUserMedia在此浏览器中不受支持。');}
// ---
函数显示某些数据(给定类型的数组、行到行显示、标签){
var size\u buffer=给定的\u类型的\u array.length;
var指数=0;
日志(“\uuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuuu;
如果(标签==“时间”){
对于(;索引