我想从PyAudio中的声音数据中获取左右声道的数据。我有一维形状数组,但不知道其中哪些来自 channel
我尝试将前半部分数据更改为零。我有沉默。 我试图将每个第二个数字更改为零。我有沉默。 在文档中我看到 PyAudio 有一个参数“output_channels”。我认为它有多个输出 channel 。
import pyaudio
import numpy as np
CHUNK = 102
WIDTH = 2
#CHUNK = 10404
#RATE = 192000
CHANNELS = 2
RATE = 44100
p = pyaudio.PyAudio()
stream = p.open(format=p.get_format_from_width(WIDTH),
channels=CHANNELS,
rate=RATE,
input=True,
output=True,
frames_per_buffer=CHUNK)
frames_per_buffer = 44100
data=[]
n=0
a=np.zeros(CHUNK*CHANNELS*WIDTH)
for i in range(1000):
data.append(stream.read(CHUNK))
for m in range(CHUNK):
a[m]=data[0][m]
s_0=[]
for m in range(int(CHUNK*CHANNELS*WIDTH)):
s_0.append(int(data[0][m]))
a=np.asarray(s_0)
a=a.reshape(int(CHUNK*WIDTH), 2)
a_T = np.transpose(a)
a_T[1][:] = 0
a = np.transpose(a_T)
a = a.reshape(CHUNK*CHANNELS*WIDTH)
s_2=[]
for m in range(CHUNK*CHANNELS*WIDTH):
s_2.append(int(a[m]))
sound=[bytes(s_2)]
stream.write(sound.pop(0), CHUNK)
data=[]
print('s_0')
s_0[0:20]
print('s_2')
s_2[0:20]
如果我更改数据,声音不会播放
最佳答案
这可以从立体声文件中获取 channel 0:
import pyaudio
import wave
import numpy as np
chunk = 1024
# open up a wave
wf = wave.open('/home/jeremy/Music/440.wav', 'rb')
swidth = wf.getsampwidth()
RATE = wf.getframerate()
# open stream
p = pyaudio.PyAudio()
channels = wf.getnchannels()
stream = p.open(format =
p.get_format_from_width(wf.getsampwidth()),
channels = channels,
rate = RATE,
output = True)
# read some data
data = wf.readframes(chunk)
while len(data) == chunk*swidth*channels:
# write data out to the audio stream
stream.write(data)
indata = np.fromstring(data, dtype='int16')
# deinterleave, select 1 channel
channel0 = indata[0::channels]
data = wf.readframes(chunk)
if data:
stream.write(data)
stream.close()
p.terminate()
关于python - 如何在PyAudio中获取 channel 数据,我们在Stack Overflow上找到一个类似的问题: https://stackoverflow.com/questions/56918526/