-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathSWHear.py
203 lines (162 loc) · 7.13 KB
/
SWHear.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
"""
this is a stripped down version of the SWHear class.
It's designed to hold only a single audio sample in memory.
check my githib for a more complete version:
http://github.com/swharden
"""
# originally from /~https://github.com/swharden/Python-GUI-examples
import colorsys
import pyaudio
import time
import numpy as np
import subprocess
import threading
# import matplotlib.pyplot as plt
import sys
def getFFT(data, rate):
"""Given some data and rate, returns FFTfreq and FFT (half)."""
data = data * np.hamming(len(data)) # use a Hamming window to smooth out the data
fft = np.abs(np.fft.fft(data)) # get the fourier transform
# fft = 10 * np.log10(fft)
freq = np.fft.fftfreq(len(fft), 1.0 / rate) # get the frequencies for the x-axis
# return the bottom half of each array
return freq[:int(len(freq) / 2)], fft[:int(len(fft) / 2)]
class SWHear():
"""
The SWHear class is provides access to continuously recorded
(and mathematically processed) microphone data.
Arguments:
device - the number of the sound card input to use. Leave blank
to automatically detect one.
rate - sample rate to use. Defaults to something supported.
updatesPerSecond - how fast to record new data. Note that smaller
numbers allow more data to be accessed and therefore high
frequencies to be analyzed if using a FFT later
"""
def __init__(self, device=None, rate=None, updatesPerSecond=10):
self.p = pyaudio.PyAudio()
self.chunk = 4096 # gets replaced automatically
self.updatesPerSecond = updatesPerSecond
self.chunksRead = 0
self.device = device
self.rate = rate
### SYSTEM TESTS
def valid_low_rate(self, device):
"""set the rate to the lowest supported audio rate."""
for testrate in [48000, 44100]:
if self.valid_test(device, testrate):
return testrate
print("SOMETHING'S WRONG! I can't figure out how to use DEV", device)
return None
def valid_test(self, device, rate=44100):
"""given a device ID and a rate, return TRUE/False if it's valid."""
try:
self.info = self.p.get_device_info_by_index(device)
if not self.info['maxInputChannels'] > 0:
return False
stream = self.p.open(format=pyaudio.paInt16, channels=1,
input_device_index=device, frames_per_buffer=self.chunk,
rate=rate, input=True)
stream.close()
return True
except:
return False
def valid_input_devices(self):
"""
See which devices can be opened for microphone input.
call this when no PyAudio object is loaded.
"""
mics = [device for device in range(self.p.get_device_count()) if self.valid_test(device)]
if len(mics) == 0:
print('no microphone devices found!')
else:
print('found {} microphone device(s): {}'.format(len(mics), mics))
return mics
### SETUP AND SHUTDOWN
def initiate(self):
"""run this after changing settings (like rate) before recording"""
if self.device is None:
self.device = self.valid_input_devices()[0] #pick the first one
if self.rate is None:
self.rate = self.valid_low_rate(self.device)
if not self.valid_test(self.device, self.rate):
print('guessing a valid microphone device/rate...')
self.device = self.valid_input_devices()[0] #pick the first one
self.rate = self.valid_low_rate(self.device)
# Number of samples per update (e.g. at 10 updates/sec, hold 1/10 of a second in memory)
self.chunk = int(self.rate / self.updatesPerSecond)
# Time values for each sample in the chunk (not used).
self.datax = np.arange(self.chunk) / float(self.rate)
print('recording from "{}" (device {}) at {} Hz'
.format(self.info['name'], self.device, self.rate))
def close(self):
"""gently detach from things."""
print(" -- sending stream termination command...")
self.keepRecording = False #the threads should self-close
while self.t.isAlive(): #wait for all threads to close
time.sleep(.1)
self.stream.stop_stream()
self.p.terminate()
### STREAM HANDLING
def stream_readchunk(self):
"""reads some audio and re-launches itself"""
try:
self.data = np.frombuffer(self.stream.read(self.chunk), dtype=np.int16)
self.fftx, self.fft = getFFT(self.data, self.rate)
except Exception as E:
print(" -- exception! terminating...")
print(E, "\n" * 5)
self.keepRecording = False
if self.keepRecording:
self.stream_thread_new()
else:
self.stream.close()
self.p.terminate()
print(" -- stream STOPPED")
self.chunksRead += 1
def stream_thread_new(self):
self.t = threading.Thread(target=self.stream_readchunk)
self.t.start()
def stream_start(self):
"""adds data to self.data until termination signal"""
self.initiate()
print(" -- starting stream")
self.keepRecording = True # set this to False later to terminate stream
self.data = None # will fill up with threaded recording data
self.fft = None
self.dataFiltered = None #same
self.stream = self.p.open(format=pyaudio.paInt16, channels=1,
rate=self.rate, input=True, frames_per_buffer=self.chunk)
self.stream_thread_new()
if __name__=="__main__":
ear = SWHear(updatesPerSecond=10) # optionally set sample rate here
ear.stream_start() # goes forever
lastRead = ear.chunksRead
with subprocess.Popen(['glslViewer', 'flat.frag'], stdin=subprocess.PIPE, encoding='utf8') as glsl:
while True:
# wait for new data
while lastRead == ear.chunksRead:
# time.sleep(.01)
continue
if ear.data is not None and ear.fft is not None:
volume = np.max(np.abs(ear.data))
freq = ear.fftx
fft = np.abs(ear.fft)
frequency = freq[np.argmax(fft)]
print('Volume: {}, Frequency: {} Hz'.format(volume, frequency))
# plt.plot(freq, fft)
# plt.xlim(1, 800)
hue = frequency / 2000.0
value = min(1.0, volume / 12000.0)
r, g, b = colorsys.hsv_to_rgb(hue, 1.0, value)
lines = ['u_flatcolor,{},{},{}\n'.format(r, g, b)]
print(lines)
try:
glsl.stdin.writelines(lines)
glsl.stdin.flush()
except Exception as ex:
print('Exception:', ex)
lastRead = ear.chunksRead
# plt.show()
print("DONE")
ear.close()