# SpyMaster607/testAll.py at main · rocketcrane/SpyMaster607 · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
# TODO: logarithmic potentiometer

try:
	import RPi.GPIO as GPIO
	import adafruit_mcp3xxx.mcp3008 as MCP
	import busio
	import digitalio
	import board
	from adafruit_mcp3xxx.analog_in import AnalogIn
except:
	print("not on Pi")

from datetime import datetime
from pathlib import Path
from openai import OpenAI
from dotenv import load_dotenv
from time import sleep
from multiprocessing import Process
import os
import pyaudio
import pydub
import wave
import time
import multiprocessing
from ctypes import c_char_p
from ctypes import c_uint8
import pyttsx3
# Load variables from a local .env file into the process environment before
# the API client is constructed.
# NOTE(review): presumably this is how the OpenAI client finds its API key — confirm.
load_dotenv()
# Module-level OpenAI client; synthesis() uses it for the transcription and
# chat-completion requests.
client = OpenAI()

# GPIO & potentiometer setup
# BCM pin numbers for buttons/switches. Defined outside the try block so the
# names exist even when the hardware libraries could not be imported.
vol = 16
lev = 23
but = 25

try:
	GPIO.setmode(GPIO.BCM)
	# all three inputs use the internal pull-up resistor
	GPIO.setup(vol, GPIO.IN, pull_up_down=GPIO.PUD_UP)
	GPIO.setup(lev, GPIO.IN, pull_up_down=GPIO.PUD_UP)
	GPIO.setup(but, GPIO.IN, pull_up_down=GPIO.PUD_UP)
	# create the SPI bus
	spi = busio.SPI(clock=board.SCK, MISO=board.MISO, MOSI=board.MOSI)
	# create the CS (chip select)
	cs = digitalio.DigitalInOut(board.D22)
	# create the MCP object
	mcp = MCP.MCP3008(spi, cs)
	# create an analog input channel on pin 0
	chan0 = AnalogIn(mcp, MCP.P0)
except Exception as err:
	# Best effort: the script is still allowed to start without the hardware
	# (e.g. when the Pi-only imports failed), but the reason is reported
	# instead of being silently discarded.
	print("hardware setup skipped:", repr(err))

# ------------------------------------FUNCTIONS----------------------------------
# list input devices, p = pyAudio instance
def list_input_device(p):
	"""Print the index and name of every audio device known to `p`.

	`p` is a PyAudio instance (anything offering `get_device_count()` and
	`get_device_info_by_index(i)` works). Despite the heading that is printed,
	no filtering is done: every device index is listed.
	"""
	total = p.get_device_count()
	print('Found input devices:')
	device_id = 0
	while device_id < total:
		info = p.get_device_info_by_index(device_id)
		label = info['name']
		print(f"Device ID {device_id}: {label}")
		device_id += 1

def remap_range(value, left_min, left_max, right_min, right_max):
	"""Linearly remap `value` from the left range onto the right range.

	Args:
		value: number to convert, expressed in the original (left) range.
		left_min, left_max: bounds of the original range.
		right_min, right_max: bounds of the target range.

	Returns:
		The remapped value as an int (the fractional part is truncated).

	Raises:
		ZeroDivisionError: if `left_min == left_max`.
	"""
	# Figure out how 'wide' each range is
	left_span = left_max - left_min
	right_span = right_max - right_min

	# Position of value inside the left range as a 0-1 fraction. The operands
	# are deliberately not cast to int first: doing so truncated fractional
	# inputs and turned any source span below 1 into a division by zero.
	fraction = (value - left_min) / left_span

	# Scale that fraction into the right range.
	return int(right_min + fraction * right_span)

def record():
	"""Record fixed-length clips forever and publish each one as an MP3.

	Runs as a worker process. Each pass captures RECORD_SECONDS of audio from
	the module-level PyAudio instance `audio`, writes it to a temporary .wav,
	converts it to recording<N>.mp3 (N counts up from 0) and removes the .wav.
	Never returns.
	"""
	# recording config
	DEVICE = 0
	FORMAT = pyaudio.paInt32
	CHANNELS = 1
	RATE = 44100
	CHUNK = 1024
	RECORD_SECONDS = 5
	OUTPUT_FILENAME = "recording.wav"
	MP3_FILENAME = "recording"

	# are we using the right pyaudio device?
	list_input_device(audio)
	print("using device", DEVICE)

	# number of CHUNK-sized reads that make up one clip (loop invariant)
	reads_per_clip = int(RATE / CHUNK * RECORD_SECONDS)

	# start index at 0
	index = 0

	while True:
		# recording
		stream = audio.open(format=FORMAT, channels=CHANNELS,
							rate=RATE, input=True, input_device_index=DEVICE,
							frames_per_buffer=CHUNK)
		try:
			print("Recording started...")
			frames = [stream.read(CHUNK) for _ in range(reads_per_clip)]
			print("Recording finished.")
		finally:
			# always release the stream, even if a read failed -
			# might prevent pyAudio issues
			stream.stop_stream()
			stream.close()

		# generate .wav file
		with wave.open(OUTPUT_FILENAME, 'wb') as wf:
			wf.setnchannels(CHANNELS)
			wf.setsampwidth(audio.get_sample_size(FORMAT))
			wf.setframerate(RATE)
			wf.writeframes(b''.join(frames))

		# convert .wav to .mp3. The clip is exported under a scratch name and
		# renamed once complete, so synthesis() - which opens recording<N>.mp3
		# as soon as that name exists - never sees a file still being written.
		MP3_FILENAME_ALL = MP3_FILENAME + str(index) + ".mp3"
		partial_name = MP3_FILENAME_ALL + ".part"
		mp3 = pydub.AudioSegment.from_wav(OUTPUT_FILENAME)
		mp3.export(partial_name, format="mp3")
		os.replace(partial_name, MP3_FILENAME_ALL)

		# increment index
		index += 1

		# remove .wav file; it is fine if it has already gone
		try:
			os.remove(OUTPUT_FILENAME)
		except FileNotFoundError:
			pass

def synthesis(transcription):
	"""Transcribe each recorded clip, ask the chat model for a reply, speak it.

	Runs as a worker process. Waits for recording<N>.mp3 (N counts up from 0),
	sends it to the transcription endpoint, stores the text in
	`transcription.value`, deletes the clip, requests a chat completion for
	that text and reads the answer aloud with pyttsx3. Never returns.

	Args:
		transcription: shared value object whose `.value` string is used as
			the transcription prompt context and is replaced by each new
			transcription.
	"""
	# whisper config
	WHISPER_TEMP = 0
	WHISPER_CONTEXT_LENGTH = 400 # context characters to feed into whisper

	# how long to wait before looking for the next clip again, and before
	# retrying after a failed request (avoids spinning at full CPU)
	POLL_SECONDS = 0.1
	RETRY_SECONDS = 1

	# keep track of index
	MP3_FILENAME = "recording"
	index = 0

	# tts initialization
	engine = pyttsx3.init()

	# Set properties _before_ you add things to say
	engine.setProperty('rate', 50)    # pyttsx3 speech rate, in words per minute

	while True:
		MP3_FILENAME_ALL = MP3_FILENAME + str(index) + ".mp3"

		try:
			# the with-block closes the clip before it is deleted below
			with open(MP3_FILENAME_ALL, 'rb') as audio_file:
				# transcribe audio with OpenAI whisper and save
				current_transcription = client.audio.transcriptions.create(
					model="whisper-1",
					file=audio_file,
					# [-x:] gets last x characters of string
					prompt=transcription.value[-WHISPER_CONTEXT_LENGTH:],
					temperature=WHISPER_TEMP,
					response_format="text")
		except FileNotFoundError:
			# the recorder has not produced this clip yet
			time.sleep(POLL_SECONDS)
			continue
		except Exception as err:
			# keep the best-effort behaviour (the same clip is retried), but
			# say what went wrong instead of failing silently
			print("transcription failed:", repr(err))
			time.sleep(RETRY_SECONDS)
			continue

		try:
			# NOTE(review): the shared value is replaced, not appended to, so
			# the prompt context above is only the previous clip's text.
			# A former `+= " "` just before this line was overwritten
			# immediately and has been dropped - confirm that replacing is
			# the intended behaviour.
			transcription.value = current_transcription
			print("transcription:", transcription.value)

			# increment index
			index += 1

			# remove the file
			os.remove(MP3_FILENAME_ALL)

			# response
			output = client.chat.completions.create(
				model="gpt-4-turbo-preview",
				messages=[
				{"role": "system", "content": "You are the spymaster of the world's best, most top secret spy organization. Mentor, teach, and support your spy through the spy walkie-talkie. Don't talk directly about who you are or your organization, be discreet but helpful, and be very concise."},
				{"role": "user", "content": transcription.value}
			  ]
			)
			response = output.choices[0].message.content
			print("response: ", response)
			engine.say(response)
			engine.runAndWait()
		except Exception as err:
			# a failed reply must not stop the loop; report it and move on
			print("response failed:", repr(err))

def sensors(inputs):
	"""Poll the switches and the potentiometer and publish them in `inputs`.

	Runs as a worker process and never returns. Slots written:
		inputs[0]  volume switch (0 when its pin reads HIGH, 1 when LOW)
		inputs[1]  lever         (1 when its pin reads HIGH, 0 when LOW)
		inputs[2]  button        (0 when its pin reads HIGH, 1 when LOW)
		inputs[3]  potentiometer position remapped to 0-100

	Read failures (for example when the hardware objects were never created)
	are reported once per source and then ignored, so the loop keeps running.

	Args:
		inputs: shared indexable array with at least four slots.
	"""
	# pause between polling passes so the loop does not spin at full CPU
	POLL_SECONDS = 0.01

	# keeps tracks of the buttons
	oldVol = 0
	oldLev = 0
	oldBut = 0

	last_read = 0       # this keeps track of the last potentiometer value
	tolerance = 250     # to keep from being jittery we'll only change
	# volume when the pot has moved a significant amount
	# on a 16-bit ADC

	# each kind of failure is printed only once to avoid flooding the console
	gpio_error_reported = False
	pot_error_reported = False

	while True:
		# read GPIO pins
		try:
			# (slot in inputs, pin number, value stored when the pin is HIGH);
			# every pin is sampled once per pass
			for slot, pin, when_high in ((0, vol, 0), (1, lev, 1), (2, but, 0)):
				level = GPIO.input(pin)
				if level == GPIO.HIGH:
					inputs[slot] = when_high
				elif level == GPIO.LOW:
					inputs[slot] = 1 - when_high
			# only print if any of the three inputs changed
			if oldVol != inputs[0] or oldLev != inputs[1] or oldBut != inputs[2]:
				oldVol = inputs[0]
				oldLev = inputs[1]
				oldBut = inputs[2]
				print("volume switch is ", inputs[0], " lever is ", inputs[1], " button is ", inputs[2])
		except Exception as err:
			if not gpio_error_reported:
				print("GPIO read failed:", repr(err))
				gpio_error_reported = True

		# read potentiometer
		try:
			# read the analog pin
			trim_pot = chan0.value
			# how much has it changed since the last read?
			pot_adjust = abs(trim_pot - last_read)
			if pot_adjust > tolerance:
				# convert 16bit adc0 (0-65535) trim pot read into 0-100 volume level
				inputs[3] = remap_range(trim_pot, 0, 65535, 0, 100)
				# report the level; applying it to the OS mixer is still disabled
				print('Volume = {volume}%' .format(volume = inputs[3]))
				#set_vol_cmd = 'sudo amixer cset numid=1 -- {volume}% > /dev/null' \
				#.format(volume = inputs[3])
				#os.system(set_vol_cmd)
				# save the potentiometer reading for the next loop
				last_read = trim_pot
		except Exception as err:
			if not pot_error_reported:
				print("potentiometer read failed:", repr(err))
				pot_error_reported = True

		time.sleep(POLL_SECONDS)
# --------------------------------------------------------------------------------

# startup pyAudio
# Created at module level because record() reads this instance by name.
audio = pyaudio.PyAudio()

if __name__ == '__main__':
	# start transcription with current time
	manager = multiprocessing.Manager()
	transcription = manager.Value(c_char_p, str(datetime.now()))

	# set up the prompt
	# (prompt and response are not passed to any worker below)
	prompt = manager.Value(c_char_p, transcription.value)
	response = manager.Value(c_char_p, str())

	# set the buttons and volume
	inputs = multiprocessing.Array('d', 4)

	# delete old recordings - might prevent recording issues
	try:
		os.remove("recording.wav")
	except FileNotFoundError:
		# nothing left over from a previous run
		pass
	except OSError as err:
		# still best effort, but say why the stale file could not be removed
		print("could not remove old recording:", repr(err))

	# main loop: one worker process per task
	sensing = Process(target=sensors, args=(inputs,))
	recording = Process(target=record)
	synthesizing = Process(target=synthesis, args=(transcription,))
	workers = (sensing, recording, synthesizing)
	for worker in workers:
		worker.start()

	try:
		# the workers loop forever, so this normally blocks until interrupted
		for worker in workers:
			worker.join()
	except KeyboardInterrupt:
		print("stopping...")
	finally:
		# cleanup: runs on Ctrl-C or any error as well as on a normal exit,
		# so the workers are stopped and PyAudio is always released
		for worker in workers:
			if worker.is_alive():
				worker.terminate()
			worker.join()
		audio.terminate()