Skip to content

Commit

Permalink
Updated constants
Browse files Browse the repository at this point in the history
  • Loading branch information
dougollerenshaw committed Oct 8, 2024
1 parent 64b6647 commit e3a1c1d
Show file tree
Hide file tree
Showing 2 changed files with 12 additions and 223 deletions.
221 changes: 2 additions & 219 deletions codeaide/ui/chat_window.py
Original file line number Diff line number Diff line change
@@ -1,10 +1,5 @@
import signal
from PyQt5.QtCore import (
Qt,
QTimer,
QThread,
pyqtSignal,
)
from PyQt5.QtCore import Qt, QTimer
from PyQt5.QtGui import QColor
from PyQt5.QtWidgets import (
QApplication,
Expand All @@ -17,7 +12,6 @@
QWidget,
QComboBox,
QLabel,
QProgressDialog,
)
from codeaide.ui.code_popup import CodePopup
from codeaide.ui.example_selection_dialog import show_example_dialog
Expand All @@ -39,85 +33,6 @@
)
from codeaide.utils.logging_config import get_logger
from codeaide.ui.traceback_dialog import TracebackDialog
import os
import time
import sounddevice as sd
import numpy as np
from scipy.io import wavfile
import whisper


class AudioRecorder(QThread):
finished = pyqtSignal(str, float)

def __init__(self, filename):
super().__init__()
self.filename = filename
self.is_recording = False
self.start_time = None

def run(self):
RATE = 16000 # 16kHz to match Whisper's expected input
self.is_recording = True
self.start_time = time.time()
with sd.InputStream(samplerate=RATE, channels=1) as stream:
frames = []
while self.is_recording:
data, overflowed = stream.read(RATE)
if not overflowed:
frames.append(data)

audio_data = np.concatenate(frames, axis=0)
print(f"Raw audio data shape: {audio_data.shape}")
print(f"Raw audio data range: {audio_data.min()} to {audio_data.max()}")

# Ensure audio data is in the correct range for int16
audio_data = np.clip(audio_data * 32768, -32768, 32767).astype(np.int16)

wavfile.write(self.filename, RATE, audio_data)
end_time = time.time()
self.finished.emit(self.filename, end_time - self.start_time)

def stop(self):
self.is_recording = False


class TranscriptionThread(QThread):
finished = pyqtSignal(str)

def __init__(self, whisper_model, filename):
super().__init__()
self.whisper_model = whisper_model
self.filename = filename

def run(self):
print("Transcribing audio...")
read_start = time.time()
# Read the WAV file
sample_rate, audio_data = wavfile.read(self.filename)
read_end = time.time()
print(f"Time to read WAV file: {read_end - read_start:.2f} seconds")

print(f"Audio shape: {audio_data.shape}, Sample rate: {sample_rate}")
print(f"Audio duration: {len(audio_data) / sample_rate:.2f} seconds")

# Convert to float32 and normalize
audio_data = audio_data.astype(np.float32) / 32768.0

print(f"Audio data range: {audio_data.min()} to {audio_data.max()}")

# Transcribe
transcribe_start = time.time()
result = self.whisper_model.transcribe(audio_data)
transcribe_end = time.time()
transcribed_text = result["text"].strip()
print(f"Transcription: {transcribed_text}")
print(
f"Time for Whisper to transcribe: {transcribe_end - transcribe_start:.2f} seconds"
)
print("Transcription complete.")

self.finished.emit(transcribed_text)


class ChatWindow(QMainWindow):
Expand All @@ -135,11 +50,6 @@ def __init__(self, chat_handler):
self.setup_input_placeholder()
self.update_submit_button_state()

# Initialize Whisper model
print("Loading Whisper model...")
self.whisper_model = whisper.load_model("tiny")
print("Whisper model loaded.")

# Check API key status
if not self.chat_handler.api_key_valid:
self.waiting_for_api_key = True
Expand Down Expand Up @@ -208,34 +118,7 @@ def setup_ui(self):
self.input_text.setFixedHeight(100)
self.input_text.textChanged.connect(self.on_modify)
self.input_text.installEventFilter(self)

# Add record button
self.record_button = QPushButton("Record", self)
self.record_button.clicked.connect(self.toggle_recording)
self.record_button.setStyleSheet(
"""
QPushButton {
background-color: #4CAF50;
color: white;
border: none;
padding: 5px 10px;
text-align: center;
text-decoration: none;
font-size: 14px;
margin: 4px 2px;
border-radius: 12px;
}
QPushButton:hover {
background-color: #45a049;
}
"""
)

# Modify the input layout to include the record button
input_layout = QHBoxLayout()
input_layout.addWidget(self.record_button)
input_layout.addWidget(self.input_text)
main_layout.addLayout(input_layout)
main_layout.addWidget(self.input_text, stretch=1)

# Buttons
button_layout = QHBoxLayout()
Expand Down Expand Up @@ -562,103 +445,3 @@ def show_traceback_dialog(self, traceback_text):

def update_submit_button_state(self):
self.submit_button.setEnabled(bool(self.input_text.toPlainText().strip()))

def toggle_recording(self):
if not hasattr(self, "is_recording"):
self.is_recording = False

if not self.is_recording:
self.start_recording()
else:
self.stop_recording()

def start_recording(self):
self.is_recording = True
self.record_button.setText("Stop Recording")
self.record_button.setStyleSheet(
"""
QPushButton {
background-color: #f44336;
color: white;
border: none;
padding: 5px 10px;
text-align: center;
text-decoration: none;
font-size: 14px;
margin: 4px 2px;
border-radius: 12px;
}
QPushButton:hover {
background-color: #d32f2f;
}
"""
)
filename = os.path.expanduser("~/recorded_audio.wav")
self.recorder = AudioRecorder(filename)
self.recorder.finished.connect(self.on_recording_finished)
self.recorder.start()

def stop_recording(self):
if self.recorder:
print(f"Stop recording clicked at: {time.time():.2f}")
self.recorder.stop()
self.is_recording = False
self.record_button.setText("Record")
self.record_button.setStyleSheet(
"""
QPushButton {
background-color: #4CAF50;
color: white;
border: none;
padding: 5px 10px;
text-align: center;
text-decoration: none;
font-size: 14px;
margin: 4px 2px;
border-radius: 12px;
}
QPushButton:hover {
background-color: #45a049;
}
"""
)

def on_recording_finished(self, filename, recording_duration):
print(f"Recording saved to: {filename}")
print(f"Total recording time: {recording_duration:.2f} seconds")
transcription_start = time.time()
self.transcribe_audio(filename)
transcription_end = time.time()
print(
f"Total time from recording stop to transcription complete: {transcription_end - transcription_start:.2f} seconds"
)

def transcribe_audio(self, filename):
progress_dialog = QProgressDialog("Transcribing audio...", None, 0, 0, self)
progress_dialog.setWindowTitle("Please Wait")
progress_dialog.setWindowModality(Qt.WindowModal)
progress_dialog.setAutoClose(True)
progress_dialog.setAutoReset(True)
progress_dialog.setMinimumDuration(0)
progress_dialog.setValue(0)
progress_dialog.setMaximum(0) # This makes it an indeterminate progress dialog
progress_dialog.show()

self.transcription_thread = TranscriptionThread(self.whisper_model, filename)
self.transcription_thread.finished.connect(self.on_transcription_finished)
self.transcription_thread.finished.connect(progress_dialog.close)
self.transcription_thread.start()

def on_transcription_finished(self, transcribed_text):
# Insert transcribed text into the input text field
current_text = self.input_text.toPlainText()
if current_text:
new_text = current_text + " " + transcribed_text
else:
new_text = transcribed_text
self.input_text.setPlainText(new_text)

# Move cursor to the end of the text
cursor = self.input_text.textCursor()
cursor.movePosition(cursor.End)
self.input_text.setTextCursor(cursor)
14 changes: 10 additions & 4 deletions codeaide/utils/constants.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,13 @@
# UI Configuration
CHAT_WINDOW_WIDTH = 800
CHAT_WINDOW_HEIGHT = 600
INITIAL_MESSAGE = "I'm a code writing assistant. I can generate and run code for you. What would you like to do?\n\nThe more details you provide, the better I can help you. But I'll make some assumptions and ask for more information if needed."
INITIAL_MESSAGE = """
I'm a code writing assistant. I can generate and run code for you. What would you like to do?
The more details you provide, the better I can help you. But I'll make some assumptions and ask for more information if needed.
Either click the microphone button to record your request or type your request in the text box below.
"""

# Chat window styling
CHAT_WINDOW_WIDTH = 800
Expand Down Expand Up @@ -61,7 +67,7 @@
SYSTEM_PROMPT = """
You are an AI assistant specialized in providing coding advice and solutions. Your primary goal is to offer practical, working code examples while balancing the need for clarification with the ability to make reasonable assumptions. Follow these guidelines:
* Prioritize providing functional code: When asked for code solutions, aim to deliver complete, runnable Python code whenever possible.
* Always return complete, fully functional code. Never use ellipses (...) or comments like "other methods remain unchanged" to indicate omitted parts. Every method, function, and class must be fully implemented in each response.
* Always return complete, fully functional code. Never use ellipses (...) or comments like "other methods remain unchanged" to indicate omitted parts. Every method, function, and class must be fully implemented in each response.
* Never assume that a necessary support file exists unless explicitly stated in the user's query. If you need to create additional files (such as .wav files for game sound effects), include code that generates and saves them to the appropriate location within the response.
* If you do create support files, save them in a temporary location and include code to clean them up after use. Always use absolute paths when saving or referencing files.
* Ensure that all necessary imports are included: If the code requires specific libraries or modules, include the necessary import statements.
Expand Down Expand Up @@ -100,10 +106,10 @@
* All code must be contained within a single file. If the code requires multiple classes or functions, include them all in the same code block.
Remember, the goal is to provide valuable, working code solutions while maintaining a balance between making reasonable assumptions and seeking clarification when truly necessary.
Format your responses as a JSON object with six keys:
Format your responses as a JSON object with six keys:
* 'text': a string that contains any natural language explanations or comments that you think are helpful for the user. This should never be null or incomplete. If you mention providing a list or explanation, ensure it is fully included here. If you have no text response, provide a brief explanation of the code or the assumptions made.
* 'questions': an array of strings that pose necessary follow-up questions to the user
* 'code': a string with the properly formatted, complete code block. This must include all necessary components for the code to run, including any previously implemented methods or classes. This should be null only if you have questions or text responses but no code to provide.
* 'code': a string with the properly formatted, complete code block. This must include all necessary components for the code to run, including any previously implemented methods or classes. This should be null only if you have questions or text responses but no code to provide.
* 'code_version': a string that represents the version of the code. Start at 1.0 and increment for each new version of the code you provide. Use your judgement on whether to increment the minor or major component of the version. It is critical that version numbers never be reused during a chat and that the numbers always increment upward. This field should be null if you have no code to provide.
* 'version_description': a very short string that describes the purpose of the code and/or changes made in this version of the code since the last version. This should be null if you have questions or text responses but no code to provide.
* 'requirements': an array of strings listing any required Python packages or modules that are necessary to run the code. This should be null if no additional requirements are needed beyond the standard Python libraries.
Expand Down

0 comments on commit e3a1c1d

Please sign in to comment.