2_categorize_app_basel.py (forked from megseekosh/Categorize_app_v2)
#!/usr/bin/env python3
'''
app to read in and classify chunks of audio
Meg Cychosz & Ronald Sprouse
UC Berkeley
Adapted by Luca Cavasso (Simon Fraser U) for BaSeL
'''

import tkinter as tk
import tkinter.font as tkFont
import pandas as pd
from tkinter import ttk
from tkinter.filedialog import askopenfilename
from tkinter.messagebox import showinfo, askyesno
from functools import partial
import os
import datetime
from pydub import AudioSegment
from pydub.playback import play
from playsound import playsound

# set duration of audio you want to annotate
desired_duration = 60 * 60  # in seconds

# number of minute-audio-clips in folder; index of row in df
idx = 0
config_df = None
row = None
resp_df = None
duration_so_far = 0  # default value - nothing annotated so far
job_done = False  # will be True when we're done annotating

# if you want to change how many decimals the "annotation complete" window shows:
minute_decimals = 2

# play_sound() will try pydub and use playsound as a backup, then remember which one worked.
# To make this happen, we need to start with a default audioplayer value.
audioplayer = False
def play_sound(filepath):
    print('trying to play', filepath)
    global audioplayer
    if audioplayer == 'pydub':
        sound = AudioSegment.from_wav(filepath)
        play(sound)
    elif audioplayer == 'playsound':
        playsound(filepath)
    elif not audioplayer:
        try:
            # first try pydub
            print("trying pydub")
            sound = AudioSegment.from_wav(filepath)
            play(sound)
            # if it worked, keep using pydub
            audioplayer = 'pydub'
        except Exception as e:
            # print any error message for reference
            print(e)
            print()
            # then try the playsound package
            print("trying playsound")
            playsound(filepath)
            # if it worked, keep using playsound
            audioplayer = 'playsound'
# clear category selection
def clear():
    beginoptionscat.set("Categorize clip")
    langcategory.set("Categorize language")
    speakercategory.set("Categorize speaker")
    registercategory.set("Categorize register")
    comments.delete(0, 'end')
# need to give multiple commands to the buttons below
def combine_funcs(*funcs):
    def combined_func(*args, **kwargs):
        for f in funcs:
            f(*args, **kwargs)
    return combined_func
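# A brief illustration of combine_funcs (the callables named here are hypothetical,
# not part of the app): combine_funcs(save_response, close_window) returns one
# function that calls save_response() and then close_window(), so a single tkinter
# Button command can trigger several actions, as the buttons below do.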
# check if we are done annotating
def check_done(source_df, annotated_dur, desired_dur=desired_duration):
    # return False if not done, 'enough' if you annotated enough,
    # or 'no more' if there's no more valid audio
    # check if we've annotated enough
    if annotated_dur > desired_dur:
        print('You have annotated more than the minimum desired duration')
        return 'enough'
    # check if there are more rows
    elif len(source_df) == 0:
        print('There is no more audio for you to annotate')
        return 'no more'
    else:
        return False
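# Illustrative return values for check_done, assuming the default 60-minute target:
#   check_done(config_df_with_rows, 3601) -> 'enough'   (past desired_duration)
#   check_done(pd.DataFrame(), 120)       -> 'no more'  (no rows left to annotate)
#   check_done(config_df_with_rows, 120)  -> False      (keep annotating)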
# for putting time into a nice human-readable format
def describe_time(duration_so_far):
    # report duration annotated in minutes, to minute_decimals decimal places
    if duration_so_far > 60:  # if duration > 1 min, print in min
        printed_duration = str(round(duration_so_far/60, minute_decimals))
        unit = 'minutes'
    else:
        printed_duration = str(int(duration_so_far))
        unit = 'seconds'
    description = printed_duration + ' ' + unit
    return description
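# Illustrative outputs of describe_time, with minute_decimals = 2:
#   describe_time(45)   -> '45 seconds'
#   describe_time(90)   -> '1.5 minutes'
#   describe_time(3601) -> '60.02 minutes'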
# for notifying the annotator that there's nothing left to code
def notify_finished(reason=None):
    global desired_duration
    global job_done
    job_done = True
    time_annotated = describe_time(duration_so_far)
    time_requested = describe_time(desired_duration)
    if reason == 'enough':
        finish_message = time_annotated + " of audio have been annotated out of " + time_requested + ". You can close this app."
    elif reason == 'no more':
        finish_message = time_annotated + " of audio have been annotated out of " + time_requested + ". There is no more audio for you to annotate. You can close this app."
    else:
        # called without a specific reason (e.g. when annotation was already finished)
        finish_message = time_annotated + " of audio have been annotated out of " + time_requested + ". You can close this app."
    return showinfo('Annotation complete', finish_message)
# get initial info about annotator
def annotatorinfo():
    global config_df
    global outdir
    global annotator_name

    # Get annotator's name
    annotate = tk.Toplevel()
    annotate.title("Annotator information")

    def close_window(annotate):
        annotate.destroy()

    tk.Label(annotate, text="What is your name?").grid(row=0)
    name = tk.Entry(annotate)

    def get_name():
        global annotator_name
        annotator_name = name.get()

    name.grid(row=0, column=1)
    tk.Button(annotate, text="Enter", command=combine_funcs(get_name, partial(close_window, annotate), get_resp_df)).grid(row=7, column=1, columnspan=2)
def get_resp_df():
    global config_df
    global outdir
    global annotator_name
    global resp_df
    global desired_duration
    global duration_so_far
    global resp_df_filepath

    resp_df_filename = 'responses_' + annotator_name.lower() + '.csv'
    resp_df_filepath = os.path.join(outdir, resp_df_filename)
    resp_df_exists = os.path.isfile(resp_df_filepath)
    if resp_df_exists:
        print('Writing responses to ' + resp_df_filepath)
        resp_df = pd.read_csv(resp_df_filepath)  # if it exists, load the existing response df
    else:  # if not, confirm with the user before creating it
        confirm_create = askyesno(title='Response CSV not found', message='Could not find ' + resp_df_filename + '.\nCreate new file ' + resp_df_filename + '?')
        if confirm_create:
            empty = pd.DataFrame().assign(id=None, age_YYMMDD=None, date_YYYYMMDD=None, gender=None, file_name=None, percents_voc=None, outdir=None, researcher_present=None)
            empty.to_csv(resp_df_filepath, index=False)
            resp_df = pd.read_csv(resp_df_filepath)
        else:
            # try getting their name again
            return annotatorinfo()

    # we need to know the duration of clips that have been annotated so far
    if len(resp_df) > 0:
        # filter out anything annotated as non-speech
        filterdf = resp_df[resp_df['beginoptions'] != 'No speech']
        duration_so_far = sum(filterdf['duration'].tolist())
        # no change is made to resp_df, so those annotations are preserved
    # duration_so_far was already set to 0 at the start of the script, so no else is needed

    # we don't want to repeat any annotations: drop from config_df any rows
    # whose filename already appears in resp_df
    forbidden_files = resp_df['file_name'].tolist()
    # if resp_df doesn't have any file names, we don't need to proceed
    if forbidden_files:
        # flag config_df rows whose filename is in the prohibited list
        mask = config_df['file_name'].isin(forbidden_files)
        masked_df = config_df[mask]
        # get a list of indices for rows whose filenames we don't want to re-annotate
        forbidden_indices = [r.Index for r in masked_df.itertuples()]
        # drop them from config_df
        for i in forbidden_indices:
            config_df = config_df.drop(i, axis='index')

    # if config_df is empty, it means we don't have anything else to annotate
    reason_finished = check_done(config_df, duration_so_far)
    if reason_finished:
        notify_finished(reason_finished)
    else:
        # play the first audio clip
        play_new_clip()
# go to the next audio file
def next_audio():
    global repeat_ct
    global duration_so_far
    global config_df
    global row
    global resp_df
    global idx

    beginoptions = beginoptionscat.get()  # get the clip classification
    language = langcategory.get()  # get the language classification
    speaker = speakercategory.get()
    register = registercategory.get()
    clip_comments = comments.get()
    annotate_date_YYYYMMDD = datetime.datetime.now()  # get current annotation time
    print(beginoptions, language, speaker, register, annotate_date_YYYYMMDD, annotator_name, clip_comments)

    allcols = pd.DataFrame([row]).assign(beginoptions=beginoptions, Language=language, Speaker=speaker, Register=register, comments=clip_comments, annotate_date_YYYYMMDD=annotate_date_YYYYMMDD, annotator=annotator_name, repeats=repeat_ct)
    resp_df = pd.concat([resp_df, allcols], sort=True)
    resp_df.to_csv(resp_df_filepath, index=False)  # this overwrites the file each time

    # update our duration counter
    duration_so_far += row['duration']

    # check if we're done annotating; if not, ensure we don't pick this row again
    reason_finished = check_done(config_df, duration_so_far)
    if reason_finished:
        notify_finished(reason_finished)
    else:
        # ensure we don't select this row in the future
        config_df = config_df.drop(row.name)  # .name is where the original index is stored
        idx += 1  # update the global idx
        repeat_ct = int(0)
# index and play an audio file aloud
def play_new_clip():
    global repeat_ct
    global row
    global audiofile
    repeat_ct = int(0)

    # check if there's anything left to annotate; if so, pick the next row of config_df
    reason_finished = check_done(config_df, duration_so_far)
    if reason_finished:
        notify_finished(reason_finished)
    else:
        row = config_df.iloc[0]  # select next row
        if row['researcher_present'] == 1:
            print('Researcher present in recording.')
        elif row['percents_voc'] == 0:  # if no vocal activity detected
            print('No vocal activity in clip.')
        elif row['sleeping'] == 1:  # if child is sleeping
            print('Child is sleeping.')
        audiofile = os.path.join(row.outdir, str(row.file_name))
        print(idx, row.file_name)  # keep us updated
        play_sound(audiofile)
def next_and_play_audio():
    if not job_done:
        next_audio()
        play_new_clip()
    else:
        notify_finished()
def repeat():
    global repeat_ct
    play_sound(audiofile)
    repeat_ct = repeat_ct + 1
def main():
    global beginoptionscat
    global langcategory
    global speakercategory
    global registercategory
    global comments
    global outdir
    global config_df

    root = tk.Tk()  # refers to annotation window
    root.update()
    root.title("Categorize")

    frame = tk.Frame(root, bg="white")
    frame.grid(row=15, column=15)

    beginoptionscat = tk.StringVar()
    langcategory = tk.StringVar()
    speakercategory = tk.StringVar()
    registercategory = tk.StringVar()

    # import dropdown menu choices. These should be specified in .txt files
    # that are in the same directory as this script.
    # find this script's filepath
    thisfilepath = os.path.dirname(os.path.realpath(__file__))
    # build the txt files' paths
    beginoptions_path = os.path.join(thisfilepath, '2a_categorize_beginoptions.txt')
    lang_path = os.path.join(thisfilepath, '2b_categorize_language.txt')
    speaker_path = os.path.join(thisfilepath, '2c_categorize_speaker.txt')
    register_path = os.path.join(thisfilepath, '2d_categorize_register.txt')

    # read and process the txt files
    def read_options(filepath):
        with open(filepath) as file:
            options = file.readlines()
        # remove any newline characters from the end of lines
        for i in range(len(options)):
            while options[i][-1:] == '\r' or options[i][-1:] == '\n':
                options[i] = options[i][:-1]
        return options
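    # Each option file is read as one dropdown choice per line. A hypothetical sketch
    # of 2a_categorize_beginoptions.txt (only 'No speech' is assumed elsewhere in this
    # script, in get_resp_df; the other lines are placeholders):
    #   No speech
    #   Speech
    #   Unsure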
    beginoptions_choices = read_options(beginoptions_path)
    lang_choices = read_options(lang_path)
    speaker_choices = read_options(speaker_path)
    register_choices = read_options(register_path)

    beginoptionscat.set("Categorize clip")
    langcategory.set("Categorize language")
    speakercategory.set("Categorize speaker")
    registercategory.set("Categorize register")

    popupMenu0 = tk.OptionMenu(frame, beginoptionscat, *beginoptions_choices)
    popupMenu = tk.OptionMenu(frame, langcategory, *lang_choices)
    popupMenu1 = tk.OptionMenu(frame, speakercategory, *speaker_choices)
    popupMenu2 = tk.OptionMenu(frame, registercategory, *register_choices)
    popupMenu0.grid(row=3, column=1)
    popupMenu.grid(row=5, column=1)
    popupMenu1.grid(row=6, column=1)
    popupMenu2.grid(row=7, column=1)

    fontStyle = tkFont.Font(family="Lucida Grande", size=16, weight="bold")
    tk.Label(frame, font=fontStyle, text="Classify clip").grid(row=3, column=0)
    tk.Label(frame, text="Language: ").grid(row=5, column=0)
    tk.Label(frame, text="Speaker: ").grid(row=6, column=0)
    tk.Label(frame, text="Register:").grid(row=7, column=0)

    tk.Label(frame, font=fontStyle, text="Comments about clip?").grid(row=8, column=0)
    comments = tk.Entry(frame)
    comments.grid(row=8, column=1, columnspan=2)

    tk.Button(frame, background="gray", text=" Play ", command=repeat).grid(row=1, column=0)
    tk.Button(frame, text=" Next ", command=combine_funcs(next_and_play_audio, clear), bg="gray").grid(row=1, column=2)

    showinfo('Window', "Select a metadata file")
    fname = askopenfilename(filetypes=(("CSV File", "*.csv"), ("all files", "*.*")),
                            title="Please choose a config.csv file")
    fname = os.path.normpath(fname)
    outdir = os.path.split(fname)[0]
    config_df = pd.read_csv(fname).assign(outdir=outdir)  # the master config file
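    # Columns the selected config.csv is expected to provide, based on the fields the
    # functions above read from each row (the example values are purely illustrative):
    #   file_name, duration, percents_voc, researcher_present, sleeping
    #   e.g. clip_0001.wav, 60, 12.5, 0, 0
    # The assign() call above also adds an 'outdir' column recording where the audio lives.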
    annotatorinfo()

    root.mainloop()


if __name__ == "__main__":
    main()
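# How to run (a sketch; the package names follow the imports above, exact setup may vary):
#   pip install pandas pydub playsound
#   python3 2_categorize_app_basel.py
# pydub playback may additionally need an audio backend such as simpleaudio or ffplay.
# The script asks for a config.csv, then the annotator's name, and writes responses to
# responses_<name>.csv in the same directory as the config file.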