valapil hace 2 años
padre
commit
645d16540e
Se han modificado 5 ficheros con 584 adiciones y 0 borrados
  1. 251 0
      00_clip_video.py
  2. 68 0
      02_process_offset.py
  3. 42 0
      03_process_data.py
  4. 95 0
      04_get_expression.py
  5. 128 0
      05_wilcoxon.py

+ 251 - 0
00_clip_video.py

@@ -0,0 +1,251 @@
+
+# This code clips the raw videos based on claps detected by the user during the execution and stores them in a new file
+
+import subprocess
+import glob
+import sounddevice as sd
+import argparse
+import os
+
+
+from scipy.signal import butter, filtfilt
+from scipy.io import wavfile
+from pylab import *
+
def butter_lowpass(cutoff_low, cutoff_high, fs, order=5):
    """Design a Butterworth *band-pass* filter.

    Despite the historical name, this returns band-pass coefficients for the
    band ``[cutoff_low, cutoff_high]`` (Hz), normalised by the Nyquist
    frequency of the sampling rate ``fs``.

    :param cutoff_low: lower band edge in Hz
    :param cutoff_high: upper band edge in Hz
    :param fs: sampling frequency in Hz
    :param order: filter order (default 5)
    :return: transfer-function coefficients ``(b, a)``
    """
    nyquist = 0.5 * fs
    band = [cutoff_low / nyquist, cutoff_high / nyquist]
    return butter(order, band, btype='bandpass', analog=False)
+
+
def butter_lowpass_filter(data, cutoff_low, cutoff_high, fs, order=5):
    """Band-pass filter ``data`` with zero-phase filtering.

    The Butterworth band-pass is designed by :func:`butter_lowpass` and
    applied forward and backward (``filtfilt``) so no phase shift is
    introduced into the signal.

    :param data: 1-D signal to filter
    :param cutoff_low: lower band edge in Hz
    :param cutoff_high: upper band edge in Hz
    :param fs: sampling frequency in Hz
    :param order: filter order (default 5)
    :return: the filtered signal
    """
    coeffs = butter_lowpass(cutoff_low, cutoff_high, fs, order=order)
    return filtfilt(*coeffs, data)
+
+
def find_start_frame_by_clap(path_to_audio_file, startt=0, stopt=500,
                             where=None):
    """
    Interactively detect a clap in an audio file.

    The loudest band-pass-filtered peak is played back and the user must
    confirm it: press [d] to accept, [c] to zero the candidate and restart
    the search, [a] to listen again, [e] to skip (returns 0), or [n] if no
    clap exists at all (second of clap is then set to 1).

    :param path_to_audio_file: path to a .wav file
    :param startt: default 0, time in seconds at which the search starts
    :param stopt: default 500, time in seconds at which the search window
        ends; the window is widened by 10 s on every restart
    :param where: allowed values are 'start' or 'end'; if provided, the
        second or first half of the signal respectively is zeroed so only
        the relevant half is searched
    :return: second of the .wav file in which the clap takes place
        (0 when skipped with [e], 1 when not found with [n])
    """
    audioFreq, audio = wavfile.read(path_to_audio_file)
    audio.setflags(write=1)

    # Zero out half of the signal when only the start / end clap is wanted.
    if where is not None:
        if where == 'end':
            audio[0:int(len(audio) / 2)] = 0
        elif where == 'start':
            audio[int(len(audio) / 2):len(audio)] = 0
        else:
            print('where must be \'start\' or \'end\'')

    cutoff_low = 1000  # desired band edges of the band-pass filter, Hz
    cutoff_high = 1400
    fs = 3000
    order = 5

    foundStartClap = False
    k = 0
    while not foundStartClap:
        # Widen the search window by 10 seconds on every retry.
        k += 10
        s = int(audioFreq * startt)
        e = int(audioFreq * (stopt + k))
        # Filter the .wav file within the given range of time and find the
        # sample with the maximum amplitude (the clap candidate).
        y = butter_lowpass_filter(audio[s:e, 0], cutoff_low,
                                  cutoff_high, fs, order)
        maxamp = np.argmax(y)
        # -/+ 2 * audioFreq gives a ~4 second playback window around the
        # candidate so something is actually audible when audio is played.
        l = int(maxamp - 2 * audioFreq)
        u = int(maxamp + 2 * audioFreq)
        print(l / audioFreq, u / audioFreq)
        sd.play(audio[l:u], audioFreq, blocking=True)
        print('Clap playing second: ', np.ceil(maxamp / audioFreq))
        # Capture keyboard events
        while True:
            print("Press [d] if clap was detected; [c] if sound was no clap; "
                  "[a] to hear again; [e] to pass; press [n] if clap not "
                  "found at all, second of clap will be set to one")
            x = input()
            if x == 'd':
                second_of_clap = maxamp / audioFreq
                print('Clap accepted; takes place at second ', second_of_clap)
                foundStartClap = True
                break
            elif x == 'c':
                print('Restart clap search')
                # Silence the rejected candidate so the next argmax differs.
                audio[l:u] = 0
                break
            elif x == 'a':
                sd.play(audio[l:u], audioFreq, blocking=True)
            elif x == 'e':
                return 0
            elif x == 'n':
                second_of_clap = 1
                foundStartClap = True
                print('Clap not found, video will start at ', second_of_clap)
                break
            else:
                print('Key must be [d], [c], [a], [e] or [n]')

    return second_of_clap
+
def clip_video_from_clap(video_path, output_path, start_time, end_time):
    """Clip ``video_path`` between two timestamps using ffmpeg stream copy.

    ``-c copy`` avoids re-encoding, so clipping is fast and lossless.

    :param video_path: path of the input video
    :param output_path: path the clipped video is written to
    :param start_time: clip start (seconds or any ffmpeg time spec)
    :param end_time: clip end (seconds or any ffmpeg time spec)
    :return: ffmpeg's exit code
    """
    # Pass arguments as a list (shell=False) so paths containing spaces or
    # shell metacharacters can neither break nor inject into the command.
    command_clip = [
        "ffmpeg", "-i", str(video_path),
        "-ss", str(start_time), "-to", str(end_time),
        "-c", "copy", str(output_path),
    ]
    return subprocess.call(command_clip)
+
+
if __name__ == "__main__":

    """
    This script processes all videos at once. The default directory for videos
    being processed is data/Videos. Frames are automatically extracted after
    clap detection finished. The following steps are performed:
        1) Create folder based on video name
        2) Extract audio file
        3) Clap detection (starting and ending clap) using low pass filter in
        video for synchronization of the three cameras.
        Make sure sound is turned on. Clap detection results are written to
        offset.csv. Headphones necessary to confirm detection.
        4) Extract video frames using ffmpeg

        Args:
            inputpath: Path to folder with videos.

        Returns:
            Folder containing audio file and video frames. Writes number of
            frame where clap takes place and second of clap to offset.csv.
    """

    parser = argparse.ArgumentParser(description='Processes all Videos in '
                                                 '--inputpath at once')
    parser.add_argument('--inputpath',
                        default='/home/valapil/Project/ForkCausal_Adithya/raw_video/pair3',
                        help='Path to folder with videos to process')
    parser.add_argument('--outputpath',
                        default='/home/valapil/Project/ForkCausal_Adithya/clipped_vid',
                        help='Path to folder with pair-folders')
    # NOTE(review): action='store_false' makes ExtractFrames default to True
    # and passing the flag turns extraction OFF -- inverted w.r.t. the help
    # text; 'store_true' was probably intended. Confirm before changing.
    parser.add_argument('--ExtractFrames', action='store_false',
                        help='If true frames are extracted from video')
    args = parser.parse_args()
    print(args, args.ExtractFrames)

    # Comment in if side view perspective is processed as well.
    # videofiles = glob.glob(args.inputpath + '/*.MTS')
    # videofiles.extend(glob.glob(args.inputpath + '/*.MOV'))
    # videofiles = sorted(videofiles)

    videofiles = sorted(glob.glob(args.inputpath + '/*.MTS'))

    print('Videos to process: ', args.inputpath, videofiles)

    # offset.csv collects clap positions. NOTE(review): the only f.write call
    # below is commented out, so this file currently stays empty.
    f = open(os.path.join(args.outputpath, 'offset.csv'), 'a')

    # Extract clap and audio
    for video_dir in videofiles:

        accept_Video = True
        print('Processing video: ', video_dir)

        video = os.path.basename(video_dir)
        video_file = os.path.basename(video).split('.')[0]

        # NOTE(review): str.replace substitutes EVERY 'r' in the name with
        # 'o', not just a single role marker -- confirm naming convention.
        video_file = video_file.replace('r', 'o')
        print('PROCESS ', video_dir)

        # Create directory for pair (first three characters encode the pair)
        pair = 'pair_' + str(video_file[0:3])
        create_folder_pair = os.path.join(args.outputpath, pair)
        # NOTE(review): os.makedirs(..., exist_ok=True) would avoid the shell
        # for these three mkdir calls.
        command_folder = "mkdir -p " + create_folder_pair
        subprocess.call(command_folder, shell=True)

        # Create directory for images in outputpath
        create_folder_img = os.path.join(args.outputpath, pair,
                                         video_file, 'images')
        command_folder_img = "mkdir -p " + create_folder_img
        subprocess.call(command_folder_img, shell=True)

        # Create directory for audio file in outputpath
        create_folder_audio = os.path.join(args.outputpath, pair,
                                           video_file, 'audio')
        command_folder_audio = "mkdir -p " + create_folder_audio
        subprocess.call(command_folder_audio, shell=True)

        # Extract audio from video (stereo, 44.1 kHz wav, video stream dropped)
        aud = os.path.join(create_folder_audio,
                           video_file + "_audio.wav")
        command_audio = "ffmpeg -i " + video_dir + \
                        " -ab 160k -ac 2 -ar 44100 -vn " + aud
        subprocess.call(command_audio, shell=True)

        # Detect starting and ending claps in video
        for i in ['start', 'end']:
            second_of_clap = find_start_frame_by_clap(path_to_audio_file
                                                      =aud, where=i)
            # Video camera from media department format
            if os.path.basename(video).split('.')[1] == 'MTS':
                frame_rate = 25
                frame_of_clap = int(second_of_clap * frame_rate)
            # ipad video format
            elif os.path.basename(video).split('.')[1] == 'MOV':
                # original frame rate is of .MOV is 29.984664, but side
                # view should be synchronized with frontal perspective
                frame_rate = 25
                frame_of_clap = int(second_of_clap * frame_rate)
            # NOTE(review): frame_of_clap stays unbound (NameError on the
            # print below) for any extension other than MTS / MOV.

            print(video_file, i, second_of_clap, frame_of_clap)

            if i == 'start':
                start_clip = second_of_clap
            elif i == 'end':
                # Identical start and end second means detection failed;
                # skip clipping for this video.
                if second_of_clap == start_clip:
                    accept_Video = False
                else:
                    end_clip = second_of_clap

        if accept_Video == True:
            clip_output_path = os.path.join(create_folder_pair, video_file, f"{video}_clipped.mp4")
            clip_video_from_clap(video_path=video_dir, output_path=clip_output_path, start_time=start_clip, end_time= end_clip)
            # f.write(f'{video_file} {i} {second_of_clap} {frame_of_clap}\n')

    f.close()

    # # Extract video frames to pair/condition/images
    # if args.ExtractFrames:
    #     print('Start extracting frames ... ')
    #     for video_dir in videofiles:
    #         video = os.path.basename(video_dir)
    #         video_file = os.path.basename(video).split('.')[0]
    #         # you can exclude videos (e.g. sideview)
    #         # processedVideos = ['I am already processed']
    #         # if np.isin(video_file, processedVideos, invert=True):
    #         pair = 'pair_' + str(video_file[0:3])
    #         create_folder_pair = os.path.join(args.outputpath, pair)
    #         create_folder = os.path.join(create_folder_pair, video_file,
    #                                      'images')
    #         vid = create_folder + '/' + video_file + '_%05d.png'
    #
    #         # Call from shell
    #         command_frames = "ffmpeg -i " + video_dir + " -r 25 " + vid
    #         subprocess.call(command_frames, shell=True)

+ 68 - 0
02_process_offset.py

@@ -0,0 +1,68 @@
+# use the openface 2 to get the action units before this
+# go to- valapil@hemera4:~/Programs/OpenFace$
+# type- ./bin/FeatureExtraction -f "/home/valapil/Project/ForkCausal_Adithya/clipped_vid/pair_021/021S3o/021S3o.MTS_clipped.mp4"
+
+# also get the offset values
+
+import numpy as np
+import os
+
+
# Column headers for the OpenFace action-unit table. NOTE(review): AU is not
# used anywhere in this script; the same header is rebuilt in 03_process_data.
AU = ["Person", "Case", "AU01", "AU02", "AU04", "AU05", "AU06", "AU07", "AU09","AU10","AU12","AU14","AU15","AU17","AU20","AU23",
      "AU25","AU26", "AU45"]
# Header row of the offset table saved to offset_values.npy further below.
off = ["Case", "Start", "End", "Person"]

# folder where output csv files of OpenFace are stored
folder = '/home/valapil/Project/ForkCausal_Adithya/csv_files'
csv_files = [file for file in os.listdir(folder) if file.endswith('.csv')]
+
def loadOffset(path='/home/valapil/Project/ForkCausal_Adithya/offset.csv'):
    """
    Read the clap-offset values for the video frames from ``offset.csv``.

    :param path: path to the offset.csv file; defaults to the project's
        previously hard-coded location so existing callers are unaffected
    :return: nested dictionary ``{identifier: {'start'/'end': frame}}``,
        e.g. ``{'002S1g': {'start': 7, 'end': 1200}}``; frames are rounded
        up to whole numbers
    """
    offset = {}
    with open(path, 'r') as f:
        f.readline()  # skip the header line
        for row in f:
            # Each data row: "<id> <start|end> <second> <frame> ..."
            identifier, start_end, second, frame = row.split(' ')[0:4]
            offset.setdefault(identifier, {})[start_end] = int(
                np.ceil(float(frame)))
    return offset
+
+
# Build one row per OpenFace csv file: case id, start frame, end frame, file
# id. Rows are stacked under the `off` header defined above.
for file in csv_files:
    base_name, extension = os.path.splitext(file)
    new_name = base_name.split('.')[0]
    # NOTE(review): f1 / f2 are computed but never used in this script.
    f1 = new_name[:-2]
    f2 = new_name[-1:]
    file_path = os.path.join(folder, file)

    # NOTE(review): loadOffset() re-reads offset.csv on every iteration;
    # hoisting it above the loop would be equivalent and cheaper.
    offset = loadOffset()
    # NOTE(review): the else branch presumably restores a leading zero that
    # was stripped from the identifier -- confirm against the offset.csv
    # naming scheme before relying on the new_name[-5] test.
    if new_name[-5] != '0':
        offset_file = np.hstack((new_name[:-3] + new_name[-1], offset[new_name]['start'], offset[new_name]['end'], new_name))
    else:
        offset_file = np.hstack((new_name[:-3] + new_name[-1], offset['0' + new_name]['start'], offset['0' + new_name]['end'], new_name))

    off = np.row_stack((off, offset_file))

# file where offset values are stored as npy format
np.save(f'/home/valapil/Project/ForkCausal_Adithya/offset_values.npy', off)
+
+
+
+
+
+
+
+
+
+
+
+
+
+

+ 42 - 0
03_process_data.py

@@ -0,0 +1,42 @@
import numpy as np
import os


# Output table header: person id, case, OpenFace confidence, then the 17
# action-unit intensity columns.
AU = ["Person", "Case", "Confidence", "AU01", "AU02", "AU04", "AU05", "AU06", "AU07", "AU09","AU10","AU12","AU14","AU15","AU17","AU20","AU23",
  "AU25","AU26", "AU45"]

# folder where output csv files of OpenFace are stored
folder = '/home/valapil/Project/ForkCausal_Adithya/csv_files'
csv_files = [file for file in os.listdir(folder) if file.endswith('.csv')]

# load the offset values (rows: [case id, start frame, end frame, file id])
offset = np.load(f'/home/valapil/Project/ForkCausal_Adithya/offset_values.npy')
length = {}
same = np.unique(offset[1:, 0])
# For each case keep the larger start/end span of its two recordings so both
# partners are later trimmed to a comparable length.
for i in same:
    same_rows = offset[offset[:, 0] == i]
    length[i] = max(abs(int(same_rows[0][2]) - int(same_rows[0][1])), abs(int(same_rows[1][2]) - int(same_rows[1][1])))

for file in csv_files:
    base_name, extension = os.path.splitext(file)
    new_name = base_name.split('.')[0]
    f1 = new_name[:-2]  # person identifier (file name minus the last 2 chars)
    f2 = new_name[-1:]  # case identifier (last character)
    file_path = os.path.join(folder, file)
    # NOTE(review): `len` shadows the builtin for the rest of the loop body.
    len = length[new_name[:-3] + new_name[-1]]
    start = np.where(offset[1:, 3]  == new_name)[0][0]
    start = int(offset[start+1, 1])
    data_all = np.genfromtxt(file_path, delimiter=',', skip_header=1)
    # Columns 679:696 are presumably the 17 AU intensity columns of the
    # OpenFace CSV, and the final 200 frames are dropped -- TODO confirm both
    # against the OpenFace output format actually produced.
    data = data_all[start:len-200, 679:696]

    # Prepend person/case ids and the confidence column (index 3).
    selected_columns = np.hstack((np.full((data.shape[0], 2), [f1, f2]), data_all[start:len-200, [3]], data))

    AU = np.row_stack((AU, selected_columns))

    #  save each offset data here
    np.save(f'/home/valapil/Project/ForkCausal_Adithya/data/{new_name}.npy', data)

#  save all offset data with the particular case and confidence value here
np.save(f'/home/valapil/Project/ForkCausal_Adithya/processed_data.npy', AU)
+
+

+ 95 - 0
04_get_expression.py

@@ -0,0 +1,95 @@
import numpy as np
from numpy import save
import os


# AU = ["AU01", "AU02", "AU04", "AU05", "AU06", "AU07", "AU09","AU10","AU12","AU14","AU15","AU17","AU20","AU23",
#       "AU25","AU26","AU45","AU01_c","AU02_c","AU04_c","AU05_c","AU06_c","AU07_c","AU09_c","AU10_c","AU12_c","AU14_c","AU15_c","AU17_c",
#       "AU20_c","AU23_c","AU25_c","AU26_c","AU28_c","AU45_c"]

# Per-person reference table: file id followed by one activation threshold
# (mean + 0.5 * std) per action unit.
reference_au = ["File", "AU01", "AU02", "AU04", "AU05", "AU06", "AU07", "AU09","AU10","AU12","AU14","AU15","AU17","AU20","AU23",
      "AU25","AU26", "AU45"]


# finding reference values
# NOTE(review): ref_au is initialised as a dict and ref as a list, but both
# are overwritten with arrays inside the loop below; these initialisers are
# dead code.
ref_au = {}
ref = []

#  get all offset data (header row + [person, case, confidence, 17 AUs])
data_all = np.load(f'/home/valapil/Project/ForkCausal_Adithya/processed_data.npy')
# data = np.concatenate(data_all[:3], data_all[4:])
data = np.delete(data_all, 2,1)  # drop the confidence column
activation = []


unique = np.unique(data[1:, 0])

# One reference threshold per person: an AU later counts as "active" in a
# frame when its intensity reaches the person's mean + 0.5 * std.
for i in unique:
    same_rows = data[data[:, 0] == i]
    mean = np.mean(same_rows[:, 2:19].astype(np.float64), axis=0)
    std = np.std(same_rows[:, 2:19].astype(np.float64), axis=0)
    ref_au = mean + (0.5 * std)
    # ref_au.append(mean + (0.5 * std))
    ref = np.hstack((i, ref_au))
    reference_au = np.row_stack((reference_au, ref))

# folder where each offset data is stored
folder = '/home/valapil/Project/ForkCausal_Adithya/data'
csv_files = [file for file in os.listdir(folder) if file.endswith('.npy')]



for file in csv_files:
    EXP = ["Happiness upper", "Happiness lower", "Surprise upper", "Surprise lower", "Disgust lower", "Fear upper",
            "Fear lower", "Sadness upper", "Sadness lower", "Anger upper", "Anger lower"]

    # Get data
    file_path = os.path.join(folder,file)
    # data = np.genfromtxt(file_path, delimiter=',', skip_header=1)
    data = np.load(file_path)

    # find the particular person
    base_name, extension = os.path.splitext(file)
    new_name = base_name.split('.')[0]
    f1 = new_name[:-2]
    selected_columns = data

    index = np.where(reference_au[1:, 0] == f1)[0]

    # AU activation
    # NOTE(review): float16 keeps only ~3 significant digits; float64 would
    # avoid needless precision loss in the threshold comparison.
    change = np.subtract(selected_columns, reference_au[index+1, 1:].astype(np.float16))
    activation = np.where(change >= 0, 1, 0)

    expression_labels = np.zeros((activation.shape[0], 11), dtype=int)

    # Define expressions based on specific AUs
    expression_labels[:, 0] = np.any(activation[:, [4]], axis=1)  # AU06 is 4th au in order. [4] to get results with []
    expression_labels[:, 1] = np.all(activation[:, [8, 14]], axis=1)  # AU12 and AU25
    expression_labels[:, 2] = np.all(activation[:, [0, 1, 3]], axis=1)  # AU01, AU02, AU05
    expression_labels[:, 3] = np.any(activation[:, [15]], axis=1)  # AU26
    expression_labels[:, 4] = np.all(activation[:, [6, 7, 14]], axis=1)  # AU09, AU10, AU25
    expression_labels[:, 5] = np.all(activation[:, [0, 1, 2, 3]], axis=1)  # AU01, AU02, AU04, AU05
    expression_labels[:, 6] = np.all(activation[:, [12, 14]], axis=1)  # AU20, AU25
    expression_labels[:, 7] = np.all(activation[:, [0, 2]], axis=1)  # AU01, AU04
    expression_labels[:, 8] = np.all(activation[:, [10, 11]], axis=1)  # AU15, AU17
    expression_labels[:, 9] = np.all(activation[:, [2, 3, 5]], axis=1)  # AU04, AU05, AU07
    expression_labels[:, 10] = np.all(activation[:, [11, 13]], axis=1)  # AU17, AU23

    EXP = np.row_stack((EXP, expression_labels))

    # Save the result to a new NumPy file
    # Each file has expressions for each frame based on activation of AU in that frame
    np.save(f'/home/valapil/Project/ForkCausal_Adithya/test/{new_name}.npy', EXP)
+
+
+
+
+
+
+
+
+
+
+
+
+

+ 128 - 0
05_wilcoxon.py

@@ -0,0 +1,128 @@
# normalisation and results for wilcoxon test

import numpy as np
import pandas as pd
from numpy import load
from numpy import save
import os
from scipy.stats import wilcoxon

# folder where expression activation per frame of each pair is stored
expressions_folder = '/home/valapil/Project/ForkCausal_Adithya/test/'

# EXP = ["CASE", "Happiness", "Surprise", "Disgust", "Fear", "Sadness", "Anger"]

# Result table header: pair / role / case ids, then the 11 expression
# activation percentages.
EXP = ["pair", "role", "case", "Happiness upper", "Happiness lower", "Surprise upper", "Surprise lower", "Disgust lower", "Fear upper",
        "Fear lower", "Sadness upper", "Sadness lower", "Anger upper", "Anger lower"]


np_files = [file for file in os.listdir(expressions_folder)]

expr_sum = None

# Number of frames per expression file, keyed by file identifier.
frames = {}

# get frames
for file in np_files:
    file_path = os.path.join(expressions_folder, file)
    data = np.load(file_path)
    base_name, extension = os.path.splitext(file)
    new_name = base_name.split('.')[0]
    frames[new_name] = data.shape[0]

# normalisation 1: per-file activation counts as a percentage of the shorter
# of the two matching recordings (the S... / E... pair of the same session).
for file in np_files:
    file_path = os.path.join(expressions_folder, file)
    data = np.load(file_path)
    data = data[1:, :].astype(np.float64)  # drop the header row

    base_name, extension = os.path.splitext(file)
    new_name = base_name.split('.')[0]
    frame = min(frames[new_name[:-3] + 'S' + new_name[-2:]], frames[new_name[:-3] + 'E' + new_name[-2:]])
    expr_sum = np.sum(data, axis=0)
    norm_frames = np.divide(100 * expr_sum, frame)

    # Row: pair id, role character, case character, 11 normalised values.
    total = np.hstack((new_name[:-3], new_name[-3], new_name[-1], norm_frames))
    EXP = np.row_stack((EXP, total))

# normalisation 2: scale each pair/role group so its expressions sum to 1.
df = pd.DataFrame(EXP[1:, :])
df.columns = ["pair", "role", "case", "Happiness upper", "Happiness lower", "Surprise upper", "Surprise lower",
              "Disgust lower", "Fear upper", "Fear lower", "Sadness upper", "Sadness lower", "Anger upper", "Anger lower"]

num_col = ["Happiness upper", "Happiness lower", "Surprise upper", "Surprise lower",
              "Disgust lower", "Fear upper", "Fear lower", "Sadness upper", "Sadness lower", "Anger upper", "Anger lower"]
df[num_col] = df[num_col].apply(pd.to_numeric, errors='coerce')

# aumax1 = df.groupby(['pair', 'role']).sum()
aumax2 = df.groupby(['pair', 'role'])[num_col].transform('sum')


result = EXP[1:,:].copy()
result[:, 3:] = df[num_col] / aumax2


# need to group by case
s1 = np.sum(EXP[1:, 3:].astype(np.float64), axis=0)
s2 = np.multiply((np.divide(s1, sum(s1))), 100)

output = ["Happiness upper", "Happiness lower", "Surprise upper", "Surprise lower", "Disgust lower", "Fear upper",
        "Fear lower", "Sadness upper", "Sadness lower", "Anger upper", "Anger lower"]
# output = np.row_stack((output , s2))

print(output, s2)

benjhoch = []
testresult = {}
intersect = []

# Wilcoxon signed-rank test for every expression and every pairing of the
# three conditions g / a / o; p-values are collected for the
# Benjamini-Hochberg correction below.
# for expr in range(0, output.shape[1]):
for expr, value in enumerate(output):
    for cond in [['g', 'a'], ['a', 'o'], ['g', 'o']]:
        index = np.where(result[:, 2] == cond[0])[0]
        x = result[index, 3+expr].astype(np.float64)
        index = np.where(result[:, 2] == cond[1])[0]
        y = result[index, 3+expr].astype(np.float64)
        res = wilcoxon(x=x, y=y, zero_method='pratt')
        benjhoch += [[value, res[1], cond[0], cond[1]]]
        testresult[value] = [cond, res]


Q = 0.3  # false discovery rate for the Benjamini-Hochberg procedure
benjhoch = np.array(benjhoch,dtype=object)
# Sort by p-value and append the rank column (1..m).
benjhoch = np.column_stack((benjhoch[benjhoch[:, 1].argsort()],
                            np.arange(1, len(benjhoch) + 1)))
print('Benjamini Hochberg Table: \n', benjhoch)
m = len(output) * 3  # total number of tests performed

# Find maximum rank where actual p-value is smaller
# than hochberg-benjamini p-value
# NOTE(review): maxi starts at 0, so even when NO test passes the BH
# threshold the smallest-p test is still reported as significant below.
maxi = 0
for i, val in enumerate(benjhoch):
    if float(val[1]) < (int(val[4]) / m) * Q:
        maxi = i

# Check if test results is significant when using a Benjamini Hochberg
# p-value correction
print(maxi + 1, 'significantly changing expression(s): \n')
sigexpr = []
for val in benjhoch[:(maxi + 1)]:
    au = val[0]
    sigexpr += [au]
    index = np.where(result[:, 2] == [val[2]])[0]
    x = result[index, 3 + output.index(au)].astype(np.float64)
    index = np.where(result[:, 2] == [val[3]])[0]
    y = result[index, 3 + output.index(au)].astype(np.float64)
    # NOTE(review): res is recomputed here but only x / y means are printed.
    res = wilcoxon(x=x, y=y, zero_method='pratt')

    print('Expression: ', val[0], 'significantly changes between '
                                  'conditions', val[2], 'and', val[3])

    print('Average expression activation \n',
          val[2], ':', np.nanmean(x), val[3], ':', np.nanmean(y), '\n')




# df.to_csv('/home/valapil/Project/ForkCausal_Adithya/analysis.csv', index=False)