resPyre/deep/BigSmall/predict_vitals.py at main · phuselab/resPyre · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
import torch
from .BigSmall import BigSmall
import numpy as np
import cv2
from .preprocess import preprocess_frames, extract_raw
import os
from scipy import signal
from scipy.signal import butter, filtfilt
import matplotlib.pyplot as plt
from collections import OrderedDict

def format_data_shape(data):
    """Flatten the big/small clip tensors into per-frame batches, in place.

    Args:
        data: Mutable sequence whose items 0 and 1 are the "big" and "small"
            clip tensors. Each must be 5-D; after axes 2 and 4 are swapped
            the dimensions are unpacked as ``(N, D, C, H, W)``.

    Returns:
        The same ``data`` object, with items 0 and 1 replaced by tensors of
        shape ``(N * D, C, H, W)`` cut down to a multiple of 3 frames.
    """
    base_len = 3

    def _fold_clip(clip):
        # Swap axes 2 and 4, then merge the two leading axes into one.
        clip = torch.swapaxes(clip, 2, 4)
        n, d, c, h, w = clip.shape
        return clip.view(n * d, c, h, w), n * d

    big_frames, _ = _fold_clip(data[0])
    small_frames, small_total = _fold_clip(data[1])

    # Both streams are truncated with the frame count of the *small* clip,
    # rounded down to a whole number of base_len-sized chunks (the original
    # comment ties this step to the temporal shift module).
    usable = small_total // base_len * base_len
    data[0] = big_frames[:usable]
    data[1] = small_frames[:usable]
    return data


def send_data_to_device(data, device):
    """Move the big and small tensors onto ``device``.

    Args:
        data: Indexable holding the big tensor at 0 and the small tensor at 1.
        device: Target passed straight to ``Tensor.to``.

    Returns:
        tuple: ``(big_on_device, small_on_device)``.
    """
    return (data[0].to(device), data[1].to(device))


def define_model():
    """Instantiate the BigSmall network used for inference.

    No checkpoint is loaded here; the caller is responsible for loading
    weights into the returned model.

    Returns:
        BigSmall: A new model built with ``n_segment=3``.
    """
    # n_segment=3 agrees with the chunk length of 3 frames that
    # format_data_shape truncates its batches to.
    return BigSmall(n_segment=3)

##########################################################
######################### CONFIGS ########################
##########################################################

# Preprocessing configuration handed to preprocess_frames().
config_preprocess = {
    # Data / frame processing
    'BIG_DATA_TYPE': ["Standardized"],  # Default: ["Standardized"]
    'BIG_W': 144,  # Default: 144
    'BIG_H': 144,  # Default: 144
    'SMALL_DATA_TYPE': ["Normalized"],  # Default: ["Normalized"]
    'SMALL_W': 9,  # Default: 9
    'SMALL_H': 9,  # Default: 9
    # Resize parameters
    'DYNAMIC_DETECTION': False,  # Default: False
    'DYNAMIC_DETECTION_FREQUENCY': False,  # Default: False
    'LARGE_FACE_BOX': False,  # Default: False
    'CROP_FACE': False,  # Default: False
    'LARGE_BOX_COEF': False,  # Default: False
    'DATASET': 'bp4d',
}


##########################################################
######################### MAIN ###########################
##########################################################


def predict_vitals(frames):
    """Run the pretrained BigSmall model on ``frames`` and return its third output.

    The frames are preprocessed with ``preprocess_frames`` using the
    module-level ``config_preprocess``, reshaped by ``format_data_shape``
    and passed through a BigSmall model on the CPU.

    Args:
        frames: Input accepted by ``preprocess_frames`` (its exact
            shape/dtype is defined by that helper -- TODO confirm).

    Returns:
        numpy.ndarray: The third element of the model's output tuple
        (named ``resp_out`` here; presumably the respiration signal --
        confirm against the BigSmall model definition).

    Raises:
        ValueError: If the checkpoint file does not exist at the hard-coded
            relative path.
    """
    big_clip, small_clip = preprocess_frames(frames, config_preprocess)
    data = [torch.Tensor(big_clip), torch.Tensor(small_clip)]

    print("\n=== Loading pretrained weights ===\n")

    # Relative path: it is resolved against the current working directory,
    # not against the location of this file.
    model_path = "deep/BigSmall/checkpoints/BP4D_BigSmall_Multitask_Fold1.pth"
    print("Testing uses pretrained model!")
    print('Model path:', model_path)
    if not os.path.exists(model_path):
        raise ValueError("Inference model path error!")

    model = define_model()

    # Inference is pinned to the CPU; no CUDA device selection is performed.
    device = 'cpu'

    # NOTE(security): torch.load unpickles the file, so only trusted
    # checkpoints must be loaded here.
    weights = torch.load(model_path, map_location=torch.device(device))

    # Strip a leading 'module.' from each key (presumably left by a
    # DataParallel-style wrapper at training time). Only the prefix is
    # removed, so keys that merely contain 'module.' further in, such as
    # 'submodule.x', are left intact.
    prefix = 'module.'
    state_dict = OrderedDict(
        (key[len(prefix):] if key.startswith(prefix) else key, value)
        for key, value in weights.items()
    )
    model.load_state_dict(state_dict)
    model = model.to(device)
    model.eval()

    print("\n=== Inference ===\n")

    with torch.no_grad():
        # Flatten the clips into per-frame batches and move them to the device.
        data = format_data_shape(data)
        data = send_data_to_device(data, device)

        # The model returns three outputs; only the third one is used.
        _, _, resp_out = model(data)

    resp_out_np = resp_out.cpu().detach().numpy()

    # Drop the model reference and release any cached CUDA memory before
    # handing the result back.
    del model
    torch.cuda.empty_cache()

    return resp_out_np

# NOTE: everything below is a module-level string literal, not live code; it
# is evaluated as a no-op expression and never executed. It preserves a former
# command-line entry point (argument parsing, band-pass filtering, Welch
# spectrum and plotting of the estimated rate).
# NOTE(review): it cannot be re-enabled as-is -- it uses `argparse`, which is
# not among the imports visible in this file, passes a video path to
# predict_vitals() although that function now takes frames, and calls
# `.detach().cpu().numpy()` on a result that predict_vitals() already returns
# as a NumPy array.
'''
if __name__ == "__main__":

    parser = argparse.ArgumentParser()
    parser.add_argument('--video_path', type=str, help='processed video path')
    parser.add_argument('--sampling_rate', type=int, default = 30, help='sampling rate of your video')
    args = parser.parse_args()

    sample_data_path = args.video_path

    resp_out = predict_vitals(sample_data_path)

    print("\n=== Plotting ===\n")

    resp_sig = np.squeeze(resp_out.detach().cpu().numpy())
    b, a = butter(N=2, Wn=[0.1, 0.5], fs=25, btype='bandpass')
    filtered_sig = filtfilt(b, a, resp_sig)

    #WELCH Estimations params
    fps = 25
    win_size = 30
    nyquistF_est = fps/2
    fRes = 0.1
    nFFT_est = max(2048, (60*2*nyquistF_est) / fRes)
    minF = 0
    maxF = 0.65

    F, P = signal.welch(filtered_sig, nperseg=win_size*fps, noverlap=fps*(win_size-1), fs=fps, nfft=nFFT_est)
    band = np.argwhere((F > 0.1) & (F < 0.65)).flatten()
    RR = F[band][np.argmax(P[band])] * 60

    plt.plot(filtered_sig)
    plt.grid()
    plt.figure()
    plt.plot(F,P)
    plt.grid()
    plt.axvline(x=0.1, ymin=0, ymax=1, c='r')
    plt.axvline(x=maxF, ymin=0, ymax=1, c='r')
    plt.xlim([0,maxF+0.5])
    plt.title("RR: "+str(round(RR,2))+" resp/min")
    plt.show()
'''