-
Notifications
You must be signed in to change notification settings - Fork 3
Expand file tree
/
Copy pathglobal_values.py
More file actions
80 lines (68 loc) · 2.72 KB
/
global_values.py
File metadata and controls
80 lines (68 loc) · 2.72 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
import os
import config
BASE_DIR = '/home/yzk/dds-avec2019/'
TRAIN_SET_NAME = 'train_split_Depression_AVEC2017.csv'
DEL_SET_NAME = 'dev_split_Depression_AVEC2017.csv'
# COVAREP's clomuns
COVAREP_COLUMNS = ['F0', 'VUV', 'NAQ', 'QOQ', 'H1H2', 'HRF', 'PSP', 'MDQ', 'peakSlope',
'Rd', 'Rd_conf']
for i in range(25): COVAREP_COLUMNS.append('MCEP_' + str(i))
for i in range(25): COVAREP_COLUMNS.append('HMPDM_' + str(i))
for i in range(13): COVAREP_COLUMNS.append('HMPDD_' + str(i))
"""
F0 - Fundamental Frequnency; 原始的声带振动频率,决定了声音的初始音高;一般是在语谱图中最低的共振峰;
VUV - 0,1 表示声音的有无
NAQ - Normalized amplitude quotient
QOQ - quasi-open quotient
-------------以下是频域
H1H2 - the difference in amplitude of the first two harmonics of the differentiated glottal source spectrum
HRF - Harmonic richness factor
PSP - Parabolic spectral parameter
MDQ - The Maxima Dispersion Quotient (MDQ) quantifies how impulse-like the
glottal excitation is through wavelet analysis of the Linear Prediction(LP) residual
peakSlope - A parameter which is essentially a correlate of spectral tilt, derived
following wavelet analysis. This parameter is effective at discriminating
lax-tense phonation types
---------- 主要针对LF model
Rd - estimation of the LF glottal model using Mean Squared Phase (MSP)
Rd_conf - a confidence value between 0 (lowest confidence) to 1 (best confidence).
This last value describes how well the glottal model fits the signal.
---------- HM 谐波模型 主要研究谐波的相位表示
HM PDD - Phase Distortion 导数
HM PDM - Phase Distortion Mean
"""
PREFIX = [folder[:-1] for folder in os.listdir(config.data_dir + '/avec') \
if folder.endswith('P')]
IDS = [item[:3] for item in PREFIX]
SUFFIX = {
'wav': 'AUDIO.wav',
'face_3d': 'CLNF_features3D.txt',
'face_2d': 'CLNF_features.txt',
'gaze': 'CLNF_gaze.txt',
'pose': 'CLNF_pose.txt',
'formant': 'FORMANT.csv',
'text': 'TRANSCRIPT.csv',
'au': 'CLNF_AUs.txt',
'hog': 'CLNF_hog.bin',
'covarep': 'COVAREP.csv'
}
# formant.csv columns
FORMANT_COLUMNS = ['formant_0', 'formant_1', 'formant_2', 'formant_3', 'formant_4']
# column name of video
POSE_COLUMNS = ['Tx', 'Ty', 'Tz', 'Rx', 'Ry', 'Rz']
EXP1_FACE_COLUMNS = ['right_eye_h', 'left_eye_h', 'left_eye_v', 'right_eye_v',
'mouth_v', 'mouth_h', 'eyebrow_h', 'eyebrow_v']
# feature's name
FEATURE_EXP_1 = 'exp1'
FEATURE_EXP_2 = 'exp2'
FEATURE_BL = 'baseline'
# model's name
MODEL_RF = 'rf'
AUDIO_TABLE = set([
config.tbl_exp2_audio_fea
])
VIDEO_TABLE = set([
config.tbl_exp1_face_fea,
config.tbl_exp1_head_fea
])
TEXT_TABLE = set([])