File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 6161#define KEY_SAM_N_EMBD " clip.vision.sam.embedding_length"
6262// audio-specific
6363#define KEY_AUDIO_PROJ_TYPE " clip.audio.projector_type" // for models with mixed modalities
64- #define KEY_A_NUM_MEL_BINS " clip.audio.num_mel_bins"
65- #define KEY_A_PROJ_STACK_FACTOR " clip.audio.projector.stack_factor"
66- #define KEY_A_CHUNK_SIZE " clip.audio.chunk_size"
67- #define KEY_A_CONV_KERNEL_SIZE " clip.audio.conv_kernel_size"
68- #define KEY_A_MAX_POS_EMB " clip.audio.max_pos_emb"
69- #define KEY_A_PROJ_WINDOW_SIZE " clip.audio.projector.window_size"
70- #define KEY_A_PROJ_DOWNSAMPLE_RATE " clip.audio.projector.downsample_rate"
71- #define KEY_A_PROJ_HEAD_COUNT " clip.audio.projector.head_count"
72- #define KEY_A_PROJ_LAYERNORM_EPS " clip.audio.projector.layer_norm_epsilon"
64+ #define KEY_A_NUM_MEL_BINS " clip.audio.num_mel_bins"
65+ #define KEY_A_PROJ_STACK_FACTOR " clip.audio.projector.stack_factor"
66+ #define KEY_A_CHUNK_SIZE " clip.audio.chunk_size"
67+ #define KEY_A_CONV_KERNEL_SIZE " clip.audio.conv_kernel_size"
68+ #define KEY_A_MAX_POS_EMB " clip.audio.max_pos_emb"
69+ #define KEY_A_PROJ_WINDOW_SIZE " clip.audio.projector.window_size"
70+ #define KEY_A_PROJ_DOWNSAMPLE_RATE " clip.audio.projector.downsample_rate"
71+ #define KEY_A_PROJ_HEAD_COUNT " clip.audio.projector.head_count"
72+ #define KEY_A_PROJ_LAYERNORM_EPS " clip.audio.projector.layer_norm_epsilon"
7373
7474
7575//
You can’t perform that action at this time.
0 commit comments