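# NOTE(review): the following lines look like file-viewer page residue
# (uploader, commit message, short commit hash, toolbar labels, file size),
# not configuration keys. Kept as comments so the file parses; confirm and drop.
# rediska0123's picture
# Uploading model
# dce12d3
# raw
# history blame contribute delete
# 413 Bytes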
# Feature extractors: a list of entries, each selected by a dotted `name`
# and followed by the options that belong to that entry.
feature_extractor:
- name: luq.feature_extractors.basic_hidden_states
  # Negative layer indices; presumably counted from the last layer
  # (-1 = final layer) -- TODO confirm against the extractor implementation.
  layer_nums:
  - -1
  - -5
  - -16
- name: luq.feature_extractors.basic_attention
  # Same index convention as above is assumed -- TODO confirm.
  layer_nums:
  - -1
  - -5
  - -10
  - -16
  - -20
  - -25
- name: luq.feature_extractors.token_probabilities
  # Presumably how many top-ranked token probabilities are kept -- TODO confirm.
  top_n: 3
# Settings for the uncertainty head. All keys below belong to this mapping;
# they must be indented under it, otherwise `uncertainty_head` parses as null
# and the settings become unrelated top-level keys.
uncertainty_head:
  head_dim: 4096
  n_layers: 1
  n_heads: 32
  dropout: 0.1
  enable_feature_projection_layer: true
  # Presumably the projection width used when the feature projection layer
  # is enabled -- TODO confirm against the head implementation.
  interim_dim: 1024