; Flat key=value settings; no [section] header precedes these keys.
; NOTE(review): confirm the loader skips ';' full-line comments before keeping these notes.
; Presumably optimizer settings (step size and weight-decay coefficient) - confirm against the training code.
learning_rate=0.0001
weight_decay=0.0001
; Presumably the mini-batch size - TODO confirm.
batch=64
; NOTE(review): "emd_dim" looks like an embedding dimension - confirm; hidden_dim/out_dim are presumably layer widths.
emd_dim=32
hidden_dim=64
out_dim=32
; Presumably the convolution kernel width used by the cnn encoder - TODO confirm.
kernel_size=9
; Presumably the number of stacked GRU layers - TODO confirm.
gru_nlayer=3
; Presumably a dropout probability - TODO confirm the expected range.
dropout=0.4
; Comma-separated names with no spaces around the commas; presumably the encoder branches to enable - verify how the loader splits this value.
encoder=cnn,gru,fea,plm
