bilstm1  res = 0.752083426
input_keep_prob_ = 0.5
output_keep_prob_ = 0.5
lstmUnitNum = 128
attn_length = -1
attention_size = 256
layer_num = 2 (multi)
forget_bias = 0.5

bilstm2  res = 0.758998285
input_keep_prob_ = 0.5
output_keep_prob_ = 0.5
lstmUnitNum = 128
attn_length = -1
attention_size = 256
layer_num = 2 (stack)
forget_bias = 0.5

hbilstm1  res = 0.761818637
input_keep_prob_ = 0.5
output_keep_prob_ = 0.5
lstmUnitNum = 100
attn_length = -1
attention_size = 256
layer_num = 1
forget_bias = 0.5
note: input + output1 -> output2

hbilstm2  res = 0.762948876
input_keep_prob_ = 0.5
output_keep_prob_ = 0.5
lstmUnitNum = 100
attn_length = -1
attention_size = 256
layer_num = 1
forget_bias = 0.5
note: output1 + output2 -> output