Skip to content

Commit

Permalink
Avoid generating variables for RNNs without biases. (LaurentMazare#303)
Browse files: browse the repository at this point in the history
  • Loading branch information
LaurentMazare authored Dec 18, 2020
1 parent c298235 commit c30de83
Show file tree
Hide file tree
Showing 2 changed files with 20 additions and 8 deletions.
20 changes: 12 additions & 8 deletions src/nn/rnn.rs
Original file line number Diff line number Diff line change
Expand Up @@ -102,12 +102,14 @@ pub fn lstm(vs: &super::var_store::Path, in_dim: i64, hidden_dim: i64, c: RNNCon
&format!("weight_hh_l{}{}", layer_idx, suffix),
&[gate_dim, hidden_dim],
);
let b_ih = vs.zeros(&format!("bias_ih_l{}{}", layer_idx, suffix), &[gate_dim]);
let b_hh = vs.zeros(&format!("bias_hh_l{}{}", layer_idx, suffix), &[gate_dim]);
flat_weights.push(w_ih);
flat_weights.push(w_hh);
flat_weights.push(b_ih);
flat_weights.push(b_hh);
if c.has_biases {
let b_ih = vs.zeros(&format!("bias_ih_l{}{}", layer_idx, suffix), &[gate_dim]);
let b_hh = vs.zeros(&format!("bias_hh_l{}{}", layer_idx, suffix), &[gate_dim]);
flat_weights.push(b_ih);
flat_weights.push(b_hh);
}
}
}
if vs.device().is_cuda() && crate::Cuda::cudnn_is_available() {
Expand Down Expand Up @@ -206,12 +208,14 @@ pub fn gru(vs: &super::var_store::Path, in_dim: i64, hidden_dim: i64, c: RNNConf
&format!("weight_hh_l{}{}", layer_idx, suffix),
&[gate_dim, hidden_dim],
);
let b_ih = vs.zeros(&format!("bias_ih_l{}{}", layer_idx, suffix), &[gate_dim]);
let b_hh = vs.zeros(&format!("bias_hh_l{}{}", layer_idx, suffix), &[gate_dim]);
flat_weights.push(w_ih);
flat_weights.push(w_hh);
flat_weights.push(b_ih);
flat_weights.push(b_hh);
if c.has_biases {
let b_ih = vs.zeros(&format!("bias_ih_l{}{}", layer_idx, suffix), &[gate_dim]);
let b_hh = vs.zeros(&format!("bias_hh_l{}{}", layer_idx, suffix), &[gate_dim]);
flat_weights.push(b_ih);
flat_weights.push(b_hh);
}
}
}
if vs.device().is_cuda() && crate::Cuda::cudnn_is_available() {
Expand Down
8 changes: 8 additions & 0 deletions tests/nn_tests.rs
Original file line number Diff line number Diff line change
Expand Up @@ -165,6 +165,10 @@ fn gru_test(rnn_config: nn::RNNConfig) {
#[test]
fn gru() {
gru_test(Default::default());
gru_test(nn::RNNConfig {
has_biases: false,
..Default::default()
});
gru_test(nn::RNNConfig {
bidirectional: true,
..Default::default()
Expand Down Expand Up @@ -210,6 +214,10 @@ fn lstm_test(rnn_config: nn::RNNConfig) {
#[test]
fn lstm() {
lstm_test(Default::default());
lstm_test(nn::RNNConfig {
has_biases: false,
..Default::default()
});
lstm_test(nn::RNNConfig {
bidirectional: true,
..Default::default()
Expand Down

0 comments on commit c30de83

Please sign in to comment.