[pdpd] Specify SEQ_LEN for each batch (#8057)

* Specify SEQ_LEN for each batch * Generate different seq_len for each batch * Remove print
2021-10-27 14:00:13 +08:00 · 2021-10-27 14:00:13 +08:00 · 3ce0f2573a
commit 3ce0f2573a
parent bf8f9164ed
3 changed files with 61 additions and 18 deletions
--- a/ngraph/frontend/paddlepaddle/src/op/lstm.cpp
+++ b/ngraph/frontend/paddlepaddle/src/op/lstm.cpp
@ -94,12 +94,16 @@ struct LSTMNgInputMap {
        auto batch_size_node =
            std::make_shared<opset6::Gather>(shape_of_x, opset6::Constant::create(element::i64, Shape{1}, {0}), axes);
        if (node.has_ng_input("SequenceLength")) {
            m_input_map[LSTMInput::LSTM_INPUT_SEQ_LENGTHS] = node.get_ng_input("SequenceLength");
        } else {
            auto seq_length_node =
-            std::make_shared<opset6::Gather>(shape_of_x, opset6::Constant::create(element::i64, Shape{1}, {1}), axes);
+                std::make_shared<opset6::Gather>(shape_of_x,
-
+                                                 opset6::Constant::create(element::i64, Shape{1}, {1}),
-        // TODO Specify SEQ_LEN for each batch #55404
+                                                 axes);
            m_input_map[LSTMInput::LSTM_INPUT_SEQ_LENGTHS] =
                std::make_shared<opset6::Broadcast>(seq_length_node, batch_size_node);
        }
        auto init_states = node.get_ng_inputs("PreState");
        // 0 for init_h, 1 for init_cell, update bidirect_len for init states
--- a/ngraph/test/frontend/paddlepaddle/op_fuzzy.cpp
+++ b/ngraph/test/frontend/paddlepaddle/op_fuzzy.cpp
@ -189,6 +189,8 @@ static const std::vector<std::string> models{std::string("argmax"),
                                             std::string("rnn_lstm_layer_1_forward"),
                                             std::string("rnn_lstm_layer_2_bidirectional"),
                                             std::string("rnn_lstm_layer_2_forward"),
                                             std::string("rnn_lstm_layer_1_forward_seq_len_4"),
                                             std::string("rnn_lstm_layer_2_bidirectional_seq_len_4"),
                                             std::string("scale_bias_after_float32"),
                                             std::string("scale_bias_after_int32"),
                                             std::string("scale_bias_after_int64"),
--- a/ngraph/test/frontend/paddlepaddle/test_models/gen_scripts/generate_rnn_lstm.py
+++ b/ngraph/test/frontend/paddlepaddle/test_models/gen_scripts/generate_rnn_lstm.py
@ -3,7 +3,7 @@ from save_model import saveModel
 import sys
-def pdpd_rnn_lstm(input_size, hidden_size, layers, direction):
+def pdpd_rnn_lstm(input_size, hidden_size, layers, direction, seq_len):
    import paddle as pdpd
    pdpd.enable_static()
    main_program = pdpd.static.Program()
@ -14,22 +14,40 @@ def pdpd_rnn_lstm(input_size, hidden_size, layers, direction):
        rnn = pdpd.nn.LSTM(input_size, hidden_size, layers, direction)
-        data = pdpd.static.data(name='x', shape=[4, 3, input_size], dtype='float32')
+        data = pdpd.static.data(
-        prev_h = pdpd.ones(shape=[layers * num_of_directions, 4, hidden_size], dtype=np.float32)
+            name='x', shape=[4, 3, input_size], dtype='float32')
-        prev_c = pdpd.ones(shape=[layers * num_of_directions, 4, hidden_size], dtype=np.float32)
+        prev_h = pdpd.ones(
            shape=[layers * num_of_directions, 4, hidden_size], dtype=np.float32)
        prev_c = pdpd.ones(
            shape=[layers * num_of_directions, 4, hidden_size], dtype=np.float32)
        if seq_len:
            seq_lengths = pdpd.static.data(name='sl', shape=[4], dtype='int32')
            y, (h, c) = rnn(data, (prev_h, prev_c), seq_lengths)
        else:
            y, (h, c) = rnn(data, (prev_h, prev_c))
        cpu = pdpd.static.cpu_places(1)
        exe = pdpd.static.Executor(cpu[0])
        exe.run(startup_program)
        if seq_len:
            outs = exe.run(
-            feed={'x': np.ones([4, 3, input_size]).astype(np.float32)},
+                feed={'x': np.ones([4, 3, input_size]).astype(
                    np.float32), 'sl': np.array(seq_len).astype(np.int32)},
                fetch_list=[y, h, c],
                program=main_program)
            saveModel("rnn_lstm_layer_" + str(layers) + '_' + str(direction) + '_seq_len_' + str(len(seq_len)), exe, feedkeys=['x', 'sl'],
                      fetchlist=[y, h, c], inputs=[np.ones([4, 3, input_size]).astype(np.float32), np.array(seq_len).astype(np.int32)], outputs=[outs[0], outs[1], outs[2]], target_dir=sys.argv[1])
        else:
            outs = exe.run(
                feed={'x': np.ones([4, 3, input_size]).astype(
                    np.float32)},
                fetch_list=[y, h, c],
                program=main_program)
            saveModel("rnn_lstm_layer_" + str(layers) + '_' + str(direction), exe, feedkeys=['x'],
                      fetchlist=[y, h, c], inputs=[np.ones([4, 3, input_size]).astype(np.float32)], outputs=[outs[0], outs[1], outs[2]], target_dir=sys.argv[1])
    return outs[0]
@ -41,26 +59,45 @@ if __name__ == "__main__":
            'hidden_size': 2,
            'layers': 1,
            'direction': 'forward',
            'seq_len': [],
        },
        {
            'input_size': 2,
            'hidden_size': 2,
            'layers': 1,
            'direction': 'bidirectional',
            'seq_len': [],
        },
        {
            'input_size': 2,
            'hidden_size': 2,
            'layers': 2,
            'direction': 'forward',
            'seq_len': [],
        },
        {
            'input_size': 2,
            'hidden_size': 2,
            'layers': 2,
            'direction': 'bidirectional',
            'seq_len': [],
        },
        {
            'input_size': 2,
            'hidden_size': 2,
            'layers': 1,
            'direction': 'forward',
            'seq_len': [1, 2, 3, 3],
        },
        {
            'input_size': 2,
            'hidden_size': 2,
            'layers': 2,
            'direction': 'bidirectional',
            'seq_len': [2, 2, 3, 3],
        }
    ]
    for test in testCases:
-        pdpd_rnn_lstm(test['input_size'], test['hidden_size'], test['layers'], test['direction'])
+        pdpd_rnn_lstm(test['input_size'], test['hidden_size'],
                      test['layers'], test['direction'], test['seq_len'])