digraph { node1 [label="Input0 [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=0.0,parameter_size=0.0]"] node4 [label="Embedding(32320, 1024, padding_idx=0) [forward_compute_time=0.073,backward_compute_time=6.949,activation_size=6291456.0,parameter_size=132382720.0]"] node5 [label="EmuBidirLSTM( (bidir): LSTM(1024, 1024, bidirectional=True) (layer1): LSTM(1024, 1024) (layer2): LSTM(1024, 1024) ) [forward_compute_time=5.247,backward_compute_time=0.016,activation_size=12582912.0,parameter_size=67174400.0]"] node2 [label="Input1 [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=0.0,parameter_size=0.0]"] node6 [label="Dropout(p=0.2) [forward_compute_time=0.077,backward_compute_time=0.196,activation_size=12582912.0,parameter_size=0.0]"] node7 [label="LSTM(2048, 1024) [forward_compute_time=3.190,backward_compute_time=5.348,activation_size=[6291456.0, 131072.0, 131072.0],parameter_size=50364416.0]"] node8 [label="__getitem__(0) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6291456.0,parameter_size=0.0]"] node9 [label="__getitem__(1) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=131072.0,parameter_size=0.0]"] node10 [label="Dropout(p=0.2) [forward_compute_time=0.064,backward_compute_time=0.128,activation_size=6291456.0,parameter_size=0.0]"] node11 [label="LSTM(1024, 1024) [forward_compute_time=2.491,backward_compute_time=4.203,activation_size=[6291456.0, 131072.0, 131072.0],parameter_size=33587200.0]"] node12 [label="__getitem__(0) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6291456.0,parameter_size=0.0]"] node13 [label="__getitem__(1) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=131072.0,parameter_size=0.0]"] node14 [label="Add [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6291456.0,parameter_size=0.0]"] node15 [label="Dropout(p=0.2) [forward_compute_time=0.059,backward_compute_time=0.121,activation_size=6291456.0,parameter_size=0.0]"] node16 [label="LSTM(1024, 1024) [forward_compute_time=2.492,backward_compute_time=4.201,activation_size=[6291456.0, 131072.0, 131072.0],parameter_size=33587200.0]"] node17 [label="__getitem__(0) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6291456.0,parameter_size=0.0]"] node18 [label="__getitem__(1) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=131072.0,parameter_size=0.0]"] node19 [label="Add [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6291456.0,parameter_size=0.0]"] node3 [label="Input2 [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=0.0,parameter_size=0.0]"] node21 [label="Embedding(32320, 1024, padding_idx=0) [forward_compute_time=0.066,backward_compute_time=0.328,activation_size=6291456.0,parameter_size=132382720.0]"] node20 [label="hidden [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=0.0,parameter_size=0.0]"] node22 [label="__getitem__(0) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=0.0,parameter_size=0.0]"] node23 [label="RecurrentAttention( (rnn): LSTM(1024, 1024) (attn): BahdanauAttention( (linear_q): Linear(in_features=1024, out_features=1024, bias=False) (linear_k): Linear(in_features=1024, out_features=1024, bias=False) (dropout): Dropout(p=0) ) (dropout): Dropout(p=0) ) [forward_compute_time=4.546,backward_compute_time=6.141,activation_size=[6160384.0, 131072.0, 131072.0, 6160384.0, 288768.0],parameter_size=41979904.0]"] node24 [label="__getitem__(0) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6160384.0,parameter_size=0.0]"] node25 [label="__getitem__(1) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=131072.0,parameter_size=0.0]"] node26 [label="__getitem__(2) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=131072.0,parameter_size=0.0]"] node27 [label="__getitem__(3) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6160384.0,parameter_size=0.0]"] node28 [label="Dropout(p=0.2) [forward_compute_time=0.058,backward_compute_time=0.176,activation_size=6160384.0,parameter_size=0.0]"] node29 [label="Concat(2) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6160384.0,parameter_size=0.0]"] node30 [label="__getitem__(1) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=0.0,parameter_size=0.0]"] node31 [label="LSTM(2048, 1024) [forward_compute_time=3.151,backward_compute_time=5.288,activation_size=[6160384.0, 131072.0, 131072.0],parameter_size=50364416.0]"] node32 [label="__getitem__(0) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6160384.0,parameter_size=0.0]"] node33 [label="__getitem__(1) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=131072.0,parameter_size=0.0]"] node34 [label="Dropout(p=0.2) [forward_compute_time=0.061,backward_compute_time=0.174,activation_size=6160384.0,parameter_size=0.0]"] node35 [label="Concat(2) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6160384.0,parameter_size=0.0]"] node36 [label="__getitem__(2) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=0.0,parameter_size=0.0]"] node37 [label="LSTM(2048, 1024) [forward_compute_time=3.145,backward_compute_time=5.306,activation_size=[6160384.0, 131072.0, 131072.0],parameter_size=50364416.0]"] node38 [label="__getitem__(0) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6160384.0,parameter_size=0.0]"] node39 [label="__getitem__(1) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=131072.0,parameter_size=0.0]"] node40 [label="Add [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6160384.0,parameter_size=0.0]"] node41 [label="Dropout(p=0.2) [forward_compute_time=0.055,backward_compute_time=0.198,activation_size=6160384.0,parameter_size=0.0]"] node42 [label="Concat(2) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6160384.0,parameter_size=0.0]"] node43 [label="__getitem__(3) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=0.0,parameter_size=0.0]"] node44 [label="LSTM(2048, 1024) [forward_compute_time=3.149,backward_compute_time=15.883,activation_size=[6160384.0, 131072.0, 131072.0],parameter_size=50364416.0]"] node45 [label="__getitem__(0) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6160384.0,parameter_size=0.0]"] node46 [label="__getitem__(1) [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=131072.0,parameter_size=0.0]"] node47 [label="Add [forward_compute_time=0.000,backward_compute_time=0.000,activation_size=6160384.0,parameter_size=0.0]"] node48 [label="Classifier( (classifier): Linear(in_features=1024, out_features=32320, bias=True) ) [forward_compute_time=5.609,backward_compute_time=1.227,activation_size=194437120.0,parameter_size=132512000.0]"] node1 -> node4 node4 -> node5 node5 -> node6 node2 -> node5 node2 -> node23 node6 -> node7 node7 -> node8 node7 -> node9 node8 -> node10 node8 -> node14 node10 -> node11 node11 -> node12 node11 -> node13 node12 -> node14 node14 -> node15 node14 -> node19 node15 -> node16 node16 -> node17 node16 -> node18 node17 -> node19 node19 -> node23 node3 -> node21 node21 -> node23 node20 -> node22 node20 -> node30 node20 -> node36 node20 -> node43 node22 -> node23 node23 -> node24 node23 -> node25 node23 -> node26 node23 -> node27 node24 -> node28 node26 -> node29 node26 -> node35 node26 -> node42 node28 -> node29 node29 -> node31 node30 -> node31 node31 -> node32 node31 -> node33 node32 -> node34 node32 -> node40 node34 -> node35 node35 -> node37 node36 -> node37 node37 -> node38 node37 -> node39 node38 -> node40 node40 -> node41 node40 -> node47 node41 -> node42 node42 -> node44 node43 -> node44 node44 -> node45 node44 -> node46 node45 -> node47 node47 -> node48 }