diff --git "a/compressed_graph.dot" "b/compressed_graph.dot" new file mode 100644--- /dev/null +++ "b/compressed_graph.dot" @@ -0,0 +1,1274 @@ +strict digraph { +"0 /nncf_model_input_0"; +"1 /nncf_model_input_1"; +"2 GPT2LMHeadModel/GPT2Model[transformer]/view_0"; +"3 GPT2LMHeadModel/GPT2Model[transformer]/view_1"; +"4 GPT2LMHeadModel/GPT2Model[transformer]/__getitem___0"; +"5 GPT2LMHeadModel/GPT2Model[transformer]/NNCFEmbedding[wte]/embedding_0"; +"6 GPT2LMHeadModel/GPT2Model[transformer]/NNCFEmbedding[wpe]/embedding_0"; +"7 GPT2LMHeadModel/GPT2Model[transformer]/__add___0"; +"8 GPT2LMHeadModel/GPT2Model[transformer]/Dropout[drop]/dropout_0"; +"9 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"10 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"11 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"12 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"13 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/split_0"; +"14 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_0"; +"15 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_0"; +"16 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_1"; +"17 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_1"; +"18 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_2"; +"19 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_2"; +"20 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/transpose_0"; +"21 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_0"; +"22 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/full_0"; +"23 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__truediv___0"; +"24 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/full_1"; +"25 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/where_0"; +"26 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__add___0"; +"27 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/softmax_0"; +"28 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/type_0"; +"29 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"30 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_1"; +"31 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_3"; +"32 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/contiguous_0"; +"33 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_3"; +"34 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"35 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"36 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"37 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"38 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___0"; +"39 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"40 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"41 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"42 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"43 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"44 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"45 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"46 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"47 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"48 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"49 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"50 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"51 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"52 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"53 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"54 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"55 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___1"; +"56 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"57 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"58 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"59 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"60 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/split_0"; +"61 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_0"; +"62 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_0"; +"63 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_1"; +"64 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_1"; +"65 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_2"; +"66 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_2"; +"67 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/transpose_0"; +"68 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_0"; +"69 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/full_0"; +"70 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__truediv___0"; +"71 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/full_1"; +"72 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/where_0"; +"73 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__add___0"; +"74 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/softmax_0"; +"75 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/type_0"; +"76 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"77 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_1"; +"78 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_3"; +"79 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/contiguous_0"; +"80 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_3"; +"81 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"82 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"83 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"84 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"85 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___0"; +"86 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"87 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"88 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"89 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"90 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"91 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"92 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"93 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"94 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"95 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"96 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"97 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"98 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"99 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"100 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"101 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"102 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___1"; +"103 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"104 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"105 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"106 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"107 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/split_0"; +"108 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_0"; +"109 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_0"; +"110 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_1"; +"111 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_1"; +"112 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_2"; +"113 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_2"; +"114 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/transpose_0"; +"115 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_0"; +"116 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/full_0"; +"117 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__truediv___0"; +"118 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/full_1"; +"119 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/where_0"; +"120 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__add___0"; +"121 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/softmax_0"; +"122 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/type_0"; +"123 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"124 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_1"; +"125 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_3"; +"126 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/contiguous_0"; +"127 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_3"; +"128 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"129 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"130 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"131 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"132 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___0"; +"133 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"134 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"135 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"136 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"137 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"138 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"139 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"140 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"141 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"142 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"143 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"144 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"145 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"146 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"147 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"148 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"149 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___1"; +"150 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"151 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"152 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"153 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"154 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/split_0"; +"155 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_0"; +"156 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_0"; +"157 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_1"; +"158 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_1"; +"159 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_2"; +"160 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_2"; +"161 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/transpose_0"; +"162 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_0"; +"163 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/full_0"; +"164 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__truediv___0"; +"165 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/full_1"; +"166 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/where_0"; +"167 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__add___0"; +"168 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/softmax_0"; +"169 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/type_0"; +"170 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"171 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_1"; +"172 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_3"; +"173 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/contiguous_0"; +"174 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_3"; +"175 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"176 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"177 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"178 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"179 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___0"; +"180 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"181 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"182 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"183 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"184 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"185 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"186 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"187 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"188 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"189 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"190 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"191 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"192 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"193 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"194 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"195 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"196 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___1"; +"197 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"198 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"199 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"200 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"201 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/split_0"; +"202 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_0"; +"203 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_0"; +"204 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_1"; +"205 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_1"; +"206 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_2"; +"207 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_2"; +"208 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/transpose_0"; +"209 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_0"; +"210 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/full_0"; +"211 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__truediv___0"; +"212 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/full_1"; +"213 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/where_0"; +"214 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__add___0"; +"215 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/softmax_0"; +"216 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/type_0"; +"217 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"218 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_1"; +"219 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_3"; +"220 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/contiguous_0"; +"221 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_3"; +"222 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"223 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"224 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"225 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"226 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___0"; +"227 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"228 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"229 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"230 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"231 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"232 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"233 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"234 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"235 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"236 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"237 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"238 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"239 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"240 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"241 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"242 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"243 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___1"; +"244 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"245 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"246 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"247 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"248 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/split_0"; +"249 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_0"; +"250 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_0"; +"251 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_1"; +"252 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_1"; +"253 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_2"; +"254 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_2"; +"255 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/transpose_0"; +"256 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_0"; +"257 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/full_0"; +"258 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__truediv___0"; +"259 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/full_1"; +"260 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/where_0"; +"261 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__add___0"; +"262 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/softmax_0"; +"263 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/type_0"; +"264 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"265 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_1"; +"266 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_3"; +"267 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/contiguous_0"; +"268 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_3"; +"269 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"270 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"271 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"272 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"273 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___0"; +"274 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"275 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"276 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"277 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"278 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"279 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"280 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"281 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"282 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"283 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"284 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"285 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"286 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"287 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"288 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"289 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"290 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___1"; +"291 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"292 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"293 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"294 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"295 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/split_0"; +"296 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_0"; +"297 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_0"; +"298 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_1"; +"299 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_1"; +"300 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_2"; +"301 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_2"; +"302 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/transpose_0"; +"303 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_0"; +"304 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/full_0"; +"305 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__truediv___0"; +"306 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/full_1"; +"307 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/where_0"; +"308 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__add___0"; +"309 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/softmax_0"; +"310 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/type_0"; +"311 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"312 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_1"; +"313 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_3"; +"314 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/contiguous_0"; +"315 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_3"; +"316 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"317 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"318 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"319 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"320 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___0"; +"321 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"322 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"323 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"324 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"325 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"326 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"327 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"328 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"329 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"330 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"331 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"332 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"333 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"334 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"335 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"336 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"337 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___1"; +"338 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"339 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"340 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"341 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"342 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/split_0"; +"343 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_0"; +"344 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_0"; +"345 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_1"; +"346 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_1"; +"347 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_2"; +"348 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_2"; +"349 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/transpose_0"; +"350 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_0"; +"351 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/full_0"; +"352 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__truediv___0"; +"353 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/full_1"; +"354 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/where_0"; +"355 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__add___0"; +"356 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/softmax_0"; +"357 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/type_0"; +"358 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"359 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_1"; +"360 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_3"; +"361 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/contiguous_0"; +"362 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_3"; +"363 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"364 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"365 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"366 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"367 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___0"; +"368 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"369 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"370 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"371 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"372 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"373 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"374 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"375 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"376 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"377 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"378 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"379 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"380 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"381 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"382 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"383 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"384 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___1"; +"385 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"386 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"387 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"388 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"389 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/split_0"; +"390 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_0"; +"391 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_0"; +"392 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_1"; +"393 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_1"; +"394 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_2"; +"395 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_2"; +"396 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/transpose_0"; +"397 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_0"; +"398 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/full_0"; +"399 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__truediv___0"; +"400 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/full_1"; +"401 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/where_0"; +"402 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__add___0"; +"403 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/softmax_0"; +"404 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/type_0"; +"405 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"406 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_1"; +"407 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_3"; +"408 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/contiguous_0"; +"409 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_3"; +"410 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"411 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"412 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"413 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"414 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___0"; +"415 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"416 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"417 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"418 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"419 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"420 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"421 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"422 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"423 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"424 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"425 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"426 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"427 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"428 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"429 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"430 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"431 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___1"; +"432 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"433 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"434 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"435 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"436 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/split_0"; +"437 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_0"; +"438 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_0"; +"439 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_1"; +"440 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_1"; +"441 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_2"; +"442 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_2"; +"443 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/transpose_0"; +"444 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_0"; +"445 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/full_0"; +"446 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__truediv___0"; +"447 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/full_1"; +"448 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/where_0"; +"449 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__add___0"; +"450 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/softmax_0"; +"451 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/type_0"; +"452 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"453 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_1"; +"454 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_3"; +"455 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/contiguous_0"; +"456 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_3"; +"457 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"458 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"459 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"460 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"461 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___0"; +"462 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"463 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"464 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"465 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"466 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"467 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"468 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"469 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"470 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"471 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"472 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"473 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"474 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"475 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"476 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"477 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"478 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___1"; +"479 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"480 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"481 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"482 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"483 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/split_0"; +"484 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_0"; +"485 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_0"; +"486 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_1"; +"487 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_1"; +"488 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_2"; +"489 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_2"; +"490 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/transpose_0"; +"491 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_0"; +"492 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/full_0"; +"493 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__truediv___0"; +"494 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/full_1"; +"495 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/where_0"; +"496 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__add___0"; +"497 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/softmax_0"; +"498 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/type_0"; +"499 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"500 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_1"; +"501 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_3"; +"502 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/contiguous_0"; +"503 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_3"; +"504 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"505 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"506 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"507 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"508 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___0"; +"509 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"510 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"511 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"512 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"513 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"514 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"515 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"516 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"517 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"518 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"519 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"520 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"521 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"522 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"523 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"524 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"525 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___1"; +"526 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_1]/layer_norm_0"; +"527 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_0"; +"528 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0"; +"529 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_1"; +"530 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/split_0"; +"531 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_0"; +"532 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_0"; +"533 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_1"; +"534 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_1"; +"535 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_2"; +"536 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_2"; +"537 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/transpose_0"; +"538 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_0"; +"539 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/full_0"; +"540 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__truediv___0"; +"541 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/full_1"; +"542 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/where_0"; +"543 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__add___0"; +"544 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/softmax_0"; +"545 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/type_0"; +"546 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0"; +"547 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_1"; +"548 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_3"; +"549 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/contiguous_0"; +"550 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_3"; +"551 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_0"; +"552 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0"; +"553 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_1"; +"554 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0"; +"555 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___0"; +"556 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_2]/layer_norm_0"; +"557 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0"; +"558 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0"; +"559 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1"; +"560 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0"; +"561 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0"; +"562 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1"; +"563 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0"; +"564 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2"; +"565 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0"; +"566 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0"; +"567 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0"; +"568 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0"; +"569 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0"; +"570 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1"; +"571 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0"; +"572 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___1"; +"573 GPT2LMHeadModel/GPT2Model[transformer]/NNCFLayerNorm[ln_f]/layer_norm_0"; +"574 GPT2LMHeadModel/GPT2Model[transformer]/view_2"; +"575 GPT2LMHeadModel/NNCFLinear[lm_head]/linear_0"; +"576 /nncf_model_output_0"; +"577 /nncf_model_output_1"; +"578 /nncf_model_output_2"; +"579 /nncf_model_output_3"; +"580 /nncf_model_output_4"; +"581 /nncf_model_output_5"; +"582 /nncf_model_output_6"; +"583 /nncf_model_output_7"; +"584 /nncf_model_output_8"; +"585 /nncf_model_output_9"; +"586 /nncf_model_output_10"; +"587 /nncf_model_output_11"; +"588 /nncf_model_output_12"; +"589 /nncf_model_output_13"; +"590 /nncf_model_output_14"; +"591 /nncf_model_output_15"; +"592 /nncf_model_output_16"; +"593 /nncf_model_output_17"; +"594 /nncf_model_output_18"; +"595 /nncf_model_output_19"; +"596 /nncf_model_output_20"; +"597 /nncf_model_output_21"; +"598 /nncf_model_output_22"; +"599 /nncf_model_output_23"; +"600 /nncf_model_output_24"; +"0 /nncf_model_input_0" -> "2 GPT2LMHeadModel/GPT2Model[transformer]/view_0" [label="(8, 1024) \n0 -> 0", style=dashed]; +"1 /nncf_model_input_1" -> "3 GPT2LMHeadModel/GPT2Model[transformer]/view_1" [label="(8, 1024) \n0 -> 0", style=dashed]; +"2 GPT2LMHeadModel/GPT2Model[transformer]/view_0" -> "5 GPT2LMHeadModel/GPT2Model[transformer]/NNCFEmbedding[wte]/embedding_0" [label="(8, 1024) \n0 -> 0", style=dashed]; +"3 GPT2LMHeadModel/GPT2Model[transformer]/view_1" -> "4 GPT2LMHeadModel/GPT2Model[transformer]/__getitem___0" [label="(8, 1024) \n0 -> 0", style=dashed]; +"5 GPT2LMHeadModel/GPT2Model[transformer]/NNCFEmbedding[wte]/embedding_0" -> "7 GPT2LMHeadModel/GPT2Model[transformer]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"6 GPT2LMHeadModel/GPT2Model[transformer]/NNCFEmbedding[wpe]/embedding_0" -> "7 GPT2LMHeadModel/GPT2Model[transformer]/__add___0" [label="(1, 1024, 768) \n0 -> 1", style=solid]; +"7 GPT2LMHeadModel/GPT2Model[transformer]/__add___0" -> "8 GPT2LMHeadModel/GPT2Model[transformer]/Dropout[drop]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"8 GPT2LMHeadModel/GPT2Model[transformer]/Dropout[drop]/dropout_0" -> "9 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"8 GPT2LMHeadModel/GPT2Model[transformer]/Dropout[drop]/dropout_0" -> "38 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"9 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "10 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"10 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "11 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"11 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "12 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"12 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "13 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"13 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/split_0" -> "14 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"13 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/split_0" -> "16 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"13 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/split_0" -> "18 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"14 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_0" -> "15 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"15 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_0" -> "21 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"16 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_1" -> "17 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"17 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_1" -> "20 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"17 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_1" -> "576 /nncf_model_output_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"18 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_2" -> "19 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"19 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_2" -> "30 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"19 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_2" -> "577 /nncf_model_output_1" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"20 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/transpose_0" -> "21 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"21 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_0" -> "23 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"22 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/full_0" -> "23 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"23 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__truediv___0" -> "25 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"24 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/full_1" -> "25 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"25 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/where_0" -> "26 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"26 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__add___0" -> "27 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"27 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/softmax_0" -> "28 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"28 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/type_0" -> "29 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"29 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "30 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"30 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_1" -> "31 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"31 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_3" -> "32 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"32 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/contiguous_0" -> "33 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"33 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_3" -> "34 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"34 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "35 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"35 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "36 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"36 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "37 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"37 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "38 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"38 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___0" -> "39 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"38 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___0" -> "55 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"39 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "40 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"40 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "41 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"41 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "42 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"42 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "43 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"42 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "44 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"42 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "46 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"43 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "50 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"44 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "45 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"45 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "46 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"46 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "47 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"47 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "48 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"48 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "49 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"49 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "50 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"50 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "51 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"51 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "52 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"52 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "53 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"53 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "54 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"54 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "55 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"55 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___1" -> "56 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"55 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___1" -> "85 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"56 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "57 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"57 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "58 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"58 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "59 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"59 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "60 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"60 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/split_0" -> "61 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"60 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/split_0" -> "63 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"60 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/split_0" -> "65 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"61 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_0" -> "62 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"62 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_0" -> "68 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"63 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_1" -> "64 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"64 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_1" -> "67 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"64 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_1" -> "578 /nncf_model_output_2" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"65 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_2" -> "66 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"66 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_2" -> "77 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"66 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_2" -> "579 /nncf_model_output_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"67 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/transpose_0" -> "68 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"68 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_0" -> "70 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"69 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/full_0" -> "70 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"70 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__truediv___0" -> "72 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"71 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/full_1" -> "72 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"72 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/where_0" -> "73 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"73 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__add___0" -> "74 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"74 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/softmax_0" -> "75 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"75 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/type_0" -> "76 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"76 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "77 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"77 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_1" -> "78 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"78 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_3" -> "79 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"79 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/contiguous_0" -> "80 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"80 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_3" -> "81 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"81 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "82 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"82 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "83 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"83 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "84 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"84 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "85 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"85 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___0" -> "86 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"85 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___0" -> "102 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"86 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "87 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"87 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "88 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"88 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "89 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"89 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "90 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"89 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "91 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"89 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "93 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"90 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "97 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"91 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "92 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"92 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "93 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"93 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "94 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"94 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "95 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"95 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "96 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"96 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "97 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"97 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "98 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"98 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "99 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"99 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "100 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"100 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "101 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"101 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "102 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"102 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___1" -> "103 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"102 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___1" -> "132 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"103 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "104 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"104 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "105 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"105 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "106 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"106 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "107 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"107 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/split_0" -> "108 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"107 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/split_0" -> "110 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"107 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/split_0" -> "112 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"108 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_0" -> "109 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"109 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_0" -> "115 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"110 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_1" -> "111 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"111 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_1" -> "114 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"111 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_1" -> "580 /nncf_model_output_4" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"112 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_2" -> "113 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"113 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_2" -> "124 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"113 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_2" -> "581 /nncf_model_output_5" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"114 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/transpose_0" -> "115 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"115 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_0" -> "117 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"116 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/full_0" -> "117 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"117 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__truediv___0" -> "119 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"118 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/full_1" -> "119 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"119 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/where_0" -> "120 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"120 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__add___0" -> "121 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"121 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/softmax_0" -> "122 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"122 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/type_0" -> "123 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"123 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "124 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"124 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_1" -> "125 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"125 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_3" -> "126 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"126 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/contiguous_0" -> "127 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"127 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_3" -> "128 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"128 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "129 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"129 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "130 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"130 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "131 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"131 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "132 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"132 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___0" -> "133 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"132 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___0" -> "149 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"133 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "134 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"134 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "135 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"135 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "136 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"136 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "137 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"136 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "138 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"136 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "140 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"137 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "144 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"138 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "139 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"139 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "140 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"140 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "141 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"141 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "142 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"142 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "143 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"143 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "144 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"144 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "145 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"145 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "146 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"146 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "147 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"147 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "148 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"148 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "149 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"149 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___1" -> "150 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"149 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___1" -> "179 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"150 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "151 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"151 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "152 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"152 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "153 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"153 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "154 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"154 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/split_0" -> "155 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"154 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/split_0" -> "157 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"154 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/split_0" -> "159 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"155 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_0" -> "156 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"156 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_0" -> "162 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"157 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_1" -> "158 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"158 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_1" -> "161 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"158 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_1" -> "582 /nncf_model_output_6" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"159 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_2" -> "160 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"160 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_2" -> "171 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"160 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_2" -> "583 /nncf_model_output_7" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"161 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/transpose_0" -> "162 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"162 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_0" -> "164 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"163 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/full_0" -> "164 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"164 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__truediv___0" -> "166 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"165 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/full_1" -> "166 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"166 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/where_0" -> "167 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"167 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__add___0" -> "168 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"168 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/softmax_0" -> "169 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"169 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/type_0" -> "170 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"170 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "171 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"171 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_1" -> "172 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"172 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_3" -> "173 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"173 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/contiguous_0" -> "174 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"174 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_3" -> "175 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"175 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "176 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"176 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "177 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"177 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "178 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"178 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "179 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"179 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___0" -> "180 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"179 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___0" -> "196 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"180 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "181 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"181 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "182 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"182 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "183 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"183 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "184 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"183 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "185 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"183 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "187 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"184 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "191 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"185 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "186 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"186 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "187 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"187 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "188 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"188 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "189 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"189 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "190 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"190 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "191 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"191 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "192 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"192 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "193 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"193 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "194 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"194 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "195 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"195 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "196 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"196 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___1" -> "197 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"196 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___1" -> "226 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"197 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "198 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"198 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "199 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"199 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "200 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"200 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "201 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"201 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/split_0" -> "202 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"201 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/split_0" -> "204 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"201 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/split_0" -> "206 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"202 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_0" -> "203 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"203 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_0" -> "209 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"204 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_1" -> "205 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"205 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_1" -> "208 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"205 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_1" -> "584 /nncf_model_output_8" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"206 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_2" -> "207 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"207 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_2" -> "218 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"207 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_2" -> "585 /nncf_model_output_9" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"208 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/transpose_0" -> "209 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"209 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_0" -> "211 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"210 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/full_0" -> "211 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"211 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__truediv___0" -> "213 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"212 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/full_1" -> "213 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"213 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/where_0" -> "214 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"214 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__add___0" -> "215 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"215 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/softmax_0" -> "216 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"216 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/type_0" -> "217 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"217 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "218 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"218 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_1" -> "219 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"219 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_3" -> "220 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"220 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/contiguous_0" -> "221 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"221 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_3" -> "222 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"222 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "223 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"223 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "224 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"224 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "225 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"225 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "226 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"226 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___0" -> "227 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"226 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___0" -> "243 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"227 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "228 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"228 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "229 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"229 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "230 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"230 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "231 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"230 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "232 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"230 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "234 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"231 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "238 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"232 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "233 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"233 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "234 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"234 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "235 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"235 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "236 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"236 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "237 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"237 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "238 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"238 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "239 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"239 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "240 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"240 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "241 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"241 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "242 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"242 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "243 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"243 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___1" -> "244 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"243 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___1" -> "273 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"244 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "245 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"245 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "246 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"246 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "247 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"247 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "248 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"248 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/split_0" -> "249 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"248 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/split_0" -> "251 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"248 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/split_0" -> "253 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"249 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_0" -> "250 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"250 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_0" -> "256 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"251 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_1" -> "252 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"252 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_1" -> "255 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"252 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_1" -> "586 /nncf_model_output_10" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"253 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_2" -> "254 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"254 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_2" -> "265 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"254 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_2" -> "587 /nncf_model_output_11" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"255 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/transpose_0" -> "256 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"256 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_0" -> "258 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"257 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/full_0" -> "258 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"258 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__truediv___0" -> "260 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"259 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/full_1" -> "260 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"260 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/where_0" -> "261 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"261 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__add___0" -> "262 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"262 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/softmax_0" -> "263 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"263 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/type_0" -> "264 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"264 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "265 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"265 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_1" -> "266 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"266 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_3" -> "267 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"267 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/contiguous_0" -> "268 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"268 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_3" -> "269 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"269 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "270 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"270 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "271 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"271 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "272 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"272 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "273 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"273 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___0" -> "274 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"273 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___0" -> "290 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"274 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "275 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"275 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "276 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"276 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "277 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"277 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "278 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"277 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "279 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"277 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "281 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"278 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "285 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"279 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "280 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"280 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "281 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"281 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "282 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"282 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "283 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"283 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "284 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"284 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "285 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"285 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "286 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"286 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "287 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"287 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "288 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"288 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "289 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"289 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "290 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"290 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___1" -> "291 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"290 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___1" -> "320 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"291 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "292 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"292 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "293 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"293 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "294 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"294 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "295 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"295 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/split_0" -> "296 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"295 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/split_0" -> "298 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"295 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/split_0" -> "300 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"296 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_0" -> "297 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"297 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_0" -> "303 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"298 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_1" -> "299 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"299 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_1" -> "302 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"299 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_1" -> "588 /nncf_model_output_12" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"300 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_2" -> "301 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"301 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_2" -> "312 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"301 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_2" -> "589 /nncf_model_output_13" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"302 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/transpose_0" -> "303 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"303 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_0" -> "305 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"304 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/full_0" -> "305 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"305 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__truediv___0" -> "307 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"306 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/full_1" -> "307 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"307 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/where_0" -> "308 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"308 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__add___0" -> "309 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"309 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/softmax_0" -> "310 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"310 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/type_0" -> "311 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"311 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "312 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"312 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_1" -> "313 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"313 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_3" -> "314 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"314 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/contiguous_0" -> "315 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"315 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_3" -> "316 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"316 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "317 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"317 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "318 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"318 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "319 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"319 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "320 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"320 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___0" -> "321 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"320 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___0" -> "337 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"321 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "322 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"322 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "323 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"323 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "324 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"324 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "325 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"324 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "326 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"324 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "328 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"325 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "332 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"326 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "327 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"327 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "328 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"328 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "329 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"329 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "330 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"330 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "331 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"331 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "332 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"332 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "333 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"333 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "334 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"334 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "335 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"335 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "336 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"336 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "337 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"337 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___1" -> "338 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"337 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___1" -> "367 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"338 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "339 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"339 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "340 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"340 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "341 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"341 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "342 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"342 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/split_0" -> "343 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"342 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/split_0" -> "345 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"342 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/split_0" -> "347 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"343 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_0" -> "344 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"344 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_0" -> "350 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"345 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_1" -> "346 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"346 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_1" -> "349 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"346 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_1" -> "590 /nncf_model_output_14" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"347 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_2" -> "348 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"348 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_2" -> "359 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"348 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_2" -> "591 /nncf_model_output_15" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"349 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/transpose_0" -> "350 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"350 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_0" -> "352 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"351 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/full_0" -> "352 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"352 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__truediv___0" -> "354 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"353 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/full_1" -> "354 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"354 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/where_0" -> "355 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"355 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__add___0" -> "356 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"356 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/softmax_0" -> "357 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"357 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/type_0" -> "358 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"358 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "359 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"359 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_1" -> "360 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"360 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_3" -> "361 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"361 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/contiguous_0" -> "362 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"362 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_3" -> "363 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"363 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "364 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"364 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "365 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"365 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "366 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"366 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "367 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"367 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___0" -> "368 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"367 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___0" -> "384 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"368 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "369 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"369 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "370 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"370 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "371 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"371 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "372 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"371 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "373 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"371 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "375 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"372 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "379 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"373 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "374 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"374 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "375 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"375 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "376 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"376 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "377 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"377 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "378 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"378 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "379 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"379 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "380 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"380 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "381 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"381 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "382 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"382 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "383 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"383 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "384 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"384 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___1" -> "385 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"384 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___1" -> "414 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"385 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "386 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"386 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "387 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"387 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "388 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"388 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "389 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"389 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/split_0" -> "390 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"389 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/split_0" -> "392 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"389 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/split_0" -> "394 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"390 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_0" -> "391 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"391 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_0" -> "397 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"392 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_1" -> "393 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"393 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_1" -> "396 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"393 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_1" -> "592 /nncf_model_output_16" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"394 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_2" -> "395 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"395 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_2" -> "406 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"395 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_2" -> "593 /nncf_model_output_17" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"396 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/transpose_0" -> "397 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"397 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_0" -> "399 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"398 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/full_0" -> "399 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"399 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__truediv___0" -> "401 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"400 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/full_1" -> "401 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"401 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/where_0" -> "402 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"402 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__add___0" -> "403 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"403 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/softmax_0" -> "404 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"404 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/type_0" -> "405 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"405 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "406 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"406 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_1" -> "407 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"407 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_3" -> "408 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"408 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/contiguous_0" -> "409 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"409 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_3" -> "410 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"410 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "411 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"411 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "412 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"412 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "413 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"413 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "414 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"414 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___0" -> "415 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"414 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___0" -> "431 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"415 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "416 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"416 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "417 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"417 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "418 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"418 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "419 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"418 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "420 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"418 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "422 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"419 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "426 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"420 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "421 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"421 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "422 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"422 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "423 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"423 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "424 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"424 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "425 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"425 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "426 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"426 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "427 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"427 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "428 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"428 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "429 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"429 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "430 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"430 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "431 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"431 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___1" -> "432 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"431 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___1" -> "461 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"432 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "433 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"433 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "434 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"434 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "435 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"435 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "436 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"436 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/split_0" -> "437 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"436 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/split_0" -> "439 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"436 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/split_0" -> "441 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"437 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_0" -> "438 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"438 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_0" -> "444 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"439 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_1" -> "440 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"440 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_1" -> "443 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"440 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_1" -> "594 /nncf_model_output_18" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"441 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_2" -> "442 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"442 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_2" -> "453 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"442 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_2" -> "595 /nncf_model_output_19" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"443 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/transpose_0" -> "444 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"444 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_0" -> "446 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"445 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/full_0" -> "446 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"446 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__truediv___0" -> "448 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"447 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/full_1" -> "448 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"448 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/where_0" -> "449 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"449 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__add___0" -> "450 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"450 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/softmax_0" -> "451 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"451 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/type_0" -> "452 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"452 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "453 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"453 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_1" -> "454 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"454 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_3" -> "455 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"455 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/contiguous_0" -> "456 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"456 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_3" -> "457 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"457 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "458 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"458 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "459 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"459 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "460 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"460 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "461 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"461 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___0" -> "462 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"461 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___0" -> "478 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"462 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "463 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"463 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "464 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"464 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "465 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"465 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "466 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"465 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "467 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"465 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "469 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"466 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "473 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"467 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "468 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"468 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "469 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"469 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "470 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"470 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "471 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"471 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "472 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"472 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "473 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"473 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "474 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"474 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "475 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"475 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "476 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"476 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "477 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"477 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "478 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"478 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___1" -> "479 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"478 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___1" -> "508 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"479 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "480 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"480 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "481 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"481 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "482 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"482 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "483 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"483 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/split_0" -> "484 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"483 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/split_0" -> "486 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"483 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/split_0" -> "488 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"484 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_0" -> "485 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"485 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_0" -> "491 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"486 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_1" -> "487 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"487 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_1" -> "490 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"487 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_1" -> "596 /nncf_model_output_20" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"488 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_2" -> "489 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"489 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_2" -> "500 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"489 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_2" -> "597 /nncf_model_output_21" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"490 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/transpose_0" -> "491 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"491 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_0" -> "493 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"492 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/full_0" -> "493 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"493 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__truediv___0" -> "495 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"494 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/full_1" -> "495 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"495 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/where_0" -> "496 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"496 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__add___0" -> "497 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"497 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/softmax_0" -> "498 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"498 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/type_0" -> "499 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"499 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "500 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"500 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_1" -> "501 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"501 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_3" -> "502 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"502 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/contiguous_0" -> "503 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"503 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_3" -> "504 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"504 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "505 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"505 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "506 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"506 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "507 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"507 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "508 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"508 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___0" -> "509 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"508 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___0" -> "525 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"509 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "510 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"510 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "511 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"511 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "512 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"512 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "513 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"512 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "514 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"512 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "516 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"513 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "520 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"514 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "515 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"515 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "516 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"516 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "517 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"517 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "518 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"518 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "519 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"519 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "520 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"520 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "521 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"521 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "522 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"522 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "523 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"523 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "524 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"524 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "525 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"525 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___1" -> "526 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"525 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___1" -> "555 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"526 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "527 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"527 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "528 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"528 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "529 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid]; +"529 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "530 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid]; +"530 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/split_0" -> "531 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"530 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/split_0" -> "533 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid]; +"530 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/split_0" -> "535 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid]; +"531 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_0" -> "532 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"532 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_0" -> "538 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"533 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_1" -> "534 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"534 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_1" -> "537 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"534 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_1" -> "598 /nncf_model_output_22" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"535 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_2" -> "536 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"536 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_2" -> "547 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid]; +"536 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_2" -> "599 /nncf_model_output_23" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"537 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/transpose_0" -> "538 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid]; +"538 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_0" -> "540 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"539 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/full_0" -> "540 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid]; +"540 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__truediv___0" -> "542 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid]; +"541 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/full_1" -> "542 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid]; +"542 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/where_0" -> "543 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"543 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__add___0" -> "544 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"544 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/softmax_0" -> "545 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"545 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/type_0" -> "546 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"546 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "547 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid]; +"547 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_1" -> "548 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid]; +"548 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_3" -> "549 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"549 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/contiguous_0" -> "550 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid]; +"550 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_3" -> "551 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"551 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "552 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"552 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "553 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"553 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "554 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"554 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "555 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"555 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___0" -> "556 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"555 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___0" -> "572 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"556 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "557 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"557 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "558 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid]; +"558 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "559 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid]; +"559 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "560 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"559 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "561 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"559 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "563 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"560 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "567 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"561 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "562 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"562 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "563 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"563 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "564 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"564 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "565 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"565 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "566 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"566 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "567 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid]; +"567 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "568 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid]; +"568 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "569 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid]; +"569 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "570 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid]; +"570 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "571 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"571 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "572 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid]; +"572 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___1" -> "573 GPT2LMHeadModel/GPT2Model[transformer]/NNCFLayerNorm[ln_f]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"573 GPT2LMHeadModel/GPT2Model[transformer]/NNCFLayerNorm[ln_f]/layer_norm_0" -> "574 GPT2LMHeadModel/GPT2Model[transformer]/view_2" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"574 GPT2LMHeadModel/GPT2Model[transformer]/view_2" -> "575 GPT2LMHeadModel/NNCFLinear[lm_head]/linear_0" [label="(8, 1024, 768) \n0 -> 0", style=solid]; +"575 GPT2LMHeadModel/NNCFLinear[lm_head]/linear_0" -> "600 /nncf_model_output_24" [label="(8, 1024, 50257) \n0 -> 0", style=solid]; +}