ov-gpt2-fp32-kv-cache / compressed_graph.dot
Vui Seng Chua
Add content
57022cc
raw
history blame contribute delete
No virus
237 kB
strict digraph {
"0 /nncf_model_input_0";
"1 /nncf_model_input_1";
"2 GPT2LMHeadModel/GPT2Model[transformer]/view_0";
"3 GPT2LMHeadModel/GPT2Model[transformer]/view_1";
"4 GPT2LMHeadModel/GPT2Model[transformer]/__getitem___0";
"5 GPT2LMHeadModel/GPT2Model[transformer]/NNCFEmbedding[wte]/embedding_0";
"6 GPT2LMHeadModel/GPT2Model[transformer]/NNCFEmbedding[wpe]/embedding_0";
"7 GPT2LMHeadModel/GPT2Model[transformer]/__add___0";
"8 GPT2LMHeadModel/GPT2Model[transformer]/Dropout[drop]/dropout_0";
"9 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_1]/layer_norm_0";
"10 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"11 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"12 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"13 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/split_0";
"14 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_0";
"15 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_0";
"16 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_1";
"17 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_1";
"18 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_2";
"19 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_2";
"20 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/transpose_0";
"21 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_0";
"22 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/full_0";
"23 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__truediv___0";
"24 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/full_1";
"25 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/where_0";
"26 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__add___0";
"27 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/softmax_0";
"28 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/type_0";
"29 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"30 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_1";
"31 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_3";
"32 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/contiguous_0";
"33 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_3";
"34 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"35 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"36 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"37 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"38 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___0";
"39 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_2]/layer_norm_0";
"40 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"41 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"42 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"43 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"44 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"45 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"46 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"47 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"48 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"49 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"50 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"51 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"52 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"53 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"54 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"55 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___1";
"56 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_1]/layer_norm_0";
"57 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"58 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"59 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"60 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/split_0";
"61 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_0";
"62 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_0";
"63 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_1";
"64 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_1";
"65 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_2";
"66 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_2";
"67 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/transpose_0";
"68 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_0";
"69 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/full_0";
"70 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__truediv___0";
"71 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/full_1";
"72 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/where_0";
"73 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__add___0";
"74 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/softmax_0";
"75 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/type_0";
"76 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"77 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_1";
"78 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_3";
"79 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/contiguous_0";
"80 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_3";
"81 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"82 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"83 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"84 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"85 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___0";
"86 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_2]/layer_norm_0";
"87 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"88 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"89 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"90 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"91 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"92 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"93 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"94 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"95 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"96 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"97 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"98 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"99 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"100 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"101 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"102 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___1";
"103 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_1]/layer_norm_0";
"104 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"105 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"106 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"107 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/split_0";
"108 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_0";
"109 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_0";
"110 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_1";
"111 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_1";
"112 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_2";
"113 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_2";
"114 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/transpose_0";
"115 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_0";
"116 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/full_0";
"117 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__truediv___0";
"118 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/full_1";
"119 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/where_0";
"120 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__add___0";
"121 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/softmax_0";
"122 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/type_0";
"123 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"124 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_1";
"125 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_3";
"126 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/contiguous_0";
"127 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_3";
"128 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"129 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"130 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"131 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"132 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___0";
"133 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_2]/layer_norm_0";
"134 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"135 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"136 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"137 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"138 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"139 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"140 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"141 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"142 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"143 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"144 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"145 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"146 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"147 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"148 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"149 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___1";
"150 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_1]/layer_norm_0";
"151 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"152 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"153 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"154 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/split_0";
"155 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_0";
"156 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_0";
"157 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_1";
"158 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_1";
"159 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_2";
"160 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_2";
"161 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/transpose_0";
"162 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_0";
"163 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/full_0";
"164 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__truediv___0";
"165 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/full_1";
"166 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/where_0";
"167 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__add___0";
"168 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/softmax_0";
"169 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/type_0";
"170 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"171 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_1";
"172 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_3";
"173 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/contiguous_0";
"174 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_3";
"175 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"176 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"177 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"178 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"179 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___0";
"180 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_2]/layer_norm_0";
"181 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"182 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"183 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"184 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"185 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"186 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"187 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"188 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"189 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"190 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"191 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"192 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"193 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"194 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"195 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"196 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___1";
"197 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_1]/layer_norm_0";
"198 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"199 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"200 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"201 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/split_0";
"202 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_0";
"203 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_0";
"204 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_1";
"205 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_1";
"206 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_2";
"207 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_2";
"208 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/transpose_0";
"209 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_0";
"210 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/full_0";
"211 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__truediv___0";
"212 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/full_1";
"213 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/where_0";
"214 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__add___0";
"215 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/softmax_0";
"216 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/type_0";
"217 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"218 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_1";
"219 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_3";
"220 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/contiguous_0";
"221 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_3";
"222 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"223 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"224 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"225 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"226 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___0";
"227 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_2]/layer_norm_0";
"228 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"229 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"230 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"231 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"232 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"233 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"234 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"235 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"236 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"237 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"238 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"239 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"240 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"241 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"242 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"243 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___1";
"244 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_1]/layer_norm_0";
"245 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"246 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"247 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"248 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/split_0";
"249 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_0";
"250 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_0";
"251 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_1";
"252 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_1";
"253 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_2";
"254 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_2";
"255 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/transpose_0";
"256 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_0";
"257 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/full_0";
"258 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__truediv___0";
"259 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/full_1";
"260 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/where_0";
"261 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__add___0";
"262 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/softmax_0";
"263 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/type_0";
"264 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"265 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_1";
"266 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_3";
"267 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/contiguous_0";
"268 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_3";
"269 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"270 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"271 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"272 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"273 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___0";
"274 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_2]/layer_norm_0";
"275 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"276 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"277 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"278 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"279 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"280 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"281 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"282 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"283 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"284 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"285 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"286 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"287 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"288 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"289 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"290 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___1";
"291 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_1]/layer_norm_0";
"292 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"293 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"294 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"295 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/split_0";
"296 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_0";
"297 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_0";
"298 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_1";
"299 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_1";
"300 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_2";
"301 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_2";
"302 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/transpose_0";
"303 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_0";
"304 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/full_0";
"305 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__truediv___0";
"306 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/full_1";
"307 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/where_0";
"308 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__add___0";
"309 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/softmax_0";
"310 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/type_0";
"311 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"312 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_1";
"313 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_3";
"314 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/contiguous_0";
"315 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_3";
"316 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"317 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"318 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"319 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"320 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___0";
"321 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_2]/layer_norm_0";
"322 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"323 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"324 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"325 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"326 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"327 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"328 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"329 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"330 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"331 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"332 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"333 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"334 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"335 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"336 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"337 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___1";
"338 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_1]/layer_norm_0";
"339 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"340 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"341 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"342 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/split_0";
"343 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_0";
"344 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_0";
"345 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_1";
"346 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_1";
"347 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_2";
"348 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_2";
"349 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/transpose_0";
"350 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_0";
"351 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/full_0";
"352 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__truediv___0";
"353 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/full_1";
"354 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/where_0";
"355 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__add___0";
"356 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/softmax_0";
"357 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/type_0";
"358 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"359 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_1";
"360 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_3";
"361 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/contiguous_0";
"362 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_3";
"363 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"364 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"365 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"366 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"367 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___0";
"368 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_2]/layer_norm_0";
"369 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"370 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"371 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"372 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"373 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"374 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"375 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"376 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"377 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"378 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"379 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"380 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"381 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"382 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"383 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"384 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___1";
"385 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_1]/layer_norm_0";
"386 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"387 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"388 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"389 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/split_0";
"390 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_0";
"391 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_0";
"392 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_1";
"393 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_1";
"394 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_2";
"395 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_2";
"396 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/transpose_0";
"397 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_0";
"398 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/full_0";
"399 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__truediv___0";
"400 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/full_1";
"401 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/where_0";
"402 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__add___0";
"403 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/softmax_0";
"404 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/type_0";
"405 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"406 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_1";
"407 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_3";
"408 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/contiguous_0";
"409 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_3";
"410 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"411 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"412 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"413 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"414 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___0";
"415 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_2]/layer_norm_0";
"416 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"417 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"418 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"419 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"420 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"421 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"422 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"423 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"424 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"425 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"426 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"427 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"428 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"429 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"430 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"431 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___1";
"432 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_1]/layer_norm_0";
"433 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"434 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"435 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"436 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/split_0";
"437 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_0";
"438 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_0";
"439 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_1";
"440 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_1";
"441 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_2";
"442 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_2";
"443 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/transpose_0";
"444 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_0";
"445 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/full_0";
"446 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__truediv___0";
"447 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/full_1";
"448 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/where_0";
"449 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__add___0";
"450 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/softmax_0";
"451 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/type_0";
"452 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"453 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_1";
"454 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_3";
"455 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/contiguous_0";
"456 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_3";
"457 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"458 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"459 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"460 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"461 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___0";
"462 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_2]/layer_norm_0";
"463 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"464 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"465 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"466 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"467 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"468 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"469 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"470 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"471 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"472 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"473 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"474 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"475 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"476 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"477 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"478 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___1";
"479 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_1]/layer_norm_0";
"480 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"481 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"482 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"483 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/split_0";
"484 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_0";
"485 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_0";
"486 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_1";
"487 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_1";
"488 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_2";
"489 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_2";
"490 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/transpose_0";
"491 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_0";
"492 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/full_0";
"493 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__truediv___0";
"494 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/full_1";
"495 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/where_0";
"496 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__add___0";
"497 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/softmax_0";
"498 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/type_0";
"499 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"500 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_1";
"501 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_3";
"502 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/contiguous_0";
"503 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_3";
"504 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"505 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"506 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"507 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"508 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___0";
"509 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_2]/layer_norm_0";
"510 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"511 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"512 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"513 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"514 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"515 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"516 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"517 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"518 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"519 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"520 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"521 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"522 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"523 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"524 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"525 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___1";
"526 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_1]/layer_norm_0";
"527 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_0";
"528 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0";
"529 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_1";
"530 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/split_0";
"531 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_0";
"532 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_0";
"533 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_1";
"534 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_1";
"535 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_2";
"536 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_2";
"537 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/transpose_0";
"538 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_0";
"539 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/full_0";
"540 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__truediv___0";
"541 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/full_1";
"542 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/where_0";
"543 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__add___0";
"544 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/softmax_0";
"545 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/type_0";
"546 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0";
"547 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_1";
"548 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_3";
"549 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/contiguous_0";
"550 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_3";
"551 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_0";
"552 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0";
"553 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_1";
"554 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0";
"555 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___0";
"556 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_2]/layer_norm_0";
"557 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0";
"558 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0";
"559 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1";
"560 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0";
"561 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0";
"562 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1";
"563 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0";
"564 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2";
"565 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0";
"566 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0";
"567 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0";
"568 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0";
"569 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0";
"570 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1";
"571 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0";
"572 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___1";
"573 GPT2LMHeadModel/GPT2Model[transformer]/NNCFLayerNorm[ln_f]/layer_norm_0";
"574 GPT2LMHeadModel/GPT2Model[transformer]/view_2";
"575 GPT2LMHeadModel/NNCFLinear[lm_head]/linear_0";
"576 /nncf_model_output_0";
"577 /nncf_model_output_1";
"578 /nncf_model_output_2";
"579 /nncf_model_output_3";
"580 /nncf_model_output_4";
"581 /nncf_model_output_5";
"582 /nncf_model_output_6";
"583 /nncf_model_output_7";
"584 /nncf_model_output_8";
"585 /nncf_model_output_9";
"586 /nncf_model_output_10";
"587 /nncf_model_output_11";
"588 /nncf_model_output_12";
"589 /nncf_model_output_13";
"590 /nncf_model_output_14";
"591 /nncf_model_output_15";
"592 /nncf_model_output_16";
"593 /nncf_model_output_17";
"594 /nncf_model_output_18";
"595 /nncf_model_output_19";
"596 /nncf_model_output_20";
"597 /nncf_model_output_21";
"598 /nncf_model_output_22";
"599 /nncf_model_output_23";
"600 /nncf_model_output_24";
"0 /nncf_model_input_0" -> "2 GPT2LMHeadModel/GPT2Model[transformer]/view_0" [label="(8, 1024) \n0 -> 0", style=dashed];
"1 /nncf_model_input_1" -> "3 GPT2LMHeadModel/GPT2Model[transformer]/view_1" [label="(8, 1024) \n0 -> 0", style=dashed];
"2 GPT2LMHeadModel/GPT2Model[transformer]/view_0" -> "5 GPT2LMHeadModel/GPT2Model[transformer]/NNCFEmbedding[wte]/embedding_0" [label="(8, 1024) \n0 -> 0", style=dashed];
"3 GPT2LMHeadModel/GPT2Model[transformer]/view_1" -> "4 GPT2LMHeadModel/GPT2Model[transformer]/__getitem___0" [label="(8, 1024) \n0 -> 0", style=dashed];
"5 GPT2LMHeadModel/GPT2Model[transformer]/NNCFEmbedding[wte]/embedding_0" -> "7 GPT2LMHeadModel/GPT2Model[transformer]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"6 GPT2LMHeadModel/GPT2Model[transformer]/NNCFEmbedding[wpe]/embedding_0" -> "7 GPT2LMHeadModel/GPT2Model[transformer]/__add___0" [label="(1, 1024, 768) \n0 -> 1", style=solid];
"7 GPT2LMHeadModel/GPT2Model[transformer]/__add___0" -> "8 GPT2LMHeadModel/GPT2Model[transformer]/Dropout[drop]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"8 GPT2LMHeadModel/GPT2Model[transformer]/Dropout[drop]/dropout_0" -> "9 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"8 GPT2LMHeadModel/GPT2Model[transformer]/Dropout[drop]/dropout_0" -> "38 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"9 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "10 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"10 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "11 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"11 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "12 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"12 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "13 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"13 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/split_0" -> "14 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"13 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/split_0" -> "16 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"13 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/split_0" -> "18 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"14 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_0" -> "15 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"15 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_0" -> "21 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"16 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_1" -> "17 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"17 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_1" -> "20 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"17 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_1" -> "576 /nncf_model_output_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"18 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_2" -> "19 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"19 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_2" -> "30 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"19 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_2" -> "577 /nncf_model_output_1" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"20 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/transpose_0" -> "21 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"21 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_0" -> "23 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"22 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/full_0" -> "23 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"23 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__truediv___0" -> "25 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"24 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/full_1" -> "25 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"25 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/where_0" -> "26 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"26 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/__add___0" -> "27 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"27 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/softmax_0" -> "28 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"28 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/type_0" -> "29 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"29 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "30 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"30 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/matmul_1" -> "31 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"31 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/permute_3" -> "32 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"32 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/contiguous_0" -> "33 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"33 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/view_3" -> "34 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"34 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "35 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"35 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "36 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"36 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "37 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"37 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "38 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"38 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___0" -> "39 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"38 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___0" -> "55 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"39 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "40 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"40 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "41 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"41 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "42 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"42 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "43 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"42 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "44 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"42 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "46 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"43 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "50 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"44 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "45 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"45 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "46 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"46 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "47 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"47 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "48 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"48 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "49 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"49 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "50 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"50 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "51 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"51 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "52 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"52 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "53 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"53 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "54 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"54 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "55 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"55 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___1" -> "56 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"55 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[0]/__add___1" -> "85 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"56 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "57 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"57 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "58 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"58 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "59 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"59 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "60 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"60 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/split_0" -> "61 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"60 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/split_0" -> "63 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"60 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/split_0" -> "65 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"61 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_0" -> "62 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"62 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_0" -> "68 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"63 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_1" -> "64 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"64 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_1" -> "67 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"64 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_1" -> "578 /nncf_model_output_2" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"65 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_2" -> "66 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"66 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_2" -> "77 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"66 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_2" -> "579 /nncf_model_output_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"67 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/transpose_0" -> "68 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"68 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_0" -> "70 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"69 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/full_0" -> "70 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"70 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__truediv___0" -> "72 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"71 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/full_1" -> "72 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"72 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/where_0" -> "73 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"73 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/__add___0" -> "74 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"74 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/softmax_0" -> "75 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"75 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/type_0" -> "76 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"76 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "77 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"77 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/matmul_1" -> "78 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"78 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/permute_3" -> "79 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"79 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/contiguous_0" -> "80 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"80 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/view_3" -> "81 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"81 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "82 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"82 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "83 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"83 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "84 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"84 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "85 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"85 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___0" -> "86 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"85 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___0" -> "102 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"86 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "87 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"87 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "88 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"88 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "89 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"89 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "90 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"89 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "91 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"89 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "93 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"90 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "97 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"91 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "92 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"92 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "93 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"93 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "94 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"94 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "95 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"95 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "96 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"96 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "97 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"97 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "98 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"98 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "99 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"99 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "100 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"100 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "101 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"101 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "102 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"102 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___1" -> "103 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"102 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[1]/__add___1" -> "132 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"103 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "104 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"104 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "105 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"105 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "106 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"106 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "107 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"107 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/split_0" -> "108 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"107 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/split_0" -> "110 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"107 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/split_0" -> "112 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"108 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_0" -> "109 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"109 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_0" -> "115 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"110 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_1" -> "111 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"111 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_1" -> "114 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"111 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_1" -> "580 /nncf_model_output_4" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"112 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_2" -> "113 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"113 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_2" -> "124 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"113 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_2" -> "581 /nncf_model_output_5" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"114 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/transpose_0" -> "115 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"115 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_0" -> "117 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"116 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/full_0" -> "117 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"117 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__truediv___0" -> "119 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"118 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/full_1" -> "119 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"119 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/where_0" -> "120 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"120 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/__add___0" -> "121 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"121 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/softmax_0" -> "122 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"122 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/type_0" -> "123 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"123 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "124 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"124 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/matmul_1" -> "125 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"125 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/permute_3" -> "126 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"126 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/contiguous_0" -> "127 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"127 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/view_3" -> "128 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"128 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "129 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"129 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "130 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"130 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "131 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"131 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "132 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"132 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___0" -> "133 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"132 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___0" -> "149 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"133 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "134 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"134 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "135 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"135 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "136 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"136 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "137 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"136 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "138 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"136 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "140 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"137 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "144 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"138 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "139 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"139 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "140 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"140 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "141 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"141 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "142 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"142 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "143 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"143 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "144 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"144 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "145 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"145 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "146 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"146 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "147 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"147 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "148 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"148 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "149 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"149 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___1" -> "150 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"149 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[2]/__add___1" -> "179 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"150 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "151 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"151 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "152 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"152 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "153 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"153 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "154 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"154 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/split_0" -> "155 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"154 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/split_0" -> "157 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"154 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/split_0" -> "159 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"155 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_0" -> "156 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"156 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_0" -> "162 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"157 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_1" -> "158 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"158 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_1" -> "161 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"158 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_1" -> "582 /nncf_model_output_6" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"159 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_2" -> "160 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"160 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_2" -> "171 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"160 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_2" -> "583 /nncf_model_output_7" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"161 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/transpose_0" -> "162 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"162 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_0" -> "164 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"163 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/full_0" -> "164 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"164 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__truediv___0" -> "166 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"165 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/full_1" -> "166 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"166 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/where_0" -> "167 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"167 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/__add___0" -> "168 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"168 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/softmax_0" -> "169 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"169 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/type_0" -> "170 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"170 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "171 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"171 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/matmul_1" -> "172 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"172 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/permute_3" -> "173 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"173 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/contiguous_0" -> "174 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"174 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/view_3" -> "175 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"175 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "176 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"176 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "177 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"177 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "178 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"178 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "179 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"179 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___0" -> "180 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"179 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___0" -> "196 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"180 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "181 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"181 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "182 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"182 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "183 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"183 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "184 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"183 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "185 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"183 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "187 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"184 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "191 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"185 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "186 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"186 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "187 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"187 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "188 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"188 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "189 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"189 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "190 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"190 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "191 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"191 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "192 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"192 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "193 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"193 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "194 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"194 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "195 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"195 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "196 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"196 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___1" -> "197 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"196 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[3]/__add___1" -> "226 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"197 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "198 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"198 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "199 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"199 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "200 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"200 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "201 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"201 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/split_0" -> "202 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"201 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/split_0" -> "204 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"201 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/split_0" -> "206 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"202 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_0" -> "203 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"203 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_0" -> "209 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"204 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_1" -> "205 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"205 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_1" -> "208 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"205 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_1" -> "584 /nncf_model_output_8" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"206 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_2" -> "207 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"207 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_2" -> "218 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"207 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_2" -> "585 /nncf_model_output_9" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"208 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/transpose_0" -> "209 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"209 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_0" -> "211 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"210 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/full_0" -> "211 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"211 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__truediv___0" -> "213 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"212 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/full_1" -> "213 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"213 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/where_0" -> "214 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"214 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/__add___0" -> "215 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"215 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/softmax_0" -> "216 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"216 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/type_0" -> "217 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"217 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "218 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"218 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/matmul_1" -> "219 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"219 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/permute_3" -> "220 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"220 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/contiguous_0" -> "221 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"221 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/view_3" -> "222 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"222 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "223 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"223 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "224 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"224 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "225 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"225 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "226 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"226 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___0" -> "227 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"226 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___0" -> "243 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"227 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "228 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"228 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "229 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"229 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "230 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"230 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "231 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"230 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "232 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"230 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "234 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"231 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "238 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"232 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "233 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"233 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "234 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"234 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "235 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"235 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "236 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"236 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "237 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"237 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "238 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"238 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "239 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"239 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "240 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"240 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "241 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"241 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "242 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"242 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "243 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"243 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___1" -> "244 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"243 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[4]/__add___1" -> "273 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"244 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "245 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"245 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "246 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"246 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "247 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"247 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "248 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"248 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/split_0" -> "249 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"248 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/split_0" -> "251 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"248 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/split_0" -> "253 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"249 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_0" -> "250 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"250 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_0" -> "256 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"251 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_1" -> "252 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"252 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_1" -> "255 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"252 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_1" -> "586 /nncf_model_output_10" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"253 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_2" -> "254 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"254 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_2" -> "265 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"254 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_2" -> "587 /nncf_model_output_11" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"255 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/transpose_0" -> "256 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"256 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_0" -> "258 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"257 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/full_0" -> "258 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"258 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__truediv___0" -> "260 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"259 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/full_1" -> "260 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"260 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/where_0" -> "261 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"261 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/__add___0" -> "262 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"262 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/softmax_0" -> "263 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"263 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/type_0" -> "264 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"264 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "265 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"265 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/matmul_1" -> "266 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"266 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/permute_3" -> "267 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"267 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/contiguous_0" -> "268 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"268 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/view_3" -> "269 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"269 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "270 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"270 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "271 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"271 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "272 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"272 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "273 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"273 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___0" -> "274 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"273 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___0" -> "290 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"274 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "275 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"275 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "276 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"276 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "277 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"277 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "278 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"277 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "279 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"277 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "281 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"278 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "285 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"279 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "280 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"280 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "281 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"281 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "282 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"282 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "283 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"283 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "284 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"284 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "285 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"285 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "286 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"286 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "287 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"287 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "288 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"288 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "289 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"289 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "290 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"290 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___1" -> "291 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"290 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[5]/__add___1" -> "320 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"291 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "292 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"292 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "293 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"293 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "294 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"294 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "295 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"295 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/split_0" -> "296 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"295 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/split_0" -> "298 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"295 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/split_0" -> "300 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"296 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_0" -> "297 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"297 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_0" -> "303 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"298 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_1" -> "299 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"299 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_1" -> "302 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"299 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_1" -> "588 /nncf_model_output_12" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"300 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_2" -> "301 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"301 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_2" -> "312 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"301 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_2" -> "589 /nncf_model_output_13" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"302 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/transpose_0" -> "303 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"303 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_0" -> "305 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"304 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/full_0" -> "305 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"305 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__truediv___0" -> "307 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"306 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/full_1" -> "307 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"307 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/where_0" -> "308 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"308 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/__add___0" -> "309 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"309 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/softmax_0" -> "310 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"310 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/type_0" -> "311 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"311 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "312 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"312 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/matmul_1" -> "313 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"313 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/permute_3" -> "314 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"314 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/contiguous_0" -> "315 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"315 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/view_3" -> "316 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"316 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "317 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"317 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "318 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"318 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "319 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"319 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "320 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"320 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___0" -> "321 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"320 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___0" -> "337 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"321 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "322 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"322 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "323 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"323 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "324 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"324 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "325 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"324 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "326 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"324 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "328 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"325 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "332 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"326 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "327 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"327 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "328 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"328 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "329 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"329 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "330 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"330 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "331 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"331 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "332 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"332 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "333 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"333 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "334 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"334 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "335 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"335 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "336 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"336 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "337 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"337 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___1" -> "338 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"337 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[6]/__add___1" -> "367 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"338 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "339 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"339 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "340 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"340 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "341 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"341 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "342 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"342 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/split_0" -> "343 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"342 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/split_0" -> "345 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"342 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/split_0" -> "347 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"343 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_0" -> "344 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"344 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_0" -> "350 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"345 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_1" -> "346 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"346 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_1" -> "349 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"346 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_1" -> "590 /nncf_model_output_14" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"347 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_2" -> "348 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"348 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_2" -> "359 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"348 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_2" -> "591 /nncf_model_output_15" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"349 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/transpose_0" -> "350 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"350 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_0" -> "352 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"351 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/full_0" -> "352 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"352 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__truediv___0" -> "354 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"353 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/full_1" -> "354 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"354 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/where_0" -> "355 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"355 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/__add___0" -> "356 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"356 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/softmax_0" -> "357 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"357 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/type_0" -> "358 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"358 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "359 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"359 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/matmul_1" -> "360 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"360 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/permute_3" -> "361 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"361 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/contiguous_0" -> "362 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"362 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/view_3" -> "363 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"363 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "364 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"364 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "365 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"365 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "366 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"366 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "367 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"367 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___0" -> "368 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"367 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___0" -> "384 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"368 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "369 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"369 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "370 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"370 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "371 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"371 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "372 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"371 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "373 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"371 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "375 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"372 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "379 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"373 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "374 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"374 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "375 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"375 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "376 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"376 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "377 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"377 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "378 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"378 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "379 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"379 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "380 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"380 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "381 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"381 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "382 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"382 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "383 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"383 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "384 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"384 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___1" -> "385 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"384 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[7]/__add___1" -> "414 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"385 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "386 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"386 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "387 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"387 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "388 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"388 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "389 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"389 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/split_0" -> "390 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"389 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/split_0" -> "392 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"389 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/split_0" -> "394 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"390 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_0" -> "391 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"391 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_0" -> "397 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"392 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_1" -> "393 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"393 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_1" -> "396 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"393 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_1" -> "592 /nncf_model_output_16" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"394 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_2" -> "395 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"395 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_2" -> "406 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"395 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_2" -> "593 /nncf_model_output_17" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"396 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/transpose_0" -> "397 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"397 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_0" -> "399 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"398 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/full_0" -> "399 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"399 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__truediv___0" -> "401 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"400 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/full_1" -> "401 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"401 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/where_0" -> "402 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"402 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/__add___0" -> "403 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"403 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/softmax_0" -> "404 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"404 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/type_0" -> "405 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"405 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "406 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"406 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/matmul_1" -> "407 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"407 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/permute_3" -> "408 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"408 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/contiguous_0" -> "409 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"409 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/view_3" -> "410 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"410 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "411 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"411 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "412 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"412 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "413 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"413 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "414 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"414 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___0" -> "415 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"414 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___0" -> "431 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"415 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "416 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"416 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "417 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"417 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "418 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"418 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "419 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"418 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "420 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"418 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "422 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"419 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "426 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"420 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "421 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"421 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "422 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"422 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "423 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"423 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "424 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"424 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "425 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"425 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "426 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"426 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "427 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"427 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "428 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"428 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "429 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"429 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "430 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"430 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "431 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"431 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___1" -> "432 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"431 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[8]/__add___1" -> "461 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"432 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "433 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"433 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "434 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"434 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "435 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"435 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "436 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"436 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/split_0" -> "437 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"436 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/split_0" -> "439 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"436 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/split_0" -> "441 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"437 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_0" -> "438 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"438 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_0" -> "444 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"439 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_1" -> "440 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"440 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_1" -> "443 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"440 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_1" -> "594 /nncf_model_output_18" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"441 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_2" -> "442 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"442 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_2" -> "453 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"442 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_2" -> "595 /nncf_model_output_19" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"443 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/transpose_0" -> "444 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"444 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_0" -> "446 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"445 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/full_0" -> "446 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"446 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__truediv___0" -> "448 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"447 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/full_1" -> "448 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"448 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/where_0" -> "449 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"449 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/__add___0" -> "450 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"450 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/softmax_0" -> "451 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"451 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/type_0" -> "452 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"452 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "453 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"453 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/matmul_1" -> "454 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"454 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/permute_3" -> "455 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"455 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/contiguous_0" -> "456 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"456 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/view_3" -> "457 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"457 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "458 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"458 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "459 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"459 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "460 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"460 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "461 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"461 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___0" -> "462 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"461 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___0" -> "478 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"462 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "463 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"463 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "464 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"464 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "465 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"465 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "466 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"465 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "467 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"465 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "469 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"466 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "473 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"467 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "468 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"468 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "469 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"469 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "470 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"470 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "471 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"471 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "472 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"472 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "473 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"473 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "474 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"474 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "475 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"475 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "476 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"476 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "477 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"477 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "478 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"478 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___1" -> "479 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"478 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[9]/__add___1" -> "508 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"479 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "480 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"480 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "481 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"481 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "482 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"482 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "483 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"483 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/split_0" -> "484 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"483 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/split_0" -> "486 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"483 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/split_0" -> "488 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"484 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_0" -> "485 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"485 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_0" -> "491 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"486 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_1" -> "487 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"487 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_1" -> "490 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"487 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_1" -> "596 /nncf_model_output_20" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"488 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_2" -> "489 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"489 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_2" -> "500 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"489 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_2" -> "597 /nncf_model_output_21" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"490 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/transpose_0" -> "491 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"491 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_0" -> "493 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"492 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/full_0" -> "493 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"493 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__truediv___0" -> "495 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"494 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/full_1" -> "495 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"495 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/where_0" -> "496 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"496 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/__add___0" -> "497 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"497 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/softmax_0" -> "498 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"498 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/type_0" -> "499 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"499 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "500 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"500 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/matmul_1" -> "501 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"501 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/permute_3" -> "502 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"502 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/contiguous_0" -> "503 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"503 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/view_3" -> "504 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"504 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "505 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"505 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "506 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"506 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "507 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"507 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "508 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"508 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___0" -> "509 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"508 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___0" -> "525 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"509 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "510 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"510 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "511 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"511 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "512 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"512 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "513 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"512 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "514 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"512 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "516 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"513 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "520 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"514 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "515 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"515 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "516 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"516 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "517 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"517 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "518 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"518 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "519 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"519 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "520 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"520 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "521 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"521 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "522 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"522 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "523 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"523 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "524 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"524 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "525 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"525 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___1" -> "526 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_1]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"525 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[10]/__add___1" -> "555 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___0" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"526 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_1]/layer_norm_0" -> "527 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"527 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_0" -> "528 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"528 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/addmm_0" -> "529 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" [label="(8192, 2304) \n0 -> 0", style=solid];
"529 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_attn]/view_1" -> "530 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/split_0" [label="(8, 1024, 2304) \n0 -> 0", style=solid];
"530 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/split_0" -> "531 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"530 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/split_0" -> "533 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_1" [label="(8, 1024, 768) \n1 -> 0", style=solid];
"530 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/split_0" -> "535 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_2" [label="(8, 1024, 768) \n2 -> 0", style=solid];
"531 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_0" -> "532 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"532 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_0" -> "538 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"533 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_1" -> "534 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_1" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"534 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_1" -> "537 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/transpose_0" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"534 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_1" -> "598 /nncf_model_output_22" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"535 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_2" -> "536 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_2" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"536 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_2" -> "547 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 64) \n0 -> 1", style=solid];
"536 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_2" -> "599 /nncf_model_output_23" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"537 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/transpose_0" -> "538 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_0" [label="(8, 12, 64, 1024) \n0 -> 1", style=solid];
"538 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_0" -> "540 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__truediv___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"539 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/full_0" -> "540 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__truediv___0" [label="() \n0 -> 1", style=solid];
"540 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__truediv___0" -> "542 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/where_0" [label="(8, 12, 1024, 1024) \n0 -> 1", style=solid];
"541 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/full_1" -> "542 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/where_0" [label="() \n0 -> 2", style=solid];
"542 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/where_0" -> "543 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__add___0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"543 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/__add___0" -> "544 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/softmax_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"544 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/softmax_0" -> "545 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/type_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"545 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/type_0" -> "546 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"546 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[attn_dropout]/dropout_0" -> "547 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_1" [label="(8, 12, 1024, 1024) \n0 -> 0", style=solid];
"547 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/matmul_1" -> "548 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_3" [label="(8, 12, 1024, 64) \n0 -> 0", style=solid];
"548 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/permute_3" -> "549 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/contiguous_0" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"549 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/contiguous_0" -> "550 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_3" [label="(8, 1024, 12, 64) \n0 -> 0", style=solid];
"550 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/view_3" -> "551 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"551 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_0" -> "552 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"552 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/addmm_0" -> "553 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"553 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Conv1D[c_proj]/view_1" -> "554 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"554 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2Attention[attn]/Dropout[resid_dropout]/dropout_0" -> "555 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"555 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___0" -> "556 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_2]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"555 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___0" -> "572 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___1" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"556 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/NNCFLayerNorm[ln_2]/layer_norm_0" -> "557 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"557 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_0" -> "558 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" [label="(8192, 768) \n0 -> 1", style=solid];
"558 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/addmm_0" -> "559 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" [label="(8192, 3072) \n0 -> 0", style=solid];
"559 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "560 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"559 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "561 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"559 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_fc]/view_1" -> "563 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"560 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___0" -> "567 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"561 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/pow_0" -> "562 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"562 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___1" -> "563 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"563 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__add___0" -> "564 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"564 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__rmul___2" -> "565 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"565 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/tanh_0" -> "566 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"566 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__radd___0" -> "567 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" [label="(8, 1024, 3072) \n0 -> 1", style=solid];
"567 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/NewGELUActivation[act]/__mul___0" -> "568 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" [label="(8, 1024, 3072) \n0 -> 0", style=solid];
"568 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_0" -> "569 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" [label="(8192, 3072) \n0 -> 1", style=solid];
"569 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/addmm_0" -> "570 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" [label="(8192, 768) \n0 -> 0", style=solid];
"570 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Conv1D[c_proj]/view_1" -> "571 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"571 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/GPT2MLP[mlp]/Dropout[dropout]/dropout_0" -> "572 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___1" [label="(8, 1024, 768) \n0 -> 1", style=solid];
"572 GPT2LMHeadModel/GPT2Model[transformer]/ModuleList[h]/GPT2Block[11]/__add___1" -> "573 GPT2LMHeadModel/GPT2Model[transformer]/NNCFLayerNorm[ln_f]/layer_norm_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"573 GPT2LMHeadModel/GPT2Model[transformer]/NNCFLayerNorm[ln_f]/layer_norm_0" -> "574 GPT2LMHeadModel/GPT2Model[transformer]/view_2" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"574 GPT2LMHeadModel/GPT2Model[transformer]/view_2" -> "575 GPT2LMHeadModel/NNCFLinear[lm_head]/linear_0" [label="(8, 1024, 768) \n0 -> 0", style=solid];
"575 GPT2LMHeadModel/NNCFLinear[lm_head]/linear_0" -> "600 /nncf_model_output_24" [label="(8, 1024, 50257) \n0 -> 0", style=solid];
}