karamjotsingh commited on
Commit
8103ccd
·
verified ·
1 Parent(s): b174e81

Upload position_ids_debug.ipynb with huggingface_hub

Browse files
Files changed (1) hide show
  1. position_ids_debug.ipynb +77 -48
position_ids_debug.ipynb CHANGED
@@ -2,23 +2,22 @@
2
  "cells": [
3
  {
4
  "cell_type": "code",
5
- "execution_count": 1,
6
  "id": "6511a91c-ed20-41ff-befb-699bda1912a3",
7
  "metadata": {
8
  "execution": {
9
- "iopub.execute_input": "2026-03-25T05:42:29.023013Z",
10
- "iopub.status.busy": "2026-03-25T05:42:29.022863Z",
11
- "iopub.status.idle": "2026-03-25T05:42:40.880280Z",
12
- "shell.execute_reply": "2026-03-25T05:42:40.879248Z",
13
- "shell.execute_reply.started": "2026-03-25T05:42:29.022998Z"
14
- },
15
- "scrolled": true
16
  },
17
  "outputs": [
18
  {
19
  "data": {
20
  "application/vnd.jupyter.widget-view+json": {
21
- "model_id": "8310548c3b0d460899adcb96ee4af2e1",
22
  "version_major": 2,
23
  "version_minor": 0
24
  },
@@ -32,7 +31,7 @@
32
  {
33
  "data": {
34
  "application/vnd.jupyter.widget-view+json": {
35
- "model_id": "663ea1161c934235a53948b93d224495",
36
  "version_major": 2,
37
  "version_minor": 0
38
  },
@@ -46,7 +45,7 @@
46
  {
47
  "data": {
48
  "application/vnd.jupyter.widget-view+json": {
49
- "model_id": "667df34dda224931ac9ccd442a5d42f0",
50
  "version_major": 2,
51
  "version_minor": 0
52
  },
@@ -79,24 +78,9 @@
79
  " batch 0 (shape: 94):\n",
80
  " t: [0, 1, 2, 3, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 13, 14, 15, 16, 17, 18, 19, 20, 21] \n",
81
  " h: [0, 1, 2, 3, 4, 4, 4, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 5, 5, 5, 5, 5, 6, 6, 6, 6, 6, 6, 6, 6, 6, 7, 7, 7, 7, 7, 7, 7, 7, 7, 8, 8, 8, 8, 8, 8, 8, 8, 8, 9, 9, 9, 9, 9, 9, 9, 9, 9, 10, 10, 10, 10, 10, 10, 10, 10, 10, 11, 11, 11, 11, 11, 11, 11, 11, 11, 12, 12, 12, 12, 12, 12, 12, 12, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21] \n",
82
- " w: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21] \n"
83
- ]
84
- },
85
- {
86
- "ename": "SystemExit",
87
- "evalue": "Debugging: Terminate after 1st decoder saved cos and sin tensors.",
88
- "output_type": "error",
89
- "traceback": [
90
- "An exception has occurred, use %tb to see the full traceback.\n",
91
- "\u001b[31mSystemExit\u001b[39m\u001b[31m:\u001b[39m Debugging: Terminate after 1st decoder saved cos and sin tensors.\n"
92
- ]
93
- },
94
- {
95
- "name": "stderr",
96
- "output_type": "stream",
97
- "text": [
98
- "/home/ubuntu/miniconda3/envs/dc_airnd/lib/python3.12/site-packages/IPython/core/interactiveshell.py:3755: UserWarning: To exit: use 'exit', 'quit', or Ctrl-D.\n",
99
- " warn(\"To exit: use 'exit', 'quit', or Ctrl-D.\", stacklevel=1)\n"
100
  ]
101
  }
102
  ],
@@ -163,11 +147,11 @@
163
  "id": "f45df021-6302-4f47-9e06-8070577885a2",
164
  "metadata": {
165
  "execution": {
166
- "iopub.execute_input": "2026-03-25T04:36:13.766580Z",
167
- "iopub.status.busy": "2026-03-25T04:36:13.766400Z",
168
- "iopub.status.idle": "2026-03-25T04:36:13.770145Z",
169
- "shell.execute_reply": "2026-03-25T04:36:13.769588Z",
170
- "shell.execute_reply.started": "2026-03-25T04:36:13.766563Z"
171
  }
172
  },
173
  "outputs": [
@@ -188,15 +172,15 @@
188
  },
189
  {
190
  "cell_type": "code",
191
- "execution_count": 2,
192
  "id": "504fa71b-42b4-4f53-8988-25fcfba38d13",
193
  "metadata": {
194
  "execution": {
195
- "iopub.execute_input": "2026-03-25T05:43:53.839325Z",
196
- "iopub.status.busy": "2026-03-25T05:43:53.839044Z",
197
- "iopub.status.idle": "2026-03-25T05:43:53.843214Z",
198
- "shell.execute_reply": "2026-03-25T05:43:53.842555Z",
199
- "shell.execute_reply.started": "2026-03-25T05:43:53.839304Z"
200
  }
201
  },
202
  "outputs": [],
@@ -206,15 +190,15 @@
206
  },
207
  {
208
  "cell_type": "code",
209
- "execution_count": 3,
210
  "id": "642d9dcf-e591-4d70-96af-b69bf955d9e1",
211
  "metadata": {
212
  "execution": {
213
- "iopub.execute_input": "2026-03-25T05:43:54.296041Z",
214
- "iopub.status.busy": "2026-03-25T05:43:54.295869Z",
215
- "iopub.status.idle": "2026-03-25T05:43:54.299276Z",
216
- "shell.execute_reply": "2026-03-25T05:43:54.298634Z",
217
- "shell.execute_reply.started": "2026-03-25T05:43:54.296029Z"
218
  }
219
  },
220
  "outputs": [
@@ -224,7 +208,7 @@
224
  "(torch.Size([1, 1, 94, 128]), torch.float16)"
225
  ]
226
  },
227
- "execution_count": 3,
228
  "metadata": {},
229
  "output_type": "execute_result"
230
  }
@@ -235,8 +219,53 @@
235
  },
236
  {
237
  "cell_type": "code",
238
- "execution_count": null,
239
  "id": "f44460e3-58e9-4fd2-898a-06e8a00f9365",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
240
  "metadata": {},
241
  "outputs": [],
242
  "source": []
 
2
  "cells": [
3
  {
4
  "cell_type": "code",
5
+ "execution_count": 3,
6
  "id": "6511a91c-ed20-41ff-befb-699bda1912a3",
7
  "metadata": {
8
  "execution": {
9
+ "iopub.execute_input": "2026-03-25T05:56:03.439346Z",
10
+ "iopub.status.busy": "2026-03-25T05:56:03.439077Z",
11
+ "iopub.status.idle": "2026-03-25T05:56:12.533462Z",
12
+ "shell.execute_reply": "2026-03-25T05:56:12.532731Z",
13
+ "shell.execute_reply.started": "2026-03-25T05:56:03.439327Z"
14
+ }
 
15
  },
16
  "outputs": [
17
  {
18
  "data": {
19
  "application/vnd.jupyter.widget-view+json": {
20
+ "model_id": "4655d86aa4f24755a2a3a230298174ac",
21
  "version_major": 2,
22
  "version_minor": 0
23
  },
 
31
  {
32
  "data": {
33
  "application/vnd.jupyter.widget-view+json": {
34
+ "model_id": "b7f679f3d8a64e01a015d59e7bc7f07e",
35
  "version_major": 2,
36
  "version_minor": 0
37
  },
 
45
  {
46
  "data": {
47
  "application/vnd.jupyter.widget-view+json": {
48
+ "model_id": "1c0c55230de542548486cd47b87fa2a8",
49
  "version_major": 2,
50
  "version_minor": 0
51
  },
 
78
  " batch 0 (shape: 94):\n",
79
  " t: [0, 1, 2, 3, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 13, 14, 15, 16, 17, 18, 19, 20, 21] \n",
80
  " h: [0, 1, 2, 3, 4, 4, 4, 4, 4, 4, 4, 4, 4, 5, 5, 5, 5, 5, 5, 5, 5, 5, 6, 6, 6, 6, 6, 6, 6, 6, 6, 7, 7, 7, 7, 7, 7, 7, 7, 7, 8, 8, 8, 8, 8, 8, 8, 8, 8, 9, 9, 9, 9, 9, 9, 9, 9, 9, 10, 10, 10, 10, 10, 10, 10, 10, 10, 11, 11, 11, 11, 11, 11, 11, 11, 11, 12, 12, 12, 12, 12, 12, 12, 12, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21] \n",
81
+ " w: [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21] \n",
82
+ "\n",
83
+ "Manual Prompt Response: The image shows a black Porsche Panamera parked on a road. The car is positioned at an angle, with the rear of the vehicle facing the camera. The Porsche logo and model name are visible on the trunk. The car has a sleek design with a long hood and short rear deck. The taillights are prominent, and the license plate is clearly visible. The background appears to be a blurred landscape, suggesting motion or a focus on the car itself.\n"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
84
  ]
85
  }
86
  ],
 
147
  "id": "f45df021-6302-4f47-9e06-8070577885a2",
148
  "metadata": {
149
  "execution": {
150
+ "iopub.execute_input": "2026-03-25T05:56:12.534299Z",
151
+ "iopub.status.busy": "2026-03-25T05:56:12.534123Z",
152
+ "iopub.status.idle": "2026-03-25T05:56:12.537469Z",
153
+ "shell.execute_reply": "2026-03-25T05:56:12.536915Z",
154
+ "shell.execute_reply.started": "2026-03-25T05:56:12.534284Z"
155
  }
156
  },
157
  "outputs": [
 
172
  },
173
  {
174
  "cell_type": "code",
175
+ "execution_count": 5,
176
  "id": "504fa71b-42b4-4f53-8988-25fcfba38d13",
177
  "metadata": {
178
  "execution": {
179
+ "iopub.execute_input": "2026-03-25T05:56:12.538139Z",
180
+ "iopub.status.busy": "2026-03-25T05:56:12.537990Z",
181
+ "iopub.status.idle": "2026-03-25T05:56:12.549445Z",
182
+ "shell.execute_reply": "2026-03-25T05:56:12.548820Z",
183
+ "shell.execute_reply.started": "2026-03-25T05:56:12.538125Z"
184
  }
185
  },
186
  "outputs": [],
 
190
  },
191
  {
192
  "cell_type": "code",
193
+ "execution_count": 6,
194
  "id": "642d9dcf-e591-4d70-96af-b69bf955d9e1",
195
  "metadata": {
196
  "execution": {
197
+ "iopub.execute_input": "2026-03-25T05:56:12.549936Z",
198
+ "iopub.status.busy": "2026-03-25T05:56:12.549800Z",
199
+ "iopub.status.idle": "2026-03-25T05:56:12.558625Z",
200
+ "shell.execute_reply": "2026-03-25T05:56:12.557969Z",
201
+ "shell.execute_reply.started": "2026-03-25T05:56:12.549924Z"
202
  }
203
  },
204
  "outputs": [
 
208
  "(torch.Size([1, 1, 94, 128]), torch.float16)"
209
  ]
210
  },
211
+ "execution_count": 6,
212
  "metadata": {},
213
  "output_type": "execute_result"
214
  }
 
219
  },
220
  {
221
  "cell_type": "code",
222
+ "execution_count": 14,
223
  "id": "f44460e3-58e9-4fd2-898a-06e8a00f9365",
224
+ "metadata": {
225
+ "execution": {
226
+ "iopub.execute_input": "2026-03-25T06:04:09.103843Z",
227
+ "iopub.status.busy": "2026-03-25T06:04:09.103513Z",
228
+ "iopub.status.idle": "2026-03-25T06:04:09.110953Z",
229
+ "shell.execute_reply": "2026-03-25T06:04:09.110385Z",
230
+ "shell.execute_reply.started": "2026-03-25T06:04:09.103826Z"
231
+ }
232
+ },
233
+ "outputs": [
234
+ {
235
+ "data": {
236
+ "text/plain": [
237
+ "tensor([[[0.5405, 0.6924, 0.7964, 0.8662, 0.9126, 0.9429, 0.9629, 0.9756,\n",
238
+ " 0.9844, 0.9897, 0.9932, 0.9956, 0.9971, 0.9980, 0.9990, 0.9990,\n",
239
+ " 0.9995, 0.9995, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000,\n",
240
+ " 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000,\n",
241
+ " 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000,\n",
242
+ " 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000,\n",
243
+ " 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000,\n",
244
+ " 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000,\n",
245
+ " 0.5405, 0.6924, 0.7964, 0.8662, 0.9126, 0.9429, 0.9629, 0.9756,\n",
246
+ " 0.9844, 0.9897, 0.9932, 0.9956, 0.9971, 0.9980, 0.9990, 0.9990,\n",
247
+ " 0.9995, 0.9995, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000,\n",
248
+ " 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000,\n",
249
+ " 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000,\n",
250
+ " 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000,\n",
251
+ " 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000,\n",
252
+ " 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000, 1.0000]]],\n",
253
+ " device='cuda:0', dtype=torch.float16)"
254
+ ]
255
+ },
256
+ "execution_count": 14,
257
+ "metadata": {},
258
+ "output_type": "execute_result"
259
+ }
260
+ ],
261
+ "source": [
262
+ "cos[:, :, 1, :]"
263
+ ]
264
+ },
265
+ {
266
+ "cell_type": "code",
267
+ "execution_count": null,
268
+ "id": "039f1456-ffa4-40b2-8ba1-a0cd5f74733e",
269
  "metadata": {},
270
  "outputs": [],
271
  "source": []