|
32 | 32 | {
|
33 | 33 | "cell_type": "code",
|
34 | 34 | "execution_count": null,
|
35 |
| - "metadata": { |
36 |
| - "execution": { |
37 |
| - "iopub.execute_input": "2024-11-07T18:44:42.063503Z", |
38 |
| - "iopub.status.busy": "2024-11-07T18:44:42.063379Z", |
39 |
| - "iopub.status.idle": "2024-11-07T18:45:07.255300Z", |
40 |
| - "shell.execute_reply": "2024-11-07T18:45:07.254547Z" |
41 |
| - } |
42 |
| - }, |
| 35 | + "metadata": {}, |
43 | 36 | "outputs": [],
|
44 | 37 | "source": [
|
45 | 38 | "from sglang.utils import (\n",
|
|
71 | 64 | {
|
72 | 65 | "cell_type": "code",
|
73 | 66 | "execution_count": null,
|
74 |
| - "metadata": { |
75 |
| - "execution": { |
76 |
| - "iopub.execute_input": "2024-11-07T18:45:07.258292Z", |
77 |
| - "iopub.status.busy": "2024-11-07T18:45:07.257710Z", |
78 |
| - "iopub.status.idle": "2024-11-07T18:45:07.611559Z", |
79 |
| - "shell.execute_reply": "2024-11-07T18:45:07.610842Z" |
80 |
| - } |
81 |
| - }, |
| 67 | + "metadata": {}, |
82 | 68 | "outputs": [],
|
83 | 69 | "source": [
|
84 | 70 | "url = \"http://localhost:30010/generate\"\n",
|
|
99 | 85 | {
|
100 | 86 | "cell_type": "code",
|
101 | 87 | "execution_count": null,
|
102 |
| - "metadata": { |
103 |
| - "execution": { |
104 |
| - "iopub.execute_input": "2024-11-07T18:45:07.613911Z", |
105 |
| - "iopub.status.busy": "2024-11-07T18:45:07.613746Z", |
106 |
| - "iopub.status.idle": "2024-11-07T18:45:07.620286Z", |
107 |
| - "shell.execute_reply": "2024-11-07T18:45:07.619779Z" |
108 |
| - } |
109 |
| - }, |
| 88 | + "metadata": {}, |
110 | 89 | "outputs": [],
|
111 | 90 | "source": [
|
112 | 91 | "url = \"http://localhost:30010/get_server_args\"\n",
|
|
130 | 109 | {
|
131 | 110 | "cell_type": "code",
|
132 | 111 | "execution_count": null,
|
133 |
| - "metadata": { |
134 |
| - "execution": { |
135 |
| - "iopub.execute_input": "2024-11-07T18:45:07.622407Z", |
136 |
| - "iopub.status.busy": "2024-11-07T18:45:07.622267Z", |
137 |
| - "iopub.status.idle": "2024-11-07T18:45:07.628290Z", |
138 |
| - "shell.execute_reply": "2024-11-07T18:45:07.627793Z" |
139 |
| - } |
140 |
| - }, |
| 112 | + "metadata": {}, |
141 | 113 | "outputs": [],
|
142 | 114 | "source": [
|
143 | 115 | "url = \"http://localhost:30010/get_model_info\"\n",
|
|
162 | 134 | {
|
163 | 135 | "cell_type": "code",
|
164 | 136 | "execution_count": null,
|
165 |
| - "metadata": { |
166 |
| - "execution": { |
167 |
| - "iopub.execute_input": "2024-11-07T18:45:07.630585Z", |
168 |
| - "iopub.status.busy": "2024-11-07T18:45:07.630235Z", |
169 |
| - "iopub.status.idle": "2024-11-07T18:45:07.643498Z", |
170 |
| - "shell.execute_reply": "2024-11-07T18:45:07.643007Z" |
171 |
| - } |
172 |
| - }, |
| 137 | + "metadata": {}, |
173 | 138 | "outputs": [],
|
174 | 139 | "source": [
|
175 | 140 | "url = \"http://localhost:30010/health_generate\"\n",
|
|
181 | 146 | {
|
182 | 147 | "cell_type": "code",
|
183 | 148 | "execution_count": null,
|
184 |
| - "metadata": { |
185 |
| - "execution": { |
186 |
| - "iopub.execute_input": "2024-11-07T18:45:07.645336Z", |
187 |
| - "iopub.status.busy": "2024-11-07T18:45:07.645196Z", |
188 |
| - "iopub.status.idle": "2024-11-07T18:45:07.650363Z", |
189 |
| - "shell.execute_reply": "2024-11-07T18:45:07.649837Z" |
190 |
| - } |
191 |
| - }, |
| 149 | + "metadata": {}, |
192 | 150 | "outputs": [],
|
193 | 151 | "source": [
|
194 | 152 | "url = \"http://localhost:30010/health\"\n",
|
|
209 | 167 | {
|
210 | 168 | "cell_type": "code",
|
211 | 169 | "execution_count": null,
|
212 |
| - "metadata": { |
213 |
| - "execution": { |
214 |
| - "iopub.execute_input": "2024-11-07T18:45:07.652212Z", |
215 |
| - "iopub.status.busy": "2024-11-07T18:45:07.652076Z", |
216 |
| - "iopub.status.idle": "2024-11-07T18:45:07.658633Z", |
217 |
| - "shell.execute_reply": "2024-11-07T18:45:07.658119Z" |
218 |
| - } |
219 |
| - }, |
| 170 | + "metadata": {}, |
220 | 171 | "outputs": [],
|
221 | 172 | "source": [
|
222 | 173 | "# flush cache\n",
|
|
239 | 190 | {
|
240 | 191 | "cell_type": "code",
|
241 | 192 | "execution_count": null,
|
242 |
| - "metadata": { |
243 |
| - "execution": { |
244 |
| - "iopub.execute_input": "2024-11-07T18:45:07.660468Z", |
245 |
| - "iopub.status.busy": "2024-11-07T18:45:07.660325Z", |
246 |
| - "iopub.status.idle": "2024-11-07T18:45:07.666476Z", |
247 |
| - "shell.execute_reply": "2024-11-07T18:45:07.665984Z" |
248 |
| - } |
249 |
| - }, |
| 193 | + "metadata": {}, |
250 | 194 | "outputs": [],
|
251 | 195 | "source": [
|
252 | 196 | "# get_memory_pool_size\n",
|
|
269 | 213 | {
|
270 | 214 | "cell_type": "code",
|
271 | 215 | "execution_count": null,
|
272 |
| - "metadata": { |
273 |
| - "execution": { |
274 |
| - "iopub.execute_input": "2024-11-07T18:45:07.668242Z", |
275 |
| - "iopub.status.busy": "2024-11-07T18:45:07.668108Z", |
276 |
| - "iopub.status.idle": "2024-11-07T18:45:08.725709Z", |
277 |
| - "shell.execute_reply": "2024-11-07T18:45:08.725021Z" |
278 |
| - } |
279 |
| - }, |
| 216 | + "metadata": {}, |
280 | 217 | "outputs": [],
|
281 | 218 | "source": [
|
282 | 219 | "# successful update with same architecture and size\n",
|
|
294 | 231 | {
|
295 | 232 | "cell_type": "code",
|
296 | 233 | "execution_count": null,
|
297 |
| - "metadata": { |
298 |
| - "execution": { |
299 |
| - "iopub.execute_input": "2024-11-07T18:45:08.727865Z", |
300 |
| - "iopub.status.busy": "2024-11-07T18:45:08.727721Z", |
301 |
| - "iopub.status.idle": "2024-11-07T18:45:11.165841Z", |
302 |
| - "shell.execute_reply": "2024-11-07T18:45:11.165282Z" |
303 |
| - } |
304 |
| - }, |
| 234 | + "metadata": {}, |
305 | 235 | "outputs": [],
|
306 | 236 | "source": [
|
307 | 237 | "# failed update with different parameter size\n",
|
|
333 | 263 | {
|
334 | 264 | "cell_type": "code",
|
335 | 265 | "execution_count": null,
|
336 |
| - "metadata": { |
337 |
| - "execution": { |
338 |
| - "iopub.execute_input": "2024-11-07T18:45:11.167853Z", |
339 |
| - "iopub.status.busy": "2024-11-07T18:45:11.167711Z", |
340 |
| - "iopub.status.idle": "2024-11-07T18:45:39.542988Z", |
341 |
| - "shell.execute_reply": "2024-11-07T18:45:39.542135Z" |
342 |
| - } |
343 |
| - }, |
| 266 | + "metadata": {}, |
344 | 267 | "outputs": [],
|
345 | 268 | "source": [
|
346 | 269 | "terminate_process(server_process)\n",
|
|
358 | 281 | {
|
359 | 282 | "cell_type": "code",
|
360 | 283 | "execution_count": null,
|
361 |
| - "metadata": { |
362 |
| - "execution": { |
363 |
| - "iopub.execute_input": "2024-11-07T18:45:39.545416Z", |
364 |
| - "iopub.status.busy": "2024-11-07T18:45:39.545005Z", |
365 |
| - "iopub.status.idle": "2024-11-07T18:45:39.588793Z", |
366 |
| - "shell.execute_reply": "2024-11-07T18:45:39.588054Z" |
367 |
| - } |
368 |
| - }, |
| 284 | + "metadata": {}, |
369 | 285 | "outputs": [],
|
370 | 286 | "source": [
|
371 | 287 | "# successful encode for embedding model\n",
|
|
390 | 306 | {
|
391 | 307 | "cell_type": "code",
|
392 | 308 | "execution_count": null,
|
393 |
| - "metadata": { |
394 |
| - "execution": { |
395 |
| - "iopub.execute_input": "2024-11-07T18:45:39.590729Z", |
396 |
| - "iopub.status.busy": "2024-11-07T18:45:39.590446Z", |
397 |
| - "iopub.status.idle": "2024-11-07T18:45:59.660376Z", |
398 |
| - "shell.execute_reply": "2024-11-07T18:45:59.659992Z" |
399 |
| - } |
400 |
| - }, |
| 309 | + "metadata": {}, |
401 | 310 | "outputs": [],
|
402 | 311 | "source": [
|
403 | 312 | "terminate_process(embedding_process)\n",
|
|
417 | 326 | {
|
418 | 327 | "cell_type": "code",
|
419 | 328 | "execution_count": null,
|
420 |
| - "metadata": { |
421 |
| - "execution": { |
422 |
| - "iopub.execute_input": "2024-11-07T18:45:59.661779Z", |
423 |
| - "iopub.status.busy": "2024-11-07T18:45:59.661641Z", |
424 |
| - "iopub.status.idle": "2024-11-07T18:46:00.475726Z", |
425 |
| - "shell.execute_reply": "2024-11-07T18:46:00.475269Z" |
426 |
| - } |
427 |
| - }, |
| 329 | + "metadata": {}, |
428 | 330 | "outputs": [],
|
429 | 331 | "source": [
|
430 | 332 | "from transformers import AutoTokenizer\n",
|
|
454 | 356 | },
|
455 | 357 | {
|
456 | 358 | "cell_type": "code",
|
457 |
| - "execution_count": 15, |
458 |
| - "metadata": { |
459 |
| - "execution": { |
460 |
| - "iopub.execute_input": "2024-11-07T18:46:00.477283Z", |
461 |
| - "iopub.status.busy": "2024-11-07T18:46:00.477025Z", |
462 |
| - "iopub.status.idle": "2024-11-07T18:46:00.525758Z", |
463 |
| - "shell.execute_reply": "2024-11-07T18:46:00.525236Z" |
464 |
| - } |
465 |
| - }, |
| 359 | + "execution_count": null, |
| 360 | + "metadata": {}, |
466 | 361 | "outputs": [],
|
467 | 362 | "source": [
|
468 | 363 | "terminate_process(reward_process)"
|
469 | 364 | ]
|
470 | 365 | }
|
471 | 366 | ],
|
472 | 367 | "metadata": {
|
473 |
| - "kernelspec": { |
474 |
| - "display_name": "AlphaMeemory", |
475 |
| - "language": "python", |
476 |
| - "name": "python3" |
477 |
| - }, |
478 | 368 | "language_info": {
|
479 | 369 | "codemirror_mode": {
|
480 | 370 | "name": "ipython",
|
|
484 | 374 | "mimetype": "text/x-python",
|
485 | 375 | "name": "python",
|
486 | 376 | "nbconvert_exporter": "python",
|
487 |
| - "pygments_lexer": "ipython3", |
488 |
| - "version": "3.11.7" |
| 377 | + "pygments_lexer": "ipython3" |
489 | 378 | }
|
490 | 379 | },
|
491 | 380 | "nbformat": 4,
|
|
0 commit comments