Skip to content

Commit 655080a

Browse files
committed
Update 2025-10-06 04:23:10
1 parent 574073e commit 655080a

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

43 files changed

+5079
-5193
lines changed

_sources/advanced_features/lora.ipynb

Lines changed: 154 additions & 150 deletions
Large diffs are not rendered by default.

_sources/advanced_features/separate_reasoning.ipynb

Lines changed: 103 additions & 113 deletions
Large diffs are not rendered by default.

_sources/advanced_features/speculative_decoding.ipynb

Lines changed: 358 additions & 387 deletions
Large diffs are not rendered by default.

_sources/advanced_features/structured_outputs.ipynb

Lines changed: 141 additions & 140 deletions
Large diffs are not rendered by default.

_sources/advanced_features/structured_outputs_for_reasoning_models.ipynb

Lines changed: 163 additions & 186 deletions
Large diffs are not rendered by default.

_sources/advanced_features/tool_parser.ipynb

Lines changed: 157 additions & 186 deletions
Large diffs are not rendered by default.

_sources/advanced_features/vlm_query.ipynb

Lines changed: 253 additions & 260 deletions
Large diffs are not rendered by default.

_sources/basic_usage/native_api.ipynb

Lines changed: 146 additions & 158 deletions
Large diffs are not rendered by default.

_sources/basic_usage/offline_engine_api.ipynb

Lines changed: 479 additions & 472 deletions
Large diffs are not rendered by default.

_sources/basic_usage/openai_api_completions.ipynb

Lines changed: 75 additions & 51 deletions
Original file line numberDiff line numberDiff line change
@@ -31,10 +31,10 @@
3131
"execution_count": 1,
3232
"metadata": {
3333
"execution": {
34-
"iopub.execute_input": "2025-10-06T03:37:49.994905Z",
35-
"iopub.status.busy": "2025-10-06T03:37:49.994771Z",
36-
"iopub.status.idle": "2025-10-06T03:38:40.631780Z",
37-
"shell.execute_reply": "2025-10-06T03:38:40.631244Z"
34+
"iopub.execute_input": "2025-10-06T04:19:36.335708Z",
35+
"iopub.status.busy": "2025-10-06T04:19:36.335583Z",
36+
"iopub.status.idle": "2025-10-06T04:20:09.614838Z",
37+
"shell.execute_reply": "2025-10-06T04:20:09.614374Z"
3838
}
3939
},
4040
"outputs": [
@@ -86,7 +86,7 @@
8686
"output_type": "stream",
8787
"text": [
8888
"`torch_dtype` is deprecated! Use `dtype` instead!\n",
89-
"[2025-10-06 03:38:25] `torch_dtype` is deprecated! Use `dtype` instead!\n"
89+
"[2025-10-06 04:19:58] `torch_dtype` is deprecated! Use `dtype` instead!\n"
9090
]
9191
},
9292
{
@@ -97,7 +97,7 @@
9797
"[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0\n",
9898
"[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0\n",
9999
"[Gloo] Rank 0 is connected to 0 peer ranks. Expected number of connected peer ranks is : 0\n",
100-
"[2025-10-06 03:38:29] MOE_RUNNER_BACKEND is not initialized, using triton backend\n"
100+
"[2025-10-06 04:20:00] MOE_RUNNER_BACKEND is not initialized, using triton backend\n"
101101
]
102102
},
103103
{
@@ -107,9 +107,9 @@
107107
"\r",
108108
"Loading safetensors checkpoint shards: 0% Completed | 0/1 [00:00<?, ?it/s]\n",
109109
"\r",
110-
"Loading safetensors checkpoint shards: 100% Completed | 1/1 [00:00<00:00, 6.19it/s]\n",
110+
"Loading safetensors checkpoint shards: 100% Completed | 1/1 [00:00<00:00, 5.92it/s]\n",
111111
"\r",
112-
"Loading safetensors checkpoint shards: 100% Completed | 1/1 [00:00<00:00, 6.18it/s]\n",
112+
"Loading safetensors checkpoint shards: 100% Completed | 1/1 [00:00<00:00, 5.91it/s]\n",
113113
"\n"
114114
]
115115
},
@@ -119,26 +119,18 @@
119119
"text": [
120120
"\r",
121121
" 0%| | 0/3 [00:00<?, ?it/s]\r",
122-
"Capturing batches (bs=4 avail_mem=71.53 GB): 0%| | 0/3 [00:00<?, ?it/s]"
122+
"Capturing batches (bs=4 avail_mem=77.03 GB): 0%| | 0/3 [00:00<?, ?it/s]"
123123
]
124124
},
125125
{
126126
"name": "stdout",
127127
"output_type": "stream",
128128
"text": [
129129
"\r",
130-
"Capturing batches (bs=4 avail_mem=71.53 GB): 33%|███▎ | 1/3 [00:00<00:00, 2.84it/s]\r",
131-
"Capturing batches (bs=2 avail_mem=71.46 GB): 33%|███▎ | 1/3 [00:00<00:00, 2.84it/s]"
132-
]
133-
},
134-
{
135-
"name": "stdout",
136-
"output_type": "stream",
137-
"text": [
138-
"\r",
139-
"Capturing batches (bs=2 avail_mem=71.46 GB): 67%|██████▋ | 2/3 [00:00<00:00, 3.80it/s]\r",
140-
"Capturing batches (bs=1 avail_mem=71.46 GB): 67%|██████▋ | 2/3 [00:00<00:00, 3.80it/s]\r",
141-
"Capturing batches (bs=1 avail_mem=71.46 GB): 100%|██████████| 3/3 [00:00<00:00, 5.01it/s]\n"
130+
"Capturing batches (bs=4 avail_mem=77.03 GB): 33%|███▎ | 1/3 [00:00<00:00, 4.52it/s]\r",
131+
"Capturing batches (bs=2 avail_mem=76.97 GB): 33%|███▎ | 1/3 [00:00<00:00, 4.52it/s]\r",
132+
"Capturing batches (bs=1 avail_mem=76.96 GB): 33%|███▎ | 1/3 [00:00<00:00, 4.52it/s]\r",
133+
"Capturing batches (bs=1 avail_mem=76.96 GB): 100%|██████████| 3/3 [00:00<00:00, 10.68it/s]\n"
142134
]
143135
},
144136
{
@@ -157,7 +149,7 @@
157149
"name": "stdout",
158150
"output_type": "stream",
159151
"text": [
160-
"Server started on http://localhost:30884\n"
152+
"Server started on http://localhost:38621\n"
161153
]
162154
}
163155
],
@@ -191,17 +183,17 @@
191183
"execution_count": 2,
192184
"metadata": {
193185
"execution": {
194-
"iopub.execute_input": "2025-10-06T03:38:40.633900Z",
195-
"iopub.status.busy": "2025-10-06T03:38:40.633563Z",
196-
"iopub.status.idle": "2025-10-06T03:38:40.897940Z",
197-
"shell.execute_reply": "2025-10-06T03:38:40.897465Z"
186+
"iopub.execute_input": "2025-10-06T04:20:09.616535Z",
187+
"iopub.status.busy": "2025-10-06T04:20:09.616213Z",
188+
"iopub.status.idle": "2025-10-06T04:20:09.879343Z",
189+
"shell.execute_reply": "2025-10-06T04:20:09.878902Z"
198190
}
199191
},
200192
"outputs": [
201193
{
202194
"data": {
203195
"text/html": [
204-
"<strong style='color: #00008B;'>Response: ChatCompletion(id='1b89b2c731db480b8715ea001e218847', choices=[Choice(finish_reason='stop', index=0, logprobs=None, message=ChatCompletionMessage(content='Sure, here are three countries and their respective capitals:\\n\\n1. **United States** - Washington, D.C.\\n2. **Canada** - Ottawa\\n3. **Australia** - Canberra', refusal=None, role='assistant', annotations=None, audio=None, function_call=None, tool_calls=None, reasoning_content=None), matched_stop=151645)], created=1759721920, model='qwen/qwen2.5-0.5b-instruct', object='chat.completion', service_tier=None, system_fingerprint=None, usage=CompletionUsage(completion_tokens=39, prompt_tokens=37, total_tokens=76, completion_tokens_details=None, prompt_tokens_details=None, reasoning_tokens=0), metadata={'weight_version': 'default'})</strong>"
196+
"<strong style='color: #00008B;'>Response: ChatCompletion(id='0d37bf86176342649a990e275a02c638', choices=[Choice(finish_reason='stop', index=0, logprobs=None, message=ChatCompletionMessage(content='Sure, here are three countries and their respective capitals:\\n\\n1. **United States** - Washington, D.C.\\n2. **Canada** - Ottawa\\n3. **Australia** - Canberra', refusal=None, role='assistant', annotations=None, audio=None, function_call=None, tool_calls=None, reasoning_content=None), matched_stop=151645)], created=1759724409, model='qwen/qwen2.5-0.5b-instruct', object='chat.completion', service_tier=None, system_fingerprint=None, usage=CompletionUsage(completion_tokens=39, prompt_tokens=37, total_tokens=76, completion_tokens_details=None, prompt_tokens_details=None, reasoning_tokens=0), metadata={'weight_version': 'default'})</strong>"
205197
],
206198
"text/plain": [
207199
"<IPython.core.display.HTML object>"
@@ -391,17 +383,17 @@
391383
"execution_count": 3,
392384
"metadata": {
393385
"execution": {
394-
"iopub.execute_input": "2025-10-06T03:38:40.899554Z",
395-
"iopub.status.busy": "2025-10-06T03:38:40.899407Z",
396-
"iopub.status.idle": "2025-10-06T03:38:41.150350Z",
397-
"shell.execute_reply": "2025-10-06T03:38:41.149891Z"
386+
"iopub.execute_input": "2025-10-06T04:20:09.880978Z",
387+
"iopub.status.busy": "2025-10-06T04:20:09.880826Z",
388+
"iopub.status.idle": "2025-10-06T04:20:10.096277Z",
389+
"shell.execute_reply": "2025-10-06T04:20:10.095847Z"
398390
}
399391
},
400392
"outputs": [
401393
{
402394
"data": {
403395
"text/html": [
404-
"<strong style='color: #00008B;'>Ancient Rome was a significant civilization that made significant contributions to human history. Some of their major achievements include:<br><br>1. The construction of the Colosseum, one of the largest amphitheaters in the world, which served as a venue for gladiatorial games and other public spectacles.<br><br>2. The development of Roman law, which established the principles of justice and legal procedures that are still used today.<br><br>3. The invention of the horse-drawn carriage, which allowed for faster transportation and trade.<br><br>4. The construction of aqueducts that provided water to cities and towns, improving living conditions and economic activity.<br><br>5. The</strong>"
396+
"<strong style='color: #00008B;'>The ancient Romans made significant contributions to various fields, including law, philosophy, science, and literature. They are known for their extensive use of the Latin language and their innovative approach to governance. Rome's achievements include the construction of the Colosseum, which was a massive amphitheater that hosted gladiatorial contests and other public spectacles. The Roman Empire, which lasted from the 3rd century BCE to the 4th century CE, is considered one of the most influential empires in history.</strong>"
405397
],
406398
"text/plain": [
407399
"<IPython.core.display.HTML object>"
@@ -450,18 +442,50 @@
450442
"execution_count": 4,
451443
"metadata": {
452444
"execution": {
453-
"iopub.execute_input": "2025-10-06T03:38:41.151833Z",
454-
"iopub.status.busy": "2025-10-06T03:38:41.151685Z",
455-
"iopub.status.idle": "2025-10-06T03:38:41.252737Z",
456-
"shell.execute_reply": "2025-10-06T03:38:41.252288Z"
445+
"iopub.execute_input": "2025-10-06T04:20:10.097679Z",
446+
"iopub.status.busy": "2025-10-06T04:20:10.097535Z",
447+
"iopub.status.idle": "2025-10-06T04:20:10.540590Z",
448+
"shell.execute_reply": "2025-10-06T04:20:10.540114Z"
457449
}
458450
},
459451
"outputs": [
460452
{
461453
"name": "stdout",
462454
"output_type": "stream",
463455
"text": [
464-
"Yes, I am Qwen, a language model created by Alibaba Cloud. My purpose is to assist you with any questions or tasks you may have. If you have any questions or would like to talk about a specific topic, feel free to ask!"
456+
"Yes, \"test\" is a common term used in various contexts to refer to a simulated situation, a set of instructions, or an evaluation of performance. Here are some examples of how \"test\" might be used:\n",
457+
"\n",
458+
"1. In software testing, \"test\" refers to a program that checks for defects in a software system.\n",
459+
"\n",
460+
"2. In a chemistry test, \"test\" refers to the procedure used to determine whether a sample of a compound has reacted with another substance.\n",
461+
"\n",
462+
"3. In a coding test, \"test\" refers to an automated program that runs a program and checks its correctness.\n",
463+
"\n",
464+
"4. In a language learning test, \"test\" refers to a computer program that evaluates a learner's progress in"
465+
]
466+
},
467+
{
468+
"name": "stdout",
469+
"output_type": "stream",
470+
"text": [
471+
" understanding a particular language.\n",
472+
"\n",
473+
"5. In a physical test, \"test\" refers to the process of measuring or assessing something, such as a physical property or performance.\n",
474+
"\n",
475+
"6. In a sports test, \"test\" refers to an official event where athletes compete against each other.\n",
476+
"\n",
477+
"7. In a scientific test, \"test\" refers to a method used to investigate a particular phenomenon or determine the effectiveness of a treatment.\n",
478+
"\n",
479+
"8. In a medical test, \"test\" refers to the examination or diagnostic process to determine the medical condition of a patient.\n",
480+
"\n",
481+
"All of these uses of \"test\" indicate a scenario where a specified action or set of actions is carried out to evaluate or assess"
482+
]
483+
},
484+
{
485+
"name": "stdout",
486+
"output_type": "stream",
487+
"text": [
488+
" a performance or outcome."
465489
]
466490
}
467491
],
@@ -491,17 +515,17 @@
491515
"execution_count": 5,
492516
"metadata": {
493517
"execution": {
494-
"iopub.execute_input": "2025-10-06T03:38:41.254144Z",
495-
"iopub.status.busy": "2025-10-06T03:38:41.254004Z",
496-
"iopub.status.idle": "2025-10-06T03:38:41.404226Z",
497-
"shell.execute_reply": "2025-10-06T03:38:41.403853Z"
518+
"iopub.execute_input": "2025-10-06T04:20:10.542027Z",
519+
"iopub.status.busy": "2025-10-06T04:20:10.541882Z",
520+
"iopub.status.idle": "2025-10-06T04:20:10.698366Z",
521+
"shell.execute_reply": "2025-10-06T04:20:10.697945Z"
498522
}
499523
},
500524
"outputs": [
501525
{
502526
"data": {
503527
"text/html": [
504-
"<strong style='color: #00008B;'>Response: Completion(id='3be3295d77d44db9a1843f154ee197a7', choices=[CompletionChoice(finish_reason='length', index=0, logprobs=None, text=' 1. United States - Washington D.C.\\n2. Canada - Ottawa\\n3. France - Paris\\n4. Germany - Berlin\\n5. Japan - Tokyo\\n6. Italy - Rome\\n7. Spain - Madrid\\n8. United Kingdom - London\\n9. Australia - Canberra\\n10. New Zealand', matched_stop=None)], created=1759721921, model='qwen/qwen2.5-0.5b-instruct', object='text_completion', system_fingerprint=None, usage=CompletionUsage(completion_tokens=64, prompt_tokens=8, total_tokens=72, completion_tokens_details=None, prompt_tokens_details=None, reasoning_tokens=0), metadata={'weight_version': 'default'})</strong>"
528+
"<strong style='color: #00008B;'>Response: Completion(id='6f88b33ba1bc4d8d82b9a15ee30e156b', choices=[CompletionChoice(finish_reason='length', index=0, logprobs=None, text=' 1. United States - Washington D.C.\\n2. Canada - Ottawa\\n3. France - Paris\\n4. Germany - Berlin\\n5. Japan - Tokyo\\n6. Italy - Rome\\n7. Spain - Madrid\\n8. United Kingdom - London\\n9. Australia - Canberra\\n10. New Zealand', matched_stop=None)], created=1759724410, model='qwen/qwen2.5-0.5b-instruct', object='text_completion', system_fingerprint=None, usage=CompletionUsage(completion_tokens=64, prompt_tokens=8, total_tokens=72, completion_tokens_details=None, prompt_tokens_details=None, reasoning_tokens=0), metadata={'weight_version': 'default'})</strong>"
505529
],
506530
"text/plain": [
507531
"<IPython.core.display.HTML object>"
@@ -540,17 +564,17 @@
540564
"execution_count": 6,
541565
"metadata": {
542566
"execution": {
543-
"iopub.execute_input": "2025-10-06T03:38:41.405600Z",
544-
"iopub.status.busy": "2025-10-06T03:38:41.405462Z",
545-
"iopub.status.idle": "2025-10-06T03:38:41.558349Z",
546-
"shell.execute_reply": "2025-10-06T03:38:41.557974Z"
567+
"iopub.execute_input": "2025-10-06T04:20:10.700748Z",
568+
"iopub.status.busy": "2025-10-06T04:20:10.700605Z",
569+
"iopub.status.idle": "2025-10-06T04:20:10.786008Z",
570+
"shell.execute_reply": "2025-10-06T04:20:10.785601Z"
547571
}
548572
},
549573
"outputs": [
550574
{
551575
"data": {
552576
"text/html": [
553-
"<strong style='color: #00008B;'>Response: Completion(id='8061143f030d483183cae76728e120c0', choices=[CompletionChoice(finish_reason='stop', index=0, logprobs=None, text=' Once upon a time, there was a space explorer named Dr. Amelia Hart. She had been on many missions to explore the stars and planets, but never before had she been in space with anyone.', matched_stop='\\n\\n')], created=1759721921, model='qwen/qwen2.5-0.5b-instruct', object='text_completion', system_fingerprint=None, usage=CompletionUsage(completion_tokens=40, prompt_tokens=9, total_tokens=49, completion_tokens_details=None, prompt_tokens_details=None, reasoning_tokens=0), metadata={'weight_version': 'default'})</strong>"
577+
"<strong style='color: #00008B;'>Response: Completion(id='721840baf7824385a71fc9221d73e24e', choices=[CompletionChoice(finish_reason='stop', index=0, logprobs=None, text=' Once upon a time, there was a space explorer named Jack who had always dreamed of exploring the stars. He had heard tales of the vastness of the universe and how it was filled with strange and beautiful wonders.', matched_stop='\\n\\n')], created=1759724410, model='qwen/qwen2.5-0.5b-instruct', object='text_completion', system_fingerprint=None, usage=CompletionUsage(completion_tokens=43, prompt_tokens=9, total_tokens=52, completion_tokens_details=None, prompt_tokens_details=None, reasoning_tokens=0), metadata={'weight_version': 'default'})</strong>"
554578
],
555579
"text/plain": [
556580
"<IPython.core.display.HTML object>"
@@ -591,10 +615,10 @@
591615
"execution_count": 7,
592616
"metadata": {
593617
"execution": {
594-
"iopub.execute_input": "2025-10-06T03:38:41.559683Z",
595-
"iopub.status.busy": "2025-10-06T03:38:41.559549Z",
596-
"iopub.status.idle": "2025-10-06T03:38:41.618507Z",
597-
"shell.execute_reply": "2025-10-06T03:38:41.617987Z"
618+
"iopub.execute_input": "2025-10-06T04:20:10.787486Z",
619+
"iopub.status.busy": "2025-10-06T04:20:10.787351Z",
620+
"iopub.status.idle": "2025-10-06T04:20:10.820339Z",
621+
"shell.execute_reply": "2025-10-06T04:20:10.819713Z"
598622
}
599623
},
600624
"outputs": [],

0 commit comments

Comments
 (0)