Skip to content

Commit 05548d6

Browse files
committed
Updated the llama2-7b and llama2-13b notebooks to use the latest DLC image, i.e., 0.26
1 parent cb9c822 commit 05548d6

File tree

3 files changed

+405
-20
lines changed

3 files changed

+405
-20
lines changed

inference/generativeai/llm-workshop/lab11-llama2/meta-llama-2-13b-lmi.ipynb

Lines changed: 7 additions & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -250,15 +250,13 @@
250250
"source": [
251251
"%%writefile code_llama2_13b_fp16/serving.properties\n",
252252
"engine = MPI\n",
253-
"option.tensor_parallel_degree = 4\n",
253+
"option.tensor_parallel_degree = max\n",
254254
"option.rolling_batch = auto\n",
255-
"option.max_rolling_batch_size = 8\n",
255+
"option.max_rolling_batch_size = 32\n",
256256
"option.model_loading_timeout = 3600\n",
257257
"option.model_id = {{model_id}}\n",
258-
"option.paged_attention = true\n",
259258
"option.trust_remote_code = true\n",
260-
"option.dtype = fp16\n",
261-
"option.enable_streaming=True"
259+
"option.dtype = fp16"
262260
]
263261
},
264262
{
@@ -296,7 +294,7 @@
296294
"outputs": [],
297295
"source": [
298296
"inference_image_uri = image_uris.retrieve(\n",
299-
" framework=\"djl-deepspeed\", region=region, version=\"0.23.0\"\n",
297+
" framework=\"djl-deepspeed\", region=region, version=\"0.26.0\"\n",
300298
")\n",
301299
"print(f\"Image going to be used is ---- > {inference_image_uri}\")"
302300
]
@@ -1134,9 +1132,9 @@
11341132
],
11351133
"instance_type": "ml.t3.medium",
11361134
"kernelspec": {
1137-
"display_name": "Python 3 (PyTorch 2.0.0 Python 3.10 CPU Optimized)",
1135+
"display_name": "conda_pytorch_p310",
11381136
"language": "python",
1139-
"name": "python3__SAGEMAKER_INTERNAL__arn:aws:sagemaker:us-west-2:236514542706:image/pytorch-2.0.0-cpu-py310"
1137+
"name": "conda_pytorch_p310"
11401138
},
11411139
"language_info": {
11421140
"codemirror_mode": {
@@ -1148,7 +1146,7 @@
11481146
"name": "python",
11491147
"nbconvert_exporter": "python",
11501148
"pygments_lexer": "ipython3",
1151-
"version": "3.10.8"
1149+
"version": "3.10.13"
11521150
}
11531151
},
11541152
"nbformat": 4,

0 commit comments

Comments
 (0)