We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a09ee0b commit 19ef7e2 Copy full SHA for 19ef7e2
inference/generativeai/llm-workshop/deploy-V7-lmi/llama2_70b_lmi_v7.ipynb
@@ -242,9 +242,9 @@
242
"%%writefile ./code_llama2/serving.properties\n",
243
"engine = MPI\n",
244
"option.model_id = {{s3url}}\n",
245
- "option.task = text - generation\n",
+ "option.task = text-generation\n",
246
"option.tensor_parallel_degree = 8\n",
247
- "option.rolling_batch = lmi - dist\n",
+ "option.rolling_batch = lmi-dist\n",
248
"option.output_formatter = json\n",
249
"option.max_rolling_batch_size = 64\n",
250
"option.model_loading_timeout = 3600"
0 commit comments