From bf6645168a6754711f065c7fc844e3dd88037894 Mon Sep 17 00:00:00 2001 From: Yuyan Peng Date: Fri, 17 Jan 2025 06:42:42 +0000 Subject: [PATCH] Fix instruction for serving trillium Mixtral 8x22B model Remove the extra space that causes command errors when copying. --- Serving/Trillium/JetStream-Maxtext/Mixtral-8X22B/README.md | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/Serving/Trillium/JetStream-Maxtext/Mixtral-8X22B/README.md b/Serving/Trillium/JetStream-Maxtext/Mixtral-8X22B/README.md index cd544e3..789a657 100644 --- a/Serving/Trillium/JetStream-Maxtext/Mixtral-8X22B/README.md +++ b/Serving/Trillium/JetStream-Maxtext/Mixtral-8X22B/README.md @@ -63,7 +63,8 @@ python MaxText/maxengine_server.py \ scan_layers=${SCAN_LAYERS} \ weight_dtype=${WEIGHT_DTYPE} \ per_device_batch_size=${PER_DEVICE_BATCH_SIZE} \ - megablox=False capacity_factor=-1 \ + megablox=False \ + capacity_factor=-1 \ quantization=int8 checkpoint_is_quantized=True \ quantize_kvcache=True ```