Fix Docs CI When Compile Error (#2323)

786be44d · Chayenne · GitHub · 2db44698 · 786be44d · 786be44d
Unverified commit 786be44d, authored Dec 04, 2024 by Chayenne; committed by GitHub Dec 04, 2024
Hide whitespace changes
Inline Side-by-side

Showing with 7 additions and 7 deletions

docs/Makefile +1 -1

docs/backend/native_api.ipynb +5 -5

python/sglang/srt/server.py +1 -1

No files found.
--- a/docs/Makefile
+++ b/docs/Makefile
@@ -19,7 +19,7 @@ compile:
 			echo "Executing $$nb"; \
 			jupyter nbconvert --to notebook --execute --inplace "$$nb" \
 				--ExecutePreprocessor.timeout=600 \
-				--ExecutePreprocessor.kernel_name=python3; \
+				--ExecutePreprocessor.kernel_name=python3 || exit 1; \
 		fi; \
 	done

--- a/docs/backend/native_api.ipynb
+++ b/docs/backend/native_api.ipynb
@@ -220,19 +220,19 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "# failed update with different parameter size\n",
+    "# failed update with different parameter size or wrong name\n",
    "\n",
    "url = \"http://localhost:30010/update_weights_from_disk\"\n",
-    "data = {\"model_path\": \"meta-llama/Llama-3.2-3B\"}\n",
+    "data = {\"model_path\": \"meta-llama/Llama-3.2-1B-wrong\"}\n",
    "\n",
    "response = requests.post(url, json=data)\n",
    "response_json = response.json()\n",
    "print_highlight(response_json)\n",
    "assert response_json[\"success\"] is False\n",
    "assert response_json[\"message\"] == (\n",
-    "    \"Failed to update weights: The size of tensor a (2048) must match \"\n",
+    "    \"Failed to get weights iterator: \"\n",
-    "    \"the size of tensor b (3072) at non-singleton dimension 1.\\n\"\n",
+    "    \"meta-llama/Llama-3.2-1B-wrong\"\n",
-    "    \"Rolling back to original weights.\"\n",
+    "    \" (repository not found).\"\n",
    ")"
   ]
  },

--- a/python/sglang/srt/server.py
+++ b/python/sglang/srt/server.py
@@ -329,7 +329,7 @@ async def encode_request(obj: EmbeddingReqInput, request: Request):
        )
-@app.api_route("/encode", methods=["POST", "PUT"])
+@app.api_route("/classify", methods=["POST", "PUT"])
 @time_func_latency
 async def classify_request(obj: EmbeddingReqInput, request: Request):
    """Handle a reward model request. Now the arguments and return values are the same as embedding models."""