Update __main__.py

Smartappli · web-flow · commit 690aaa111ad5 · 2024-05-04T01:05:48.000+02:00
diff --git a/llama_cpp/server/__main__.py b/llama_cpp/server/__main__.py
@@ -1,23 +1,20 @@
-"""llama-cpp-python server from scratch in a single file.
+"""Example FastAPI server for llama.cpp.
+To run this example:
+```bash
+pip install fastapi uvicorn sse-starlette pydantic-settings
+export MODEL=../models/7B/...
+```
+Then run:
+```
+uvicorn llama_cpp.server.app:create_app --reload
+```
+or
+```
+python3 -m llama_cpp.server
+```
+Then visit http://localhost:8000/docs to see the interactive API docs.
 """
 
-# import llama_cpp
-
-# path = b"../../models/Qwen1.5-0.5B-Chat-GGUF/qwen1_5-0_5b-chat-q8_0.gguf"
-
-# model_params = llama_cpp.llama_model_default_params()
-# model = llama_cpp.llama_load_model_from_file(path, model_params)
-
-# if model is None:
-#     raise RuntimeError(f"Failed to load model from file: {path}")
-
-
-# ctx_params = llama_cpp.llama_context_default_params()
-# ctx = llama_cpp.llama_new_context_with_model(model, ctx_params)
-
-# if ctx is None:
-#     raise RuntimeError("Failed to create context")
-
 
 from __future__ import annotations