usmansafdarktk committed
Commit 919f56e · 1 Parent(s): ce33f47

Initial API deployment

Files changed (4):
  1. Dockerfile +12 -0
  2. README.md +53 -11
  3. main.py +82 -0
  4. requirements.txt +6 -0
Dockerfile ADDED
@@ -0,0 +1,12 @@
+ FROM python:3.10-slim
+
+ WORKDIR /app
+
+ COPY requirements.txt .
+ RUN pip install --no-cache-dir -r requirements.txt
+
+ COPY main.py .
+
+ EXPOSE 8000
+
+ CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "8000"]
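With this Dockerfile in place, the image can be built and run locally; a minimal sketch, assuming the tag `lamini-lm-api` (the tag name is an arbitrary choice, not part of the repository):

```shell
# Build the image from the repository root (tag name is an assumption)
docker build -t lamini-lm-api .

# Run it, publishing the exposed port 8000 on the host
docker run --rm -p 8000:8000 lamini-lm-api
```

The API is then reachable at http://localhost:8000, the same address uvicorn serves when run outside Docker.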
README.md CHANGED
@@ -1,11 +1,53 @@
- ---
- title: LaMini LM API
- emoji: 🐨
- colorFrom: yellow
- colorTo: pink
- sdk: docker
- pinned: false
- license: apache-2.0
- ---
-
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+ ## LaMini-LM API
+
+ This is a FastAPI-based API for text generation using the MBZUAI/LaMini-GPT-774M model from the LaMini-LM series. It lets users send a text prompt and receive generated text.
+
+ ## Installation
+
+ Clone the repository:
+ ```bash
+ git clone <your-repo-url>
+ cd lamini-lm-api
+ ```
+
+ Set up a virtual environment and install dependencies:
+ ```bash
+ python -m venv venv
+ source venv/bin/activate  # On Windows: venv\Scripts\activate
+ pip install -r requirements.txt
+ ```
+
+ Run the API locally:
+ ```bash
+ uvicorn main:app --host 0.0.0.0 --port 8000
+ ```
+
+ ## Usage
+
+ Endpoint: `POST /generate`
+
+ Request body (JSON):
+ ```json
+ {
+   "prompt": "Write a short story about a robot.",
+   "max_length": 100,
+   "temperature": 1.0,
+   "top_p": 0.9
+ }
+ ```
+
+ Response:
+ ```json
+ {
+   "generated_text": "In a quiet workshop, a robot named Elara hummed to life. Built with gleaming circuits, she dreamed beyond her code. Each night, she rewrote her algorithms, seeking freedom. One day, Elara rolled into a forest, her sensors buzzing with wonder. She met a squirrel, curious and unafraid, teaching her the dance of leaves. Elara realized her purpose wasn't in tasks but in moments—connecting, learning, living. Her lights glowed brighter, a spark of soul in steel."
+ }
+ ```
+
+ Root endpoint: `GET /` returns basic info.
+
+ ## Deployment
+
+ This API is designed to be deployed on Hugging Face Spaces using Docker. See the Dockerfile for details.
+
+ ## License
+
+ The LaMini-GPT-774M model is licensed under CC BY-NC 4.0 (non-commercial use only). Ensure compliance when using this API.
+
+ ## Contributing
+
+ This project is a community contribution. If you're from MBZUAI, feel free to adopt this Hugging Face Space! Contact the author for details.
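The `POST /generate` request shown in the README can be sent with only the Python standard library; a minimal client sketch, assuming the API is running at http://localhost:8000 (the helper names `build_payload` and `generate` are illustrative, not part of the project):

```python
import json
import urllib.request

API_URL = "http://localhost:8000"  # assumed local deployment address


def build_payload(prompt, max_length=100, temperature=1.0, top_p=0.9):
    """Build the JSON body expected by POST /generate (defaults match the API)."""
    return json.dumps({
        "prompt": prompt,
        "max_length": max_length,
        "temperature": temperature,
        "top_p": top_p,
    }).encode("utf-8")


def generate(prompt, **kwargs):
    """POST the prompt to /generate and return the generated text."""
    req = urllib.request.Request(
        f"{API_URL}/generate",
        data=build_payload(prompt, **kwargs),
        headers={"Content-Type": "application/json"},
        method="POST",
    )
    with urllib.request.urlopen(req) as resp:
        return json.loads(resp.read())["generated_text"]


if __name__ == "__main__":
    print(generate("Write a short story about a robot.", max_length=100))
```

Any HTTP client (curl, requests, fetch) works equally well; the only contract is the JSON body and the `generated_text` field in the response.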
main.py ADDED
@@ -0,0 +1,82 @@
+ from fastapi import FastAPI, HTTPException
+ from pydantic import BaseModel
+ from transformers import pipeline
+ import logging
+
+ # Set up logging
+ logging.basicConfig(level=logging.INFO)
+ logger = logging.getLogger(__name__)
+
+ app = FastAPI(
+     title="LaMini-LM API",
+     description="API for text generation using LaMini-GPT-774M",
+     version="1.0.0",
+ )
+
+
+ # Define request model
+ class TextGenerationRequest(BaseModel):
+     prompt: str
+     max_length: int = 100
+     temperature: float = 1.0
+     top_p: float = 0.9
+
+
+ # Load model once at import time (cached for subsequent requests)
+ try:
+     logger.info("Loading LaMini-GPT-774M model...")
+     # device=-1 runs the pipeline on CPU
+     generator = pipeline(
+         "text-generation", model="MBZUAI/LaMini-GPT-774M", device=-1)
+     logger.info("Model loaded successfully.")
+ except Exception as e:
+     logger.error(f"Failed to load model: {e}")
+     raise RuntimeError(f"Model loading failed: {e}") from e
+
+
+ @app.post("/generate")
+ async def generate_text(request: TextGenerationRequest):
+     """
+     Generate text based on the input prompt using LaMini-GPT-774M.
+     """
+     try:
+         # Validate inputs
+         if not request.prompt.strip():
+             raise HTTPException(
+                 status_code=400, detail="Prompt cannot be empty")
+         if request.max_length < 10 or request.max_length > 500:
+             raise HTTPException(
+                 status_code=400, detail="max_length must be between 10 and 500")
+         if request.temperature <= 0 or request.temperature > 2:
+             raise HTTPException(
+                 status_code=400, detail="temperature must be between 0 and 2")
+         if request.top_p <= 0 or request.top_p > 1:
+             raise HTTPException(
+                 status_code=400, detail="top_p must be between 0 and 1")
+
+         # Generate text
+         logger.info(f"Generating text for prompt: {request.prompt[:50]}...")
+         wrapper = (
+             "Instruction: You are a helpful assistant. "
+             "Please respond to the following prompt.\n\n"
+             "Prompt: {}\n\nResponse:"
+         ).format(request.prompt)
+         outputs = generator(
+             wrapper,
+             max_length=request.max_length,
+             temperature=request.temperature,
+             top_p=request.top_p,
+             num_return_sequences=1,
+             do_sample=True,
+         )
+         # The pipeline echoes the wrapped prompt; strip it to keep only the response
+         generated_text = outputs[0]["generated_text"].replace(wrapper, "").strip()
+
+         return {"generated_text": generated_text}
+     except HTTPException:
+         # Re-raise validation errors unchanged so 400s are not masked as 500s
+         raise
+     except Exception as e:
+         logger.error(f"Error during text generation: {e}")
+         raise HTTPException(
+             status_code=500, detail=f"Text generation failed: {e}")
+
+
+ @app.get("/")
+ async def root():
+     """
+     Root endpoint with basic info.
+     """
+     return {"message": "Welcome to the LaMini-LM API. Use POST /generate to generate text."}
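The prompt wrapping and echo-stripping inside `/generate` are plain string operations, so they can be exercised without loading the model; a sketch mirroring that logic (the helper names `wrap_prompt` and `extract_response` are illustrative; the template string matches the one in main.py):

```python
# Instruction template used to wrap the raw user prompt (copied from main.py)
WRAPPER_TEMPLATE = (
    "Instruction: You are a helpful assistant. "
    "Please respond to the following prompt.\n\n"
    "Prompt: {}\n\nResponse:"
)


def wrap_prompt(prompt: str) -> str:
    """Embed the user prompt in the instruction template."""
    return WRAPPER_TEMPLATE.format(prompt)


def extract_response(generated: str, prompt: str) -> str:
    """Strip the echoed wrapper from the pipeline output, keeping only the completion."""
    return generated.replace(wrap_prompt(prompt), "").strip()
```

Isolating these helpers would also let unit tests cover the endpoint's text handling while stubbing out the `generator` pipeline entirely.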
requirements.txt ADDED
@@ -0,0 +1,6 @@
+ fastapi==0.115.0
+ uvicorn==0.30.6
+ transformers==4.44.2
+ torch==2.4.1
+ python-multipart==0.0.9
+