Subodh358 committed on
Commit
a8a3d39
·
verified ·
1 Parent(s): 4b76799

Upload 3 files

Browse files
Files changed (3) hide show
  1. Dockerfile +14 -14
  2. app.py +21 -0
  3. requirements.txt +4 -0
Dockerfile CHANGED
@@ -1,20 +1,20 @@
1
- # Use the official PyTorch image with CUDA support
2
- FROM pytorch/pytorch:2.0.0-cuda11.7-cudnn8-runtime
3
 
4
- # Install git to clone the model repository
5
- RUN apt-get update && apt-get install -y git
6
 
7
- # Install other dependencies
8
- RUN pip install transformers
9
 
10
- # Clone the unsloth/llama-3-8b-bnb-4bit model repository
11
- RUN git clone https://huggingface.co/unsloth/llama-3-8b-bnb-4bit
12
 
13
- # Set the working directory to the model directory
14
- WORKDIR /unsloth/llama-3-8b-bnb-4bit
15
 
16
- # Copy the inference script
17
- COPY inference.py .
18
 
19
- # Run the inference script
20
- CMD ["python", "inference.py"]
 
1
# syntax=docker/dockerfile:1

# Use an official Python runtime as a parent image
FROM python:3.9-slim

# Set the working directory (created automatically if missing)
WORKDIR /app

# Copy only the dependency manifest first so the pip layer below is
# cached until requirements.txt itself changes — copying the whole
# source tree first would reinstall all packages on every code edit.
COPY requirements.txt .

# Install any needed packages specified in requirements.txt
RUN pip install --no-cache-dir -r requirements.txt

# Copy the rest of the application code into the container at /app
COPY . /app

# Make port 80 available to the world outside this container
# (EXPOSE is documentation only; publish with `docker run -p 80:80`)
EXPOSE 80

# Define environment variable — key=value form; the legacy
# space-separated form (`ENV NAME World`) is deprecated
ENV NAME=World

# Run the app under uvicorn when the container launches
# (exec form so uvicorn is PID 1 and receives SIGTERM from `docker stop`)
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "80"]
app.py ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
from fastapi import FastAPI
from transformers import AutoModelForCausalLM, AutoTokenizer
import torch

app = FastAPI()

# Load the model and tokenizer once at module import so every request
# reuses them instead of reloading a multi-GB checkpoint per call.
# NOTE(review): this is a 4-bit bitsandbytes-quantized checkpoint;
# loading it requires the `bitsandbytes` and `accelerate` packages and,
# in practice, a CUDA GPU — confirm the deployment image provides them.
model_name = "unsloth/llama-3-8b-bnb-4bit"
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForCausalLM.from_pretrained(model_name)


@app.get("/")
def read_root():
    """Trivial liveness/hello endpoint."""
    return {"Hello": "World"}


@app.post("/generate/")
def generate(prompt: str):
    """Generate a continuation of `prompt` with the loaded model.

    Args:
        prompt: text to continue (FastAPI query parameter).

    Returns:
        dict with the decoded generation (prompt included) under
        the key "generated_text".
    """
    inputs = tokenizer(prompt, return_tensors="pt")
    # Inference needs no gradients — avoid autograd bookkeeping/memory.
    with torch.no_grad():
        # Pass the attention mask along with input_ids; omitting it
        # forces generate() to infer padding and can produce wrong
        # results (transformers also warns about it).
        # max_length counts prompt tokens too, so a prompt of >=50
        # tokens yields no new text; consider max_new_tokens instead.
        outputs = model.generate(
            inputs["input_ids"],
            attention_mask=inputs.get("attention_mask"),
            max_length=50,
        )
    text = tokenizer.decode(outputs[0], skip_special_tokens=True)
    return {"generated_text": text}
requirements.txt ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
# Web framework and ASGI server
fastapi
uvicorn
# Model runtime
torch
transformers
# Required to load the 4-bit bitsandbytes-quantized checkpoint
# referenced in app.py (unsloth/llama-3-8b-bnb-4bit)
accelerate
bitsandbytes
# NOTE(review): pin exact versions (pkg==x.y.z) for reproducible builds