Spaces:

accelera-ai
/

open_mp_generator

Sleeping

App Files Files Community

mohamedahraf273 committed on Mar 16

Commit

5202b5c

1 Parent(s): 3e4a1d2

add api

Browse files

Files changed (4) hide show

Dockerfile +16 -0
app.py +114 -0
generator.ipynb +17 -2
requirements.txt +12 -0

Dockerfile ADDED Viewed

	@@ -0,0 +1,16 @@

+# Read the doc: https://huggingface.co/docs/hub/spaces-sdks-docker
+# you will also find guides on how best to write your Dockerfile
+FROM python:3.9
+# Create an unprivileged user (uid 1000) with a home directory; every later step runs as that user.
+RUN useradd -m -u 1000 user
+USER user
+# Put the user's ~/.local/bin on PATH; presumably this is where the non-root pip install
+# below places console scripts such as uvicorn.
+ENV PATH="/home/user/.local/bin:$PATH"
+WORKDIR /app
+# Copy requirements.txt on its own first so the dependency-install layer can be reused
+# from cache when only application files change.
+COPY --chown=user ./requirements.txt requirements.txt
+RUN pip install --no-cache-dir --upgrade -r requirements.txt
+# Copy the rest of the build context into /app, owned by the unprivileged user.
+COPY --chown=user . /app
+# Serve the `app` object from the `app` module with uvicorn on all interfaces, port 7860.
+CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]

app.py ADDED Viewed

	@@ -0,0 +1,114 @@

+import sys
+import pathlib
+import os
+import torch
+import re
+from fastapi import FastAPI, HTTPException
+from pydantic import BaseModel
+sys.path.append(str(pathlib.Path(__file__).parent.resolve()))
+from tokenizer import Tokenizer
+from model.generator import Generator
+from model.encoder import Encoder
+from model.decoder import Decoder
+from model.attn import BahdanauAttention
+app = FastAPI()
+BASE_DIR = pathlib.Path(__file__).parent  # directory containing this file
+TOKENIZER_PATH = BASE_DIR / "tokenizer.json"
+CHECKPOINT_PATH = BASE_DIR / "best_model.pth"
+VOCAB_SIZE = 8000  # hyperparameters below presumably must match those used to train the checkpoint -- TODO confirm
+EMBED_SIZE = 128
+HIDDEN_SIZE = 256
+NUM_LAYERS = 3
+DROPOUT = 0.2
+device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')  # use CUDA when available, otherwise CPU
+tokenizer = None  # populated by load_resources() at application startup
+model = None  # populated by load_resources() at application startup
+SOS_IDX = None  # special-token ids below are read from the tokenizer in load_resources()
+EOS_IDX = None
+PAD_IDX = None
+class GenerationRequest(BaseModel):  # request body accepted by POST /generate
+    code_snippet: str  # source text to generate a pragma for
+    cls: str = "parallel" # default; used to build the "[CLS:<cls>] " prefix when the snippet lacks one
+    max_len: int = 100  # upper bound on the number of decoding steps
+@app.on_event("startup")
+def load_resources():
+    global tokenizer, model, SOS_IDX, EOS_IDX, PAD_IDX
+    if not TOKENIZER_PATH.exists():
+        raise FileNotFoundError(f"Tokenizer not found at {TOKENIZER_PATH}")
+    tokenizer = Tokenizer(vocab_size=8000)
+    tokenizer.load(str(TOKENIZER_PATH))
+    SOS_IDX = tokenizer.char2idx['<SOS>']
+    EOS_IDX = tokenizer.char2idx['<EOS>']
+    PAD_IDX = tokenizer.char2idx['<PAD>']
+    actual_vocab_size = tokenizer.vocab_size
+    encoder = Encoder(actual_vocab_size, EMBED_SIZE, HIDDEN_SIZE, NUM_LAYERS, DROPOUT)
+    attention = BahdanauAttention(HIDDEN_SIZE)
+    decoder = Decoder(actual_vocab_size, EMBED_SIZE, HIDDEN_SIZE, attention, NUM_LAYERS, DROPOUT)
+    model = Generator(encoder, decoder, device).to(device)
+    if not CHECKPOINT_PATH.exists():
+        print("WARNING: Checkpoint not found. Model will be random!")
+        return
+    checkpoint = torch.load(str(CHECKPOINT_PATH), map_location=device)
+    model.load_state_dict(checkpoint['model_state_dict'])
+    model.eval()
+def greedy_generate(code_snippet: str, cls: str, max_len: int) -> str:
+    if model is None or tokenizer is None:
+        raise HTTPException(status_code=503, detail="Model not loaded")
+    model.eval()
+    text = code_snippet if code_snippet.startswith("[CLS:") else f"[CLS:{cls}] {code_snippet}"
+    input_ids = tokenizer.encode(text, max_length=1500, add_special_tokens=True)
+    input_len = next((i for i, tok in enumerate(input_ids) if tok == PAD_IDX), len(input_ids))
+    input_tensor = torch.tensor([input_ids], device=device)
+    input_len_tensor = torch.tensor([input_len], device=device)
+    with torch.no_grad():
+        enc_outs, hidden, cell = model.encoder(input_tensor, input_len_tensor)
+        mask = (torch.arange(enc_outs.size(1), device=device).unsqueeze(0) < input_len_tensor.unsqueeze(1)).float()
+        hidden = hidden.view(model.encoder.num_layers, 2, 1, model.encoder.hidden_size)
+        hidden = torch.cat((hidden[:, 0], hidden[:, 1]), dim=2)
+        hidden = model.hidden_projection(hidden)
+        cell = cell.view(model.encoder.num_layers, 2, 1, model.encoder.hidden_size)
+        cell = torch.cat((cell[:, 0], cell[:, 1]), dim=2)
+        cell = model.cell_projection(cell)
+        input_token = torch.tensor([SOS_IDX], device=device)
+        generated = []
+        for _ in range(max_len):
+            output, hidden, cell, _ = model.decoder(input_token, hidden, cell, enc_outs, mask)
+            top1 = output.argmax(1)
+            token_id = top1.item()
+            if token_id == EOS_IDX:
+                break
+            generated.append(token_id)
+            input_token = top1
+    return tokenizer.decode(generated)
+@app.post("/generate")
+def generate_code_snippet(request: GenerationRequest):
+    try:
+        if not request.code_snippet.strip():
+             return {"pragma": ""}
+        cleaned_code = request.code_snippet.strip()
+        result = greedy_generate(cleaned_code, request.cls, request.max_len)
+        return {"pragma": result}
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))

generator.ipynb CHANGED Viewed

@@ -309,10 +309,25 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
    "id": "6d9a8e25",
    "metadata": {},
-   "outputs": [],
    "source": [
     "\n",
     "import sys\n",

   },
   {
    "cell_type": "code",
+   "execution_count": 18,
    "id": "6d9a8e25",
    "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Loaded checkpoint from best_model.pth (epoch 8)\n",
+      "Sample input (truncated): [CLS:reduction] for (i = 0; i < 1000; ++i)\n",
+      "{\n",
+      "  logic_and = logic_and && logics[i];\n",
+      "}\n",
+      "\n",
+      "Reference pragma: omp parallel for schedule(dynamic,1) private(i) reduction(&&:logic_and)\n",
+      "Greedy prediction: omp parallel for schedule(dynamic,1) private(i) reduction(&&:logic_and)\n"
+     ]
+    }
+   ],
    "source": [
     "\n",
     "import sys\n",

requirements.txt ADDED Viewed

	@@ -0,0 +1,12 @@

+# Core Python Utilities
+setuptools
+regex
+packaging
+build
+dm-tree
+scikit-learn
+pandas
+numpy
+torch
+fastapi
+uvicorn[standard]