Update app.py
Browse files
app.py
CHANGED
|
@@ -1,13 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
from flask import Flask, request, jsonify
|
| 2 |
from flask_cors import CORS
|
| 3 |
-
import os
|
| 4 |
# No requests import needed for Ollama connection check if not using Ollama
|
| 5 |
|
| 6 |
# Import Hugging Face Transformers
|
| 7 |
from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
|
| 8 |
-
import torch
|
| 9 |
|
| 10 |
-
from langchain_community.embeddings import HuggingFaceEmbeddings
|
| 11 |
from langchain_community.vectorstores import Chroma
|
| 12 |
from langchain_core.documents import Document
|
| 13 |
from langchain_core.prompts import ChatPromptTemplate
|
|
@@ -18,6 +21,7 @@ from langchain_text_splitters import RecursiveCharacterTextSplitter
|
|
| 18 |
app = Flask(__name__)
|
| 19 |
CORS(app)
|
| 20 |
|
|
|
|
| 21 |
# --- Model Configuration for Hugging Face Transformers ---
|
| 22 |
# CHOOSE A SMALLER MODEL! Gemma 4B is usually too large for the free tier.
|
| 23 |
# 'google/gemma-2b-it' is a good conversational starting point.
|
|
|
|
| 1 |
+
import os # Import os at the top
|
| 2 |
+
# Point the Transformers cache at a writable directory; set this before importing transformers so the setting takes effect
|
| 3 |
+
os.environ["TRANSFORMERS_CACHE"] = "/tmp/huggingface"
|
| 4 |
+
|
| 5 |
from flask import Flask, request, jsonify
|
| 6 |
from flask_cors import CORS
|
|
|
|
| 7 |
# No requests import needed for Ollama connection check if not using Ollama
|
| 8 |
|
| 9 |
# Import Hugging Face Transformers
|
| 10 |
from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
|
| 11 |
+
import torch
|
| 12 |
|
| 13 |
+
from langchain_community.embeddings import HuggingFaceEmbeddings
|
| 14 |
from langchain_community.vectorstores import Chroma
|
| 15 |
from langchain_core.documents import Document
|
| 16 |
from langchain_core.prompts import ChatPromptTemplate
|
|
|
|
| 21 |
app = Flask(__name__)
|
| 22 |
CORS(app)
|
| 23 |
|
| 24 |
+
# ... (rest of your app.py code) ...
|
| 25 |
# --- Model Configuration for Hugging Face Transformers ---
|
| 26 |
# CHOOSE A SMALLER MODEL! Gemma 4B is usually too large for the free tier.
|
| 27 |
# 'google/gemma-2b-it' is a good conversational starting point.
|