hmm183 committed on
Commit
71469fb
·
verified ·
1 Parent(s): 4028fbb

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -3
app.py CHANGED
@@ -1,13 +1,16 @@
 
 
 
 
1
  from flask import Flask, request, jsonify
2
  from flask_cors import CORS
3
- import os
4
  # No requests import needed for Ollama connection check if not using Ollama
5
 
6
  # Import Hugging Face Transformers
7
  from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
8
- import torch # For checking GPU availability
9
 
10
- from langchain_community.embeddings import HuggingFaceEmbeddings # Using HF Embeddings now
11
  from langchain_community.vectorstores import Chroma
12
  from langchain_core.documents import Document
13
  from langchain_core.prompts import ChatPromptTemplate
@@ -18,6 +21,7 @@ from langchain_text_splitters import RecursiveCharacterTextSplitter
18
  app = Flask(__name__)
19
  CORS(app)
20
 
 
21
  # --- Model Configuration for Hugging Face Transformers ---
22
  # CHOOSE A SMALLER MODEL! Gemma 4B is too large for free tier usually.
23
  # 'google/gemma-2b-it' is a good conversational starting point.
 
1
+ import os # Import os at the top
2
+ # Set a writable cache directory for transformers
3
+ os.environ["TRANSFORMERS_CACHE"] = "/tmp/huggingface"
4
+
5
  from flask import Flask, request, jsonify
6
  from flask_cors import CORS
 
7
  # No requests import needed for Ollama connection check if not using Ollama
8
 
9
  # Import Hugging Face Transformers
10
  from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
11
+ import torch
12
 
13
+ from langchain_community.embeddings import HuggingFaceEmbeddings
14
  from langchain_community.vectorstores import Chroma
15
  from langchain_core.documents import Document
16
  from langchain_core.prompts import ChatPromptTemplate
 
21
  app = Flask(__name__)
22
  CORS(app)
23
 
24
+ # ... (rest of your app.py code) ...
25
  # --- Model Configuration for Hugging Face Transformers ---
26
  # CHOOSE A SMALLER MODEL! Gemma 4B is too large for free tier usually.
27
  # 'google/gemma-2b-it' is a good conversational starting point.