Spaces:
Paused
Paused
Update app.py
Browse files
app.py
CHANGED
|
@@ -7,6 +7,7 @@ from typing import List, Dict, Tuple, Any
|
|
| 7 |
from pgvector.psycopg2 import register_vector
|
| 8 |
import numpy as np
|
| 9 |
from datetime import datetime
|
|
|
|
| 10 |
|
| 11 |
# 가중치 및 임계값 설정
|
| 12 |
DEFAULT_FULL_WEIGHT = 0.2
|
|
@@ -65,7 +66,10 @@ def search_similar_chat(query: str, max_results: int = 100) -> List[Dict]:
|
|
| 65 |
|
| 66 |
try:
|
| 67 |
# 쿼리 임베딩 생성
|
| 68 |
-
|
|
|
|
|
|
|
|
|
|
| 69 |
|
| 70 |
# DB 연결
|
| 71 |
conn = get_db_conn()
|
|
@@ -217,7 +221,10 @@ def search_similar_chat_by_date(
|
|
| 217 |
return []
|
| 218 |
|
| 219 |
# 쿼리 임베딩 생성
|
| 220 |
-
|
|
|
|
|
|
|
|
|
|
| 221 |
|
| 222 |
# DB 연결
|
| 223 |
conn = get_db_conn()
|
|
|
|
| 7 |
from pgvector.psycopg2 import register_vector
|
| 8 |
import numpy as np
|
| 9 |
from datetime import datetime
|
| 10 |
+
from sklearn.preprocessing import normalize
|
| 11 |
|
| 12 |
# 가중치 및 임계값 설정
|
| 13 |
DEFAULT_FULL_WEIGHT = 0.2
|
|
|
|
| 66 |
|
| 67 |
try:
|
| 68 |
# 쿼리 임베딩 생성
|
| 69 |
+
raw_embedding = np.array(get_embedding(query))
|
| 70 |
+
# L2 정규화 적용
|
| 71 |
+
query_embedding = normalize(raw_embedding.reshape(1, -1), norm='l2')[0]
|
| 72 |
+
print(f"์๋ฒ ๋ฉ ์ ๊ทํ ์ /ํ ์ฒซ 5๊ฐ ์์: {raw_embedding[:5]} -> {query_embedding[:5]}")
|
| 73 |
|
| 74 |
# DB 연결
|
| 75 |
conn = get_db_conn()
|
|
|
|
| 221 |
return []
|
| 222 |
|
| 223 |
# 쿼리 임베딩 생성
|
| 224 |
+
raw_embedding = np.array(get_embedding(query))
|
| 225 |
+
# L2 정규화 적용
|
| 226 |
+
query_embedding = normalize(raw_embedding.reshape(1, -1), norm='l2')[0]
|
| 227 |
+
print(f"๋ ์ง ๊ฒ์ - ์๋ฒ ๋ฉ ์ ๊ทํ ์ /ํ ์ฒซ 5๊ฐ ์์: {raw_embedding[:5]} -> {query_embedding[:5]}")
|
| 228 |
|
| 229 |
# DB 연결
|
| 230 |
conn = get_db_conn()
|