Spaces:
Runtime error
Runtime error
| import os | |
| from qdrant_client import QdrantClient | |
| # from cerebras.cloud.sdk import Cerebras | |
| qdrant_client = QdrantClient( | |
| url=os.environ.get('QDRANT_URL'), | |
| api_key=os.environ.get('QDRANT_API_KEY'), | |
| ) | |
| print(qdrant_client.get_collections()) | |
| # client = Cerebras( | |
| # # This is the default and can be omitted | |
| # api_key=os.environ.get("CEREBRAS_API_KEY") | |
| # ) | |
| # stream = client.chat.completions.create( | |
| # messages=[ | |
| # { | |
| # "role": "system", | |
| # "content": "" | |
| # } | |
| # ], | |
| # model="gpt-oss-120b", | |
| # stream=True, | |
| # max_completion_tokens=65536, | |
| # temperature=1, | |
| # top_p=1 | |
| # ) | |
| print() | |
| print(os.environ.get('HF_API_KEY')) | |
| print(os.environ.get('TOGETHER_API_KEY')) | |
| print(os.environ.get('QDRANT_URL')) | |
| print(os.environ.get('QDRANT_API_KEY')) | |
| print(os.environ.get('CEREBRAS_API_KEY')) | |
| """ | |
| Debugging FastAPI: | |
| uvicorn app.py:app --reload | |
| MacOS: | |
| export TOGETHER_API_KEY="YOUR_API_KEY" | |
| Windows: | |
| $env:CEREBRAS_API_KEY = "your_key" | |
| $env:QDRANT_URL = "your_url" | |
| $env:QDRANT_API_KEY = "your_key" | |
| """ | |
| """Token Count Test | |
| INPUT_token_count:10616 | |
| OUTPUT_token_count:4808 | |
| AVG_INPUT_token_count:1061.6 | |
| AVG_OUTPUT_token_count:480.8 | |
| TOTAL_TOKEN_COUNT:[1717 1743 1417 1419 1483 1630 1516 1619 1580 1300] | |
| TOKEN_COUNT_PER_GENERATION - :[15424.] | |
| AVG_TOKEN_COUNT_PER_GENERATION:[np.float64(15424.0), 1] | |
| INPUT_token_count:10299.0 | |
| OUTPUT_token_count:5628.0 | |
| AVG_INPUT_token_count:1029.9 | |
| AVG_OUTPUT_token_count:562.8 | |
| TOTAL_TOKEN_COUNT:[1852. 1520. 1615. 1790. 1539. 1562. 1290. 1686. 1460. 1613.] | |
| TOKEN_COUNT_PER_GENERATION - :[15424. 15927.] | |
| AVG_TOKEN_COUNT_PER_GENERATION:[np.float64(15675.5), 2] | |
| INPUT_token_count:9640.0 | |
| OUTPUT_token_count:5576.0 | |
| AVG_INPUT_token_count:964.0 | |
| AVG_OUTPUT_token_count:557.6 | |
| TOTAL_TOKEN_COUNT:[1252. 1835. 1490. 1537. 1394. 1620. 1670. 1707. 1458. 1253.] | |
| TOKEN_COUNT_PER_GENERATION - :[15424. 15927. 15216.] | |
| AVG_TOKEN_COUNT_PER_GENERATION:[np.float64(15522.333333333334), 3] | |
| INPUT_token_count:9356.0 | |
| OUTPUT_token_count:5277.0 | |
| AVG_INPUT_token_count:935.6 | |
| AVG_OUTPUT_token_count:527.7 | |
| TOTAL_TOKEN_COUNT:[1368. 1295. 1849. 1523. 1468. 1473. 1486. 1426. 1595. 1150.] | |
| TOKEN_COUNT_PER_GENERATION - :[15424. 15927. 15216. 14633.] | |
| AVG_TOKEN_COUNT_PER_GENERATION:[np.float64(15300.0), 4] | |
| INPUT_token_count:9828.0 | |
| OUTPUT_token_count:4758.0 | |
| AVG_INPUT_token_count:982.8 | |
| AVG_OUTPUT_token_count:475.8 | |
| TOTAL_TOKEN_COUNT:[1820. 1235. 1911. 1591. 1312. 1242. 1372. 1533. 1393. 1177.] | |
| TOKEN_COUNT_PER_GENERATION - :[15424. 15927. 15216. 14633. 14586.] | |
| AVG_TOKEN_COUNT_PER_GENERATION:[np.float64(15157.2), 5] | |
| """ | |
| import os | |
| from qdrant_client import QdrantClient | |
| qdrant_client = QdrantClient( | |
| url=os.environ.get('QDRANT_URL'), | |
| api_key=os.environ.get('QDRANT_API_KEY'), | |
| ) | |
| print(qdrant_client.get_collections()) | |
| # qdrant_client.recreate_collection( | |
| # collection_name="programming", | |
| # vectors_config={ | |
| # "my_vector_name": models.VectorParams(size=1536, distance=models.Distance.COSINE), | |
| # }, | |
| # ) | |
| print() | |
| print(os.environ.get('HF_API_KEY')) | |
| print(os.environ.get('TOGETHER_API_KEY')) | |
| print(os.environ.get('QDRANT_URL')) | |
| print(os.environ.get('QDRANT_API_KEY')) | |
| print(os.environ.get('CEREBRAS_API_KEY')) | |
| # cerebras API: your_key | |
| """ | |
| Debugging FastAPI: | |
| uvicorn app.py:app --reload | |
| MacOS: | |
| export TOGETHER_API_KEY="YOUR_API_KEY" | |
| Windows: | |
| $env:CEREBRAS_API_KEY = "your_key" | |
| $env:QDRANT_URL = "your_url" | |
| $env:QDRANT_API_KEY = "your_key" | |
| """ | |
| """Token Count Test | |
| INPUT_token_count:10616 | |
| OUTPUT_token_count:4808 | |
| AVG_INPUT_token_count:1061.6 | |
| AVG_OUTPUT_token_count:480.8 | |
| TOTAL_TOKEN_COUNT:[1717 1743 1417 1419 1483 1630 1516 1619 1580 1300] | |
| TOKEN_COUNT_PER_GENERATION - :[15424.] | |
| AVG_TOKEN_COUNT_PER_GENERATION:[np.float64(15424.0), 1] | |
| INPUT_token_count:10299.0 | |
| OUTPUT_token_count:5628.0 | |
| AVG_INPUT_token_count:1029.9 | |
| AVG_OUTPUT_token_count:562.8 | |
| TOTAL_TOKEN_COUNT:[1852. 1520. 1615. 1790. 1539. 1562. 1290. 1686. 1460. 1613.] | |
| TOKEN_COUNT_PER_GENERATION - :[15424. 15927.] | |
| AVG_TOKEN_COUNT_PER_GENERATION:[np.float64(15675.5), 2] | |
| INPUT_token_count:9640.0 | |
| OUTPUT_token_count:5576.0 | |
| AVG_INPUT_token_count:964.0 | |
| AVG_OUTPUT_token_count:557.6 | |
| TOTAL_TOKEN_COUNT:[1252. 1835. 1490. 1537. 1394. 1620. 1670. 1707. 1458. 1253.] | |
| TOKEN_COUNT_PER_GENERATION - :[15424. 15927. 15216.] | |
| AVG_TOKEN_COUNT_PER_GENERATION:[np.float64(15522.333333333334), 3] | |
| INPUT_token_count:9356.0 | |
| OUTPUT_token_count:5277.0 | |
| AVG_INPUT_token_count:935.6 | |
| AVG_OUTPUT_token_count:527.7 | |
| TOTAL_TOKEN_COUNT:[1368. 1295. 1849. 1523. 1468. 1473. 1486. 1426. 1595. 1150.] | |
| TOKEN_COUNT_PER_GENERATION - :[15424. 15927. 15216. 14633.] | |
| AVG_TOKEN_COUNT_PER_GENERATION:[np.float64(15300.0), 4] | |
| INPUT_token_count:9828.0 | |
| OUTPUT_token_count:4758.0 | |
| AVG_INPUT_token_count:982.8 | |
| AVG_OUTPUT_token_count:475.8 | |
| TOTAL_TOKEN_COUNT:[1820. 1235. 1911. 1591. 1312. 1242. 1372. 1533. 1393. 1177.] | |
| TOKEN_COUNT_PER_GENERATION - :[15424. 15927. 15216. 14633. 14586.] | |
| AVG_TOKEN_COUNT_PER_GENERATION:[np.float64(15157.2), 5] | |
| """ | |