File size: 3,937 Bytes
afad319
 
 
 
 
 
 
 
 
 
 
 
192b2d2
afad319
 
 
 
 
 
 
192b2d2
afad319
 
 
192b2d2
afad319
 
 
 
 
 
 
192b2d2
afad319
 
 
192b2d2
afad319
 
 
 
 
 
 
192b2d2
afad319
 
 
192b2d2
afad319
 
 
 
 
 
 
192b2d2
afad319
 
 
 
 
 
 
192b2d2
afad319
 
 
192b2d2
afad319
 
 
 
 
 
 
192b2d2
afad319
 
 
192b2d2
afad319
 
 
 
 
 
 
192b2d2
afad319
 
 
192b2d2
afad319
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
# =============================================================================
# RAG System Dependencies for Hugging Face Spaces Deployment
# =============================================================================
# This file contains all the Python packages required for the RAG system
# to function properly in a Docker container environment.

# =============================================================================
# CORE WEB FRAMEWORK
# =============================================================================

# Streamlit - Modern web framework for data applications
# Provides the interactive web interface for the RAG system
streamlit==1.28.1

# =============================================================================
# DEEP LEARNING & AI FRAMEWORKS
# =============================================================================

# PyTorch - Deep learning framework for model inference
# Required for running the language models (Qwen, distilgpt2)
torch==2.1.0

# Transformers - Hugging Face library for pre-trained models
# Provides access to language models and tokenizers
transformers>=4.36.0

# =============================================================================
# EMBEDDING & VECTOR SEARCH
# =============================================================================

# Sentence Transformers - Library for sentence embeddings
# Used for converting text to vector representations
sentence-transformers==2.2.2

# FAISS CPU - Facebook AI Similarity Search for vector indexing
# Provides efficient similarity search for document retrieval
faiss-cpu==1.7.4

# =============================================================================
# MACHINE LEARNING & DATA PROCESSING
# =============================================================================

# Scikit-learn - Machine learning utilities
# Used for data preprocessing and BM25 implementation
scikit-learn==1.3.2

# Rank BM25 - Implementation of BM25 ranking algorithm
# Provides keyword-based sparse retrieval functionality
rank-bm25==0.2.2

# =============================================================================
# DOCUMENT PROCESSING
# =============================================================================

# PyPDF - Modern PDF processing library
# Used for extracting text and metadata from PDF documents
pypdf==3.17.1

# =============================================================================
# DATA MANIPULATION & ANALYSIS
# =============================================================================

# Pandas - Data manipulation and analysis library
# Used for data structure management and processing
pandas==2.1.3

# NumPy - Numerical computing library
# Provides mathematical operations and array handling
numpy==1.24.3

# =============================================================================
# UTILITIES & LOGGING
# =============================================================================

# Loguru - Advanced logging library
# Provides structured logging with better formatting and features
loguru==0.7.2

# TQDM - Progress bar library
# Shows progress for long-running operations
tqdm==4.66.1

# =============================================================================
# MODEL OPTIMIZATION & DEPLOYMENT
# =============================================================================

# Accelerate - Hugging Face library for model optimization
# Helps with model loading and inference optimization
accelerate==0.24.1

# Hugging Face Hub - Library for accessing Hugging Face models
# Provides utilities for downloading and managing models
huggingface-hub==0.19.4

# =============================================================================
# GUARD RAIL DEPENDENCIES
# =============================================================================

# Additional libraries for enhanced security and validation
# These are optional but recommended for production deployments