parthnuwal7 committed on
Commit
95fbfc5
·
1 Parent(s): 5b0f561

ATEPC fixes

Browse files
Files changed (2) hide show
  1. Dockerfile +2 -2
  2. src/utils/data_processor.py +9 -14
Dockerfile CHANGED
@@ -17,8 +17,8 @@ COPY . .
17
  # Install Python dependencies
18
  RUN pip install --no-cache-dir -r requirements.txt
19
 
20
- # Pre-download PyABSA checkpoint during build to avoid runtime git issues
21
- RUN python -c "import pyabsa; from pyabsa import ATEPCCheckpointManager; ATEPCCheckpointManager.get_checkpoint('multilingual')" || echo "PyABSA checkpoint download failed, will retry at runtime"
22
 
23
  # Expose port
24
  EXPOSE 7860
 
17
  # Install Python dependencies
18
  RUN pip install --no-cache-dir -r requirements.txt
19
 
20
+ # Pre-download PyABSA checkpoint during build (using correct v2.4.2 API)
21
+ RUN python -c "from pyabsa import available_checkpoints; print('Available checkpoints:', available_checkpoints()); from pyabsa import checkpoint_utils; checkpoint_utils.download_all_available_checkpoints()" || echo "PyABSA checkpoint download skipped, will download at runtime"
22
 
23
  # Expose port
24
  EXPOSE 7860
src/utils/data_processor.py CHANGED
@@ -215,7 +215,6 @@ class ABSAProcessor:
215
  warnings.filterwarnings('ignore', category=DeprecationWarning)
216
 
217
  import pyabsa
218
- from pyabsa import ATEPCCheckpointManager
219
 
220
  # Check if git is available
221
  try:
@@ -228,20 +227,16 @@ class ABSAProcessor:
228
  except Exception as git_err:
229
  logger.warning(f"Git not found or not executable: {str(git_err)}")
230
 
231
- # Try local checkpoint first (if exists in checkpoints/ directory)
232
- local_checkpoint = os.path.join(os.path.dirname(__file__), '..', '..', 'checkpoints', 'ATEPC_MULTILINGUAL_CHECKPOINT')
 
 
233
 
234
- if os.path.exists(local_checkpoint):
235
- logger.info(f"Loading PyABSA from local checkpoint: {local_checkpoint}")
236
- self.model = pyabsa.load_aspect_extractor(checkpoint=local_checkpoint)
237
- logger.info("✅ PyABSA model loaded successfully from local checkpoint")
238
- else:
239
- # Fallback to downloading checkpoint (requires git)
240
- logger.info("Local checkpoint not found, downloading multilingual checkpoint...")
241
- logger.info("This may take a few minutes on first run...")
242
- checkpoint = ATEPCCheckpointManager.get_checkpoint('multilingual')
243
- self.model = pyabsa.load_aspect_extractor(checkpoint=checkpoint)
244
- logger.info("✅ PyABSA model loaded successfully from downloaded checkpoint")
245
 
246
  except Exception as e:
247
  import traceback
 
215
  warnings.filterwarnings('ignore', category=DeprecationWarning)
216
 
217
  import pyabsa
 
218
 
219
  # Check if git is available
220
  try:
 
227
  except Exception as git_err:
228
  logger.warning(f"Git not found or not executable: {str(git_err)}")
229
 
230
+ # Try to load aspect extractor with multilingual checkpoint
231
+ # PyABSA v2.4.2 handles checkpoint downloading automatically
232
+ logger.info("Loading PyABSA multilingual model...")
233
+ logger.info("This may take a few minutes on first run (downloading checkpoint)...")
234
 
235
+ self.model = pyabsa.load_aspect_extractor(
236
+ checkpoint='multilingual',
237
+ auto_device=True # Let PyABSA choose device (CPU in this case)
238
+ )
239
+ logger.info("✅ PyABSA model loaded successfully")
 
 
 
 
 
 
240
 
241
  except Exception as e:
242
  import traceback