vetsin committed on
Commit
86c2562
·
1 Parent(s): b087b2f

fix: works

Browse files
Files changed (3) hide show
  1. .gitignore +1 -0
  2. S5065-MSK.wav +3 -0
  3. app.py +5 -12
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ .gradio
S5065-MSK.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30569be92c11907721469fa876588f196bd3e557d9031706d66b56a6c2da6101
3
+ size 1817772
app.py CHANGED
@@ -1,33 +1,26 @@
1
- # !pip install gradio transformers torch torchaudio librosa soundfile datasets accelerate
2
  import gradio as gr
3
  import json
4
  from transformers import pipeline
5
  import warnings
6
-
7
 
8
  warnings.filterwarnings("ignore")
9
- audio_classifier = pipeline("audio-classification", model="ATDI-Group/AST_finetuned_SIGIDwiki")
 
 
10
 
11
- # 4. DEFINE THE CORE ANALYSIS FUNCTION
12
  def analyze_signal(audio_path):
13
- """
14
- Takes an audio file path and returns a holistic analysis dictionary.
15
- """
16
  if audio_path is None:
17
  return {"Error": "No audio file provided. Please upload a file."}
18
 
19
  print(f"Analysing audio file: {audio_path}...")
20
  try:
21
  acoustic_results = audio_classifier(audio_path, top_k=3)
22
- print(repr(acoustic_results))
23
  detected_sounds = {item['label']: round(item['score'], 2) for item in acoustic_results}
24
 
25
- # Fuse the results
26
  holistic_understanding = {
27
  "Detected Sounds": detected_sounds,
28
- #"Insight": f"The model detected speech saying '{transcription}' in an environment with sounds like: {', '.join(detected_sounds.keys())}."
29
  }
30
-
31
  return holistic_understanding
32
  except Exception as e:
33
  return {"Error": f"Could not process the audio file. Details: {str(e)}"}
@@ -40,7 +33,7 @@ iface = gr.Interface(
40
  description="""
41
  https://huggingface.co/ATDI-Group/AST_finetuned_SIGIDwiki
42
  """,
43
- examples=[["example.wav"]]
44
  )
45
 
46
  # This will create the web UI
 
 
# Third-party dependencies.
import warnings

import gradio as gr
import json
from transformers import ASTFeatureExtractor, ASTForAudioClassification, pipeline

# Keep the hosted demo's logs readable.
warnings.filterwarnings("ignore")

# The fine-tuned AST checkpoint lives in a subfolder of this Hub repository,
# so both the model and its feature extractor must be loaded explicitly
# before handing them to the pipeline.
_REPO_ID = "ATDI-Group/AST_finetuned_SIGIDwiki"
_SUBFOLDER = "AST_finetuned_SIGIDwiki"

model = ASTForAudioClassification.from_pretrained(_REPO_ID, subfolder=_SUBFOLDER)
feature_extractor = ASTFeatureExtractor.from_pretrained(_REPO_ID, subfolder=_SUBFOLDER)

# Module-level pipeline, built once and reused by every request.
audio_classifier = pipeline("audio-classification", model=model, feature_extractor=feature_extractor)
 
 
12
def analyze_signal(audio_path):
    """Classify an uploaded audio clip and report the top detected signal types.

    Parameters
    ----------
    audio_path : str | None
        Filesystem path handed over by Gradio, or ``None`` when the user
        submitted without uploading a file.

    Returns
    -------
    dict
        ``{"Detected Sounds": {label: score, ...}}`` on success, otherwise
        ``{"Error": <message>}`` (missing file or any classification failure).
    """
    # Guard clause: Gradio passes None for an empty submission.
    if audio_path is None:
        return {"Error": "No audio file provided. Please upload a file."}

    print(f"Analysing audio file: {audio_path}...")
    try:
        # Top-3 predictions from the module-level audio-classification pipeline.
        top_predictions = audio_classifier(audio_path, top_k=3)
        scores_by_label = {}
        for entry in top_predictions:
            scores_by_label[entry['label']] = round(entry['score'], 2)
        return {"Detected Sounds": scores_by_label}
    except Exception as e:
        # Surface any failure (unreadable file, bad codec, ...) in the UI
        # instead of crashing the demo.
        return {"Error": f"Could not process the audio file. Details: {str(e)}"}
 
33
  description="""
34
  https://huggingface.co/ATDI-Group/AST_finetuned_SIGIDwiki
35
  """,
36
+ examples=[["S5065-MSK.wav"]]
37
  )
38
 
39
  # This will create the web UI