HealthVoiceAnalyzeroneline

Sleeping

App Files Files

xet

Community

geethareddy committed on Jun 24

Commit

9bb4c44

verified ·

1 Parent(s): b694114

Update app.py

Browse files

Files changed (1) hide show

app.py +32 -28

app.py CHANGED Viewed

@@ -26,11 +26,11 @@ def load_whisper_model():
     try:
         model = pipeline(
             "automatic-speech-recognition",
-            model="openai/whisper-tiny.en",
             device=-1,  # CPU; use device=0 for GPU if available
             model_kwargs={"use_safetensors": True}
         )
-        logger.info("Whisper model loaded successfully")
         return model
     except Exception as e:
         logger.error(f"Failed to load Whisper model: {str(e)}")
@@ -52,10 +52,10 @@ def load_symptom_model():
         try:
             model = pipeline(
                 "text-classification",
-                model="distilbert-base-uncased",
                 device=-1
             )
-            logger.warning("Fallback to distilbert-base-uncased model")
             return model
         except Exception as fallback_e:
             logger.error(f"Fallback model failed: {str(fallback_e)}")
@@ -188,8 +188,11 @@ def analyze_voice(audio_file):
         temp_dir = os.path.join(tempfile.gettempdir(), "gradio")
         if not ensure_writable_dir(temp_dir):
-            logger.error(f"Temp directory {temp_dir} not writable")
-            return f"Error: Temp directory {temp_dir} not writable"
         if not os.path.exists(audio_file):
             logger.error(f"Audio file not found: {audio_file}")
@@ -200,12 +203,12 @@ def analyze_voice(audio_file):
             f"audio_{datetime.utcnow().strftime('%Y%m%d%H%M%S%f')}_{os.path.basename(audio_file)}"
         )
         try:
-            shutil.move(audio_file, unique_path)
             audio_file = unique_path
-            logger.debug(f"Moved to: {audio_file}")
         except Exception as e:
-            logger.error(f"Failed to move audio file: {str(e)}")
-            return f"Error: Failed to move audio file: {str(e)}"
         file_hash = compute_file_hash(audio_file)
         logger.info(f"Processing audio, Hash: {file_hash}")
@@ -249,25 +252,26 @@ def test_with_sample_audio():
     """Test with sample or synthetic audio."""
     temp_dir = os.path.join(tempfile.gettempdir(), "audio_samples")
     if not ensure_writable_dir(temp_dir):
-        logger.error(f"Temp directory {temp_dir} not writable")
-        return f"Error: Temp directory {temp_dir} not writable"
-    sample_audio_path = os.path.join(temp_dir, "sample.wav")
-    if not os.path.exists(sample_audio_path):
-        logger.warning("Sample audio not found; generating synthetic audio")
-        sr = 16000
-        t = np.linspace(0, 2, 2 * sr)
-        freq_mod = 440 + 10 * np.sin(2 * np.pi * 0.5 * t)
-        amplitude_mod = 0.5 + 0.1 * np.sin(2 * np.pi * 0.3 * t)
-        noise = 0.01 * np.random.normal(0, 1, len(t))
-        dummy_audio = amplitude_mod * np.sin(2 * np.pi * freq_mod * t) + noise
-        sample_audio_path = os.path.join(temp_dir, "dummy_test.wav")
-        try:
-            soundfile.write(dummy_audio, sr, sample_audio_path)
-            logger.info(f"Generated synthetic audio: {sample_audio_path}")
-        except Exception as e:
-            logger.error(f"Failed to write synthetic audio: {str(e)}")
-            return f"Error: Failed to generate synthetic audio: {str(e)}"
     if not os.path.exists(sample_audio_path):
         logger.error(f"Synthetic audio not created: {sample_audio_path}")

     try:
         model = pipeline(
             "automatic-speech-recognition",
+            model="openai/whisper-small.en",
             device=-1,  # CPU; use device=0 for GPU if available
             model_kwargs={"use_safetensors": True}
         )
+        logger.info("Whisper-small.en model loaded successfully")
         return model
     except Exception as e:
         logger.error(f"Failed to load Whisper model: {str(e)}")
         try:
             model = pipeline(
                 "text-classification",
+                model="allenai/scibert_scivocab_uncased",
                 device=-1
             )
+            logger.warning("Fallback to allenai/scibert_scivocab_uncased model")
             return model
         except Exception as fallback_e:
             logger.error(f"Fallback model failed: {str(fallback_e)}")
         temp_dir = os.path.join(tempfile.gettempdir(), "gradio")
         if not ensure_writable_dir(temp_dir):
+            fallback_dir = os.path.join(os.getcwd(), "temp_gradio")
+            if not ensure_writable_dir(fallback_dir):
+                logger.error(f"Both temp directories {temp_dir} and {fallback_dir} not writable")
+                return f"Error: Temp directories not writable"
+            temp_dir = fallback_dir
         if not os.path.exists(audio_file):
             logger.error(f"Audio file not found: {audio_file}")
             f"audio_{datetime.utcnow().strftime('%Y%m%d%H%M%S%f')}_{os.path.basename(audio_file)}"
         )
         try:
+            shutil.copy(audio_file, unique_path)
             audio_file = unique_path
+            logger.debug(f"Copied to: {audio_file}")
         except Exception as e:
+            logger.error(f"Failed to copy audio file: {str(e)}")
+            return f"Error: Failed to copy audio file: {str(e)}"
         file_hash = compute_file_hash(audio_file)
         logger.info(f"Processing audio, Hash: {file_hash}")
     """Test with sample or synthetic audio."""
     temp_dir = os.path.join(tempfile.gettempdir(), "audio_samples")
     if not ensure_writable_dir(temp_dir):
+        fallback_dir = os.path.join(os.getcwd(), "temp_audio_samples")
+        if not ensure_writable_dir(fallback_dir):
+            logger.error(f"Both temp directories {temp_dir} and {fallback_dir} not writable")
+            return f"Error: Temp directories not writable"
+        temp_dir = fallback_dir
+    sample_audio_path = os.path.join(temp_dir, "dummy_test.wav")
+    logger.info(f"Generating synthetic audio at: {sample_audio_path}")
+    sr = 16000
+    t = np.linspace(0, 2, 2 * sr)
+    freq_mod = 440 + 10 * np.sin(2 * np.pi * 0.5 * t)
+    amplitude_mod = 0.5 + 0.1 * np.sin(2 * np.pi * 0.3 * t)
+    noise = 0.01 * np.random.normal(0, 1, len(t))
+    dummy_audio = amplitude_mod * np.sin(2 * np.pi * freq_mod * t) + noise
+    try:
+        soundfile.write(dummy_audio, sr, sample_audio_path)
+        logger.info(f"Generated synthetic audio: {sample_audio_path}")
+    except Exception as e:
+        logger.error(f"Failed to write synthetic audio: {str(e)}")
+        return f"Error: Failed to generate synthetic audio: {str(e)}"
     if not os.path.exists(sample_audio_path):
         logger.error(f"Synthetic audio not created: {sample_audio_path}")