Spaces:

owiedotch
/

dac

Sleeping

App Files Files Community

owiedotch committed on Aug 26

Commit

bd40662

•

1 Parent(s): a2cc897

Update app.py

Browse files

Files changed (1) hide show

app.py +20 -3

app.py CHANGED Viewed

@@ -9,6 +9,10 @@ import soundfile as sf
 import spaces
 import tempfile
 import os
 # Check for CUDA availability and set device
 try:
@@ -32,6 +36,7 @@ def decompress_chunk(c):
 @spaces.GPU
 def encode(audio_file_path):
     try:
         # Load a mono audio file directly from the file path
         signal, sample_rate = librosa.load(audio_file_path, sr=44100, mono=True)
@@ -41,16 +46,20 @@ def encode(audio_file_path):
             signal = jnp.expand_dims(signal, axis=0)
         # Set chunk duration based on available GPU memory (adjust as needed)
-        win_duration = 5.0
         # Compress using chunking
         dac_file = model.compress(compress_chunk, signal, sample_rate, win_duration=win_duration)
         # Save the compressed DAC file to a temporary file
         with tempfile.NamedTemporaryFile(delete=False, suffix=".dac") as temp_file:
             dac_file.save(temp_file.name)
-        return temp_file.name
     except Exception as e:
         gr.Warning(f"An error occurred during encoding: {e}")
@@ -66,7 +75,7 @@ def decode(compressed_dac_file):
         y = model.decompress(decompress_chunk, dac_file)
         # Convert to numpy array and squeeze to remove extra dimensions
-        decoded_audio = jnp.array(y).squeeze()
         return (44100, decoded_audio)  # Return sample rate and audio data
@@ -74,6 +83,13 @@ def decode(compressed_dac_file):
         gr.Warning(f"An error occurred during decoding: {e}")
         return None
 # Gradio interface
 with gr.Blocks() as demo:
     gr.Markdown("<h1 style='text-align: center;'>Audio Compression with DAC-JAX</h1>")
@@ -86,6 +102,7 @@ with gr.Blocks() as demo:
             encoded_output = gr.File(label="Compressed Audio (.dac)")
         encode_button.click(encode, inputs=audio_input, outputs=encoded_output)
     with gr.Tab("Decode"):
         with gr.Row():

 import spaces
 import tempfile
 import os
+import numpy as np
+# Global variable to store the temporary file path
+temp_file_path = None
 # Check for CUDA availability and set device
 try:
 @spaces.GPU
 def encode(audio_file_path):
+    global temp_file_path
     try:
         # Load a mono audio file directly from the file path
         signal, sample_rate = librosa.load(audio_file_path, sr=44100, mono=True)
             signal = jnp.expand_dims(signal, axis=0)
         # Set chunk duration based on available GPU memory (adjust as needed)
+        win_duration = 10.0
         # Compress using chunking
         dac_file = model.compress(compress_chunk, signal, sample_rate, win_duration=win_duration)
         # Save the compressed DAC file to a temporary file
+        if temp_file_path:
+            os.remove(temp_file_path)  # Remove the previous temporary file if it exists
         with tempfile.NamedTemporaryFile(delete=False, suffix=".dac") as temp_file:
             dac_file.save(temp_file.name)
+            temp_file_path = temp_file.name
+        return temp_file_path
     except Exception as e:
         gr.Warning(f"An error occurred during encoding: {e}")
         y = model.decompress(decompress_chunk, dac_file)
         # Convert to numpy array and squeeze to remove extra dimensions
+        decoded_audio = np.array(y).squeeze()
         return (44100, decoded_audio)  # Return sample rate and audio data
         gr.Warning(f"An error occurred during decoding: {e}")
         return None
+def cleanup(audio_file_path):
+    """Delete the temporary file tracked by the global ``temp_file_path``.
+
+    Args:
+        audio_file_path: Accepted as an argument but not read by this function.
+
+    Returns:
+        Always ``None``.
+    """
+    global temp_file_path
+    # Only attempt removal when a path is recorded and the file still exists.
+    if temp_file_path and os.path.exists(temp_file_path):
+        os.remove(temp_file_path)
+        # Forget the path so the same file is not removed a second time.
+        # NOTE(review): this reset happens only inside the `if`; when a path is
+        # recorded but the file is already gone, the stale path stays set, and
+        # encode() calls os.remove on it without an existence check - confirm
+        # whether that is intended.
+        temp_file_path = None
+    return None
 # Gradio interface
 with gr.Blocks() as demo:
     gr.Markdown("<h1 style='text-align: center;'>Audio Compression with DAC-JAX</h1>")
             encoded_output = gr.File(label="Compressed Audio (.dac)")
         encode_button.click(encode, inputs=audio_input, outputs=encoded_output)
+        encoded_output.change(cleanup, inputs=[audio_input], outputs=None)
     with gr.Tab("Decode"):
         with gr.Row():