Spaces:

owiedotch
/

dac

Sleeping

App Files Files Community

owiedotch committed on Aug 25

Commit

0586f5f

•

1 Parent(s): f65c77c

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -3

app.py CHANGED Viewed

@@ -7,6 +7,16 @@ from dac_jax.audio_utils import volume_norm, db2linear
 import io
 import soundfile as sf
 import spaces
 # Load the DAC model with padding set to False for chunking
 model, variables = dac_jax.load_model(model_type="44khz", padding=False)
@@ -23,15 +33,20 @@ def decompress_chunk(c):
 @spaces.GPU
 def encode(audio_file):
     try:
-        # Load a mono audio file directly from BytesIO
-        signal, sample_rate = librosa.load(audio_file, sr=44100, mono=True)
         signal = jnp.array(signal, dtype=jnp.float32)
         while signal.ndim < 3:
             signal = jnp.expand_dims(signal, axis=0)
         # Set chunk duration based on available GPU memory (adjust as needed)
-        win_duration = 5.0  # Start with 5 seconds
         # Compress using chunking
         dac_file = model.compress(compress_chunk, signal, sample_rate, win_duration=win_duration)
@@ -46,6 +61,9 @@ def encode(audio_file):
     except Exception as e:
         gr.Warning(f"An error occurred during encoding: {e}")
         return None
 @spaces.GPU
 def decode(compressed_dac_file):

 import io
 import soundfile as sf
 import spaces
+import tempfile
+import os
+# Try to set up a Colab TPU; if that fails, fall back to GPU or CPU
+try:
+    import jax.tools.colab_tpu
+    jax.tools.colab_tpu.setup_tpu()
+    print("Connected to TPU")
+except:
+    print("No TPU detected, using GPU or CPU.")
 # Load the DAC model with padding set to False for chunking
 model, variables = dac_jax.load_model(model_type="44khz", padding=False)
 @spaces.GPU
 def encode(audio_file):
     try:
+        # Save the uploaded audio to a temporary file
+        with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as temp_audio_file:
+            temp_audio_file.write(audio_file.read())
+            temp_audio_file_path = temp_audio_file.name
+        # Load a mono audio file from the temporary file path
+        signal, sample_rate = librosa.load(temp_audio_file_path, sr=44100, mono=True)
         signal = jnp.array(signal, dtype=jnp.float32)
         while signal.ndim < 3:
             signal = jnp.expand_dims(signal, axis=0)
         # Set chunk duration based on available GPU memory (adjust as needed)
+        win_duration = 5.0
         # Compress using chunking
         dac_file = model.compress(compress_chunk, signal, sample_rate, win_duration=win_duration)
     except Exception as e:
         gr.Warning(f"An error occurred during encoding: {e}")
         return None
+    finally:
+        # Clean up the temporary file
+        os.remove(temp_audio_file_path)
 @spaces.GPU
 def decode(compressed_dac_file):