snac_test2

Sleeping

App Files Community

Gapeleon committed on Apr 5

Commit

ff11e39

verified ·

1 Parent(s): d54f19d

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -9

app.py CHANGED Viewed

@@ -17,7 +17,7 @@ except ImportError as e:
     raise ImportError("Could not import SNAC. Make sure 'snac' is listed in requirements.txt and installed correctly.") from e
 # --- Configuration ---
-TARGET_SR = 24000 # SNAC operates at 24kHz
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
 print(f"Using device: {DEVICE}")
@@ -26,7 +26,7 @@ snac_model = None
 try:
     print("Loading SNAC model...")
     start_time = time.time()
-    snac_model = SNAC.from_pretrained("hubertsiuzdak/snac_24khz")
     snac_model = snac_model.to(DEVICE)
     snac_model.eval() # Set model to evaluation mode
     end_time = time.time()
@@ -80,7 +80,7 @@ def process_audio(audio_filepath):
             waveform_to_encode = resampler(original_waveform)
             logs.append(f"Resampling complete. New Shape: {waveform_to_encode.shape}")
         else:
-            logs.append("Waveform is already at the target sample rate (24kHz).")
             waveform_to_encode = original_waveform
         resample_end = time.time()
         logs.append(f"Resampling time: {resample_end - resample_start:.2f}s")
@@ -141,12 +141,12 @@ def process_audio(audio_filepath):
 # --- Gradio Interface ---
 DESCRIPTION = """
-This Space demonstrates the **SNAC (Scalable Neural Audio Codec)** model (`hubertsiuzdak/snac_24khz`).
 1. Upload an audio file (wav, mp3, flac, etc.).
-2. The audio will be automatically resampled to 24kHz if needed.
-3. The 24kHz audio is encoded into discrete codes by SNAC.
 4. These codes are then decoded back into audio by SNAC.
-5. You can listen to the original, the 24kHz version (if resampled), and the final reconstructed audio.
 **Note:** Processing happens on the server. Larger files will take longer. If the input is stereo, only the first channel is processed.
 """
@@ -156,11 +156,11 @@ iface = gr.Interface(
     inputs=gr.Audio(type="filepath", label="Upload Audio File"),
     outputs=[
         gr.Audio(label="Original Audio"),
-        gr.Audio(label="Resampled Audio (24kHz Input to SNAC)"),
         gr.Audio(label="Reconstructed Audio (Output from SNAC)"),
         gr.Textbox(label="Log Output", lines=15)
     ],
-    title="SNAC Audio Codec Demo (24kHz)",
     description=DESCRIPTION,
     examples=[
         # Add paths to example audio files if you upload some to your Space repo

     raise ImportError("Could not import SNAC. Make sure 'snac' is listed in requirements.txt and installed correctly.") from e
 # --- Configuration ---
+TARGET_SR = 32000 # SNAC operates at 32kHz
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
 print(f"Using device: {DEVICE}")
 try:
     print("Loading SNAC model...")
     start_time = time.time()
+    snac_model = SNAC.from_pretrained("hubertsiuzdak/snac_32khz")
     snac_model = snac_model.to(DEVICE)
     snac_model.eval() # Set model to evaluation mode
     end_time = time.time()
             waveform_to_encode = resampler(original_waveform)
             logs.append(f"Resampling complete. New Shape: {waveform_to_encode.shape}")
         else:
+            logs.append("Waveform is already at the target sample rate (32kHz).")
             waveform_to_encode = original_waveform
         resample_end = time.time()
         logs.append(f"Resampling time: {resample_end - resample_start:.2f}s")
 # --- Gradio Interface ---
 DESCRIPTION = """
+This Space demonstrates the **SNAC (Scalable Neural Audio Codec)** model (`hubertsiuzdak/snac_32khz`).
 1. Upload an audio file (wav, mp3, flac, etc.).
+2. The audio will be automatically resampled to 32kHz if needed.
+3. The 32kHz audio is encoded into discrete codes by SNAC.
 4. These codes are then decoded back into audio by SNAC.
+5. You can listen to the original, the 32kHz version (if resampled), and the final reconstructed audio.
 **Note:** Processing happens on the server. Larger files will take longer. If the input is stereo, only the first channel is processed.
 """
     inputs=gr.Audio(type="filepath", label="Upload Audio File"),
     outputs=[
         gr.Audio(label="Original Audio"),
+        gr.Audio(label="Resampled Audio (32kHz Input to SNAC)"),
         gr.Audio(label="Reconstructed Audio (Output from SNAC)"),
         gr.Textbox(label="Log Output", lines=15)
     ],
+    title="SNAC Audio Codec Demo (32kHz)",
     description=DESCRIPTION,
     examples=[
         # Add paths to example audio files if you upload some to your Space repo