Spaces:

Politrees
/

Steganography

Running

App Files Files Community

Politrees commited on Oct 4, 2024

Commit

5145c3f

verified ·

1 Parent(s): d0a2403

Update steganography.py

Browse files

Files changed (1) hide show

steganography.py +34 -71

steganography.py CHANGED Viewed

@@ -5,23 +5,24 @@ import librosa
 import librosa.display
 import gradio as gr
 import soundfile as sf
-import os
 # Function for creating a spectrogram image with text
 def text_to_spectrogram_image(text, base_width=512, height=256, max_font_size=80, margin=10, letter_spacing=5):
-    font_path = "/usr/share/fonts/truetype/dejavu/DejaVuSans-Bold.ttf"
-    if os.path.exists(font_path):
-        font = ImageFont.truetype(font_path, max_font_size)
-    else:
         font = ImageFont.load_default()
     image = Image.new('L', (base_width, height), 'black')
     draw = ImageDraw.Draw(image)
-    text_width = 0
-    for char in text:
-        text_bbox = draw.textbbox((0, 0), char, font=font)
-        text_width += text_bbox[2] - text_bbox[0] + letter_spacing
-    text_width -= letter_spacing
     if text_width + margin * 2 > base_width:
         width = text_width + margin * 2
@@ -30,20 +31,21 @@ def text_to_spectrogram_image(text, base_width=512, height=256, max_font_size=80
     image = Image.new('L', (width, height), 'black')
     draw = ImageDraw.Draw(image)
     text_x = (width - text_width) // 2
-    text_y = (height - (text_bbox[3] - text_bbox[1])) // 2
     for char in text:
         draw.text((text_x, text_y), char, font=font, fill='white')
         char_bbox = draw.textbbox((0, 0), char, font=font)
         text_x += char_bbox[2] - char_bbox[0] + letter_spacing
     image = np.array(image)
     image = np.where(image > 0, 255, image)
     return image
 # Converting an image to audio
-def spectrogram_image_to_audio(image, sr=22050):
     flipped_image = np.flipud(image)
     S = flipped_image.astype(np.float32) / 255.0 * 100.0
     y = librosa.griffinlim(S)
@@ -54,19 +56,21 @@ def create_audio_with_spectrogram(text, base_width, height, max_font_size, margi
     spec_image = text_to_spectrogram_image(text, base_width, height, max_font_size, margin, letter_spacing)
     y = spectrogram_image_to_audio(spec_image)
     audio_path = 'output.wav'
-    sf.write(audio_path, y, 22050)
     image_path = 'spectrogram.png'
     plt.imsave(image_path, spec_image, cmap='gray')
     return audio_path, image_path
 # Function for displaying the spectrogram of an audio file
 def display_audio_spectrogram(audio_path):
-    y, sr = librosa.load(audio_path)
     S = librosa.feature.melspectrogram(y=y, sr=sr)
     S_dB = librosa.power_to_db(S, ref=np.max)
     plt.figure(figsize=(10, 4))
-    librosa.display.specshow(S_dB)
     plt.tight_layout()
     spectrogram_path = 'uploaded_spectrogram.png'
@@ -75,7 +79,7 @@ def display_audio_spectrogram(audio_path):
     return spectrogram_path
 # Converting a downloaded image to an audio spectrogram
-def image_to_spectrogram_audio(image_path, sr=22050):
     image = Image.open(image_path).convert('L')
     image = np.array(image)
     y = spectrogram_image_to_audio(image, sr)
@@ -84,36 +88,8 @@ def image_to_spectrogram_audio(image_path, sr=22050):
     return img2audio_path
 # Gradio interface
-with gr.Blocks(title='Audio Steganography', theme=gr.themes.Soft(primary_hue="green", secondary_hue="green", spacing_size="sm", radius_size="lg")) as iface:
-    with gr.Group():
-        with gr.Row(variant='panel'):
-            with gr.Column():
-                gr.HTML("<center><h2><a href='https://t.me/pol1trees'>Telegram Channel</a></h2></center>")
-            with gr.Column():
-                gr.HTML("<center><h2><a href='https://t.me/+GMTP7hZqY0E4OGRi'>Telegram Chat</a></h2></center>")
-            with gr.Column():
-                gr.HTML("<center><h2><a href='https://www.youtube.com/channel/UCHb3fZEVxUisnqLqCrEM8ZA'>YouTube</a></h2></center>")
-            with gr.Column():
-                gr.HTML("<center><h2><a href='https://github.com/Bebra777228/Audio-Steganography'>GitHub</a></h2></center>")
-    with gr.Tab("INFO"):
-        with gr.Column(variant='panel'):
-            with gr.Group():
-                gr.HTML("<center><h2>Ha-Ha-Ha, I'm laughing at you.</h2></center>")
-                gr.HTML("<center><h2>People, before using this interface, read about what Steganography is.</h2></center>")
-                gr.HTML("<center><h2><b>Steganography is not Stable Diffusion and not Suno, why are you trying to generate images and music here?</b></h2></center>")
-        with gr.Column(variant='panel'):
-            with gr.Group():
-                gr.HTML("<center><h1><b>Steganography is a method of hiding information within other information or a physical object in such a way that it cannot be detected. Using steganography, you can hide almost any digital content, including texts, images, audio, and video files.</b></h2></center>")
-                gr.HTML("<center><h1><b>In this interface, steganography is used to hide text or an image in the spectrogram of an sound.</b></h1></center>")
-        with gr.Column(variant='panel'):
-            with gr.Group():
-                gr.Image(value="https://huggingface.co/spaces/Politrees/Audio-Steganography/resolve/main/content/1.jpg", show_label=False, show_share_button=False, show_download_button=False)
-                gr.Image(value="https://huggingface.co/spaces/Politrees/Audio-Steganography/resolve/main/content/2.jpg", show_label=False, show_share_button=False, show_download_button=False)
     with gr.Tab("Text to Spectrogram"):
-        gr.HTML("<center><h2>Oh my god people, learn to read. Go to the “INFO” tab, it says what this interface is and what it is for, don't be idiots.</h2></center>")
         with gr.Group():
             text = gr.Textbox(lines=2, placeholder="Enter your text:", label="Text")
             with gr.Row(variant='panel'):
@@ -123,7 +99,7 @@ with gr.Blocks(title='Audio Steganography', theme=gr.themes.Soft(primary_hue="gr
                 margin = gr.Slider(minimum=0, maximum=50, step=1, value=10, label="Indent")
                 letter_spacing = gr.Slider(minimum=0, maximum=50, step=1, value=5, label="Letter spacing")
             generate_button = gr.Button("Generate")
         with gr.Column(variant='panel'):
             with gr.Group():
                 output_audio = gr.Audio(type="filepath", label="Generated audio")
@@ -132,48 +108,35 @@ with gr.Blocks(title='Audio Steganography', theme=gr.themes.Soft(primary_hue="gr
         def gradio_interface_fn(text, base_width, height, max_font_size, margin, letter_spacing):
             print("\n", text)
             return create_audio_with_spectrogram(text, base_width, height, max_font_size, margin, letter_spacing)
-        generate_button.click(
-            gradio_interface_fn,
-            inputs=[text, base_width, height, max_font_size, margin, letter_spacing],
-            outputs=[output_audio, output_image]
-        )
     with gr.Tab("Image to Spectrogram"):
-        gr.HTML("<center><h2>Oh my god people, learn to read. Go to the “INFO” tab, it says what this interface is and what it is for, don't be idiots.</h2></center>")
         with gr.Group():
             with gr.Row(variant='panel'):
                 upload_image = gr.Image(type="filepath", label="Upload image")
                 convert_button = gr.Button("Convert to audio")
             with gr.Column(variant='panel'):
                 output_audio_from_image = gr.Audio(type="filepath", label="Generated audio")
             def gradio_image_to_audio_fn(upload_image):
                 return image_to_spectrogram_audio(upload_image)
-            convert_button.click(
-                gradio_image_to_audio_fn,
-                inputs=[upload_image],
-                outputs=[output_audio_from_image]
-            )
     with gr.Tab("Audio Spectrogram"):
         with gr.Group():
             with gr.Row(variant='panel'):
                 upload_audio = gr.Audio(type="filepath", label="Upload audio", scale=3)
                 decode_button = gr.Button("Show spectrogram", scale=2)
             with gr.Column(variant='panel'):
                 decoded_image = gr.Image(type="filepath", label="Audio Spectrogram")
             def gradio_decode_fn(upload_audio):
                 return display_audio_spectrogram(upload_audio)
-            decode_button.click(
-                gradio_decode_fn,
-                inputs=[upload_audio],
-                outputs=[decoded_image]
-            )
-iface.launch(share=True)

 import librosa.display
 import gradio as gr
 import soundfile as sf
+# Constants
+DEFAULT_FONT_PATH = "/usr/share/fonts/truetype/dejavu/DejaVuSans-Bold.ttf"
+DEFAULT_SAMPLE_RATE = 22050
 # Function for creating a spectrogram image with text
 def text_to_spectrogram_image(text, base_width=512, height=256, max_font_size=80, margin=10, letter_spacing=5):
+    try:
+        font = ImageFont.truetype(DEFAULT_FONT_PATH, max_font_size)
+    except IOError:
+        print(f"Font not found at {DEFAULT_FONT_PATH}. Using default font.")
         font = ImageFont.load_default()
     image = Image.new('L', (base_width, height), 'black')
     draw = ImageDraw.Draw(image)
+    text_width = sum(draw.textbbox((0, 0), char, font=font)[2] - draw.textbbox((0, 0), char, font=font)[0] + letter_spacing for char in text) - letter_spacing
+    text_height = draw.textbbox((0, 0), text[0], font=font)[3] - draw.textbbox((0, 0), text[0], font=font)[1]
     if text_width + margin * 2 > base_width:
         width = text_width + margin * 2
     image = Image.new('L', (width, height), 'black')
     draw = ImageDraw.Draw(image)
     text_x = (width - text_width) // 2
+    text_y = (height - text_height) // 2
     for char in text:
         draw.text((text_x, text_y), char, font=font, fill='white')
         char_bbox = draw.textbbox((0, 0), char, font=font)
         text_x += char_bbox[2] - char_bbox[0] + letter_spacing
     image = np.array(image)
     image = np.where(image > 0, 255, image)
     return image
 # Converting an image to audio
+def spectrogram_image_to_audio(image, sr=DEFAULT_SAMPLE_RATE):
     flipped_image = np.flipud(image)
     S = flipped_image.astype(np.float32) / 255.0 * 100.0
     y = librosa.griffinlim(S)
     spec_image = text_to_spectrogram_image(text, base_width, height, max_font_size, margin, letter_spacing)
     y = spectrogram_image_to_audio(spec_image)
     audio_path = 'output.wav'
+    sf.write(audio_path, y, DEFAULT_SAMPLE_RATE)
     image_path = 'spectrogram.png'
     plt.imsave(image_path, spec_image, cmap='gray')
     return audio_path, image_path
 # Function for displaying the spectrogram of an audio file
 def display_audio_spectrogram(audio_path):
+    y, sr = librosa.load(audio_path, sr=None)
     S = librosa.feature.melspectrogram(y=y, sr=sr)
     S_dB = librosa.power_to_db(S, ref=np.max)
     plt.figure(figsize=(10, 4))
+    librosa.display.specshow(S_dB, sr=sr, x_axis='time', y_axis='mel')
+    plt.colorbar(format='%+2.0f dB')
+    plt.title('Mel-frequency spectrogram')
     plt.tight_layout()
     spectrogram_path = 'uploaded_spectrogram.png'
     return spectrogram_path
 # Converting a downloaded image to an audio spectrogram
+def image_to_spectrogram_audio(image_path, sr=DEFAULT_SAMPLE_RATE):
     image = Image.open(image_path).convert('L')
     image = np.array(image)
     y = spectrogram_image_to_audio(image, sr)
     return img2audio_path
 # Gradio interface
+with gr.Blocks(title='Audio Steganography', theme=gr.themes.Soft(primary_hue="green", secondary_hue="green", spacing_size="sm", radius_size="lg")) as txt2spec:
     with gr.Tab("Text to Spectrogram"):
         with gr.Group():
             text = gr.Textbox(lines=2, placeholder="Enter your text:", label="Text")
             with gr.Row(variant='panel'):
                 margin = gr.Slider(minimum=0, maximum=50, step=1, value=10, label="Indent")
                 letter_spacing = gr.Slider(minimum=0, maximum=50, step=1, value=5, label="Letter spacing")
             generate_button = gr.Button("Generate")
         with gr.Column(variant='panel'):
             with gr.Group():
                 output_audio = gr.Audio(type="filepath", label="Generated audio")
         def gradio_interface_fn(text, base_width, height, max_font_size, margin, letter_spacing):
             print("\n", text)
             return create_audio_with_spectrogram(text, base_width, height, max_font_size, margin, letter_spacing)
+        generate_button.click(gradio_interface_fn, inputs=[text, base_width, height, max_font_size, margin, letter_spacing], outputs=[output_audio, output_image])
     with gr.Tab("Image to Spectrogram"):
         with gr.Group():
             with gr.Row(variant='panel'):
                 upload_image = gr.Image(type="filepath", label="Upload image")
                 convert_button = gr.Button("Convert to audio")
             with gr.Column(variant='panel'):
                 output_audio_from_image = gr.Audio(type="filepath", label="Generated audio")
             def gradio_image_to_audio_fn(upload_image):
                 return image_to_spectrogram_audio(upload_image)
+            convert_button.click(gradio_image_to_audio_fn, inputs=[upload_image], outputs=[output_audio_from_image])
     with gr.Tab("Audio Spectrogram"):
         with gr.Group():
             with gr.Row(variant='panel'):
                 upload_audio = gr.Audio(type="filepath", label="Upload audio", scale=3)
                 decode_button = gr.Button("Show spectrogram", scale=2)
             with gr.Column(variant='panel'):
                 decoded_image = gr.Image(type="filepath", label="Audio Spectrogram")
             def gradio_decode_fn(upload_audio):
                 return display_audio_spectrogram(upload_audio)
+            decode_button.click(gradio_decode_fn, inputs=[upload_audio], outputs=[decoded_image])
+txt2spec.launch(share=True)