Spaces:

arad1367
/

Text_To_Speech_App_5_Languages

Running

App Files Files Community

arad1367 committed on Sep 16

Commit

f17813b

•

1 Parent(s): 3ba5689

Upload 2 files

Browse files

Files changed (2) hide show

app.py +74 -0
requirements.txt +66 -0

app.py ADDED Viewed

	@@ -0,0 +1,74 @@

+import gradio as gr
+from gtts import gTTS
+from pdfplumber import open as pp_open
+import os
+def convert_pdf_to_speech(pdf, language):
+    """
+    This function takes in a PDF file and converts it to speech.
+    Parameters:
+    pdf (str): The path to the PDF file.
+    language (str): The language of the text.
+    Returns:
+    A message stating that the PDF has been converted to speech.
+    """
+    # Extract text from our pdf
+    pdf_content = ""
+    with pp_open(pdf) as pdf_file:
+        for page in pdf_file.pages:
+            pdf_content += page.extract_text()
+    # Convert pdf to speech and make AudioBook!
+    tts = gTTS(text=pdf_content, lang=language)
+    filename = os.path.basename(pdf)
+    filename = f"{filename.split('.')[0]}.mp3"
+    tts.save(filename)
+    return f"Your PDF has been converted to speech. The MP3 file is saved as {os.path.abspath(filename)}"
+demo = gr.Blocks(theme='gradio/soft')
+with demo:
+    # App description
+    with gr.Column():
+        gr.Markdown("<b>PDF Text-to-Speech Converter</b>")
+        gr.Markdown("Convert your PDF files to audio books")
+    # Input for the PDF
+    pdf_input = gr.File(label="Select a PDF", type="filepath")
+    # Language selector
+    language_selector = gr.Dropdown(
+        label="Language",
+        value="en",
+        choices=["en", "es", "de", "it", "fr"],
+        interactive=True,
+    )
+    # Button to start the conversion process
+    button = gr.Button("Convert PDF to Speech")
+    # Output message
+    output = gr.Textbox(label="Output")
+    with gr.Column():
+        # Footer with links to LinkedIn, GitHub and Live demo of PhD defense
+        footer_html = """
+<div style="text-align: center; margin-top: 20px;">
+    <a href="https://www.linkedin.com/in/pejman-ebrahimi-4a60151a7/" target="_blank">LinkedIn</a> |
+    <a href="https://github.com/arad1367" target="_blank">GitHub</a> |
+    <a href="https://arad1367.pythonanywhere.com/" target="_blank">Live demo of my PhD defense</a>
+    <br>
+    Made with 💖 by Pejman Ebrahimi
+</div>
+"""
+        gr.HTML(footer_html)
+    # Layout the components
+    button.click(convert_pdf_to_speech, inputs=[pdf_input, language_selector], outputs=output)
+demo.launch()

requirements.txt ADDED Viewed

	@@ -0,0 +1,66 @@

+aiofiles==23.2.1
+annotated-types==0.7.0
+anyio==4.4.0
+certifi==2024.8.30
+cffi==1.17.1
+charset-normalizer==3.3.2
+click==8.1.7
+colorama==0.4.6
+contourpy==1.3.0
+cryptography==43.0.1
+cycler==0.12.1
+exceptiongroup==1.2.2
+fastapi==0.114.2
+ffmpy==0.4.0
+filelock==3.16.0
+fonttools==4.53.1
+fsspec==2024.9.0
+gradio==4.44.0
+gradio_client==1.3.0
+gTTS==2.5.3
+h11==0.14.0
+httpcore==1.0.5
+httpx==0.27.2
+huggingface-hub==0.24.7
+idna==3.10
+importlib_resources==6.4.5
+Jinja2==3.1.4
+kiwisolver==1.4.7
+markdown-it-py==3.0.0
+MarkupSafe==2.1.5
+matplotlib==3.9.2
+mdurl==0.1.2
+numpy==2.1.1
+orjson==3.10.7
+packaging==24.1
+pandas==2.2.2
+pdfminer.six==20231228
+pdfplumber==0.11.4
+pillow==10.4.0
+pycparser==2.22
+pydantic==2.9.1
+pydantic_core==2.23.3
+pydub==0.25.1
+Pygments==2.18.0
+pyparsing==3.1.4
+pypdfium2==4.30.0
+python-dateutil==2.9.0.post0
+python-multipart==0.0.9
+pytz==2024.2
+PyYAML==6.0.2
+requests==2.32.3
+rich==13.8.1
+ruff==0.6.5
+semantic-version==2.10.0
+shellingham==1.5.4
+six==1.16.0
+sniffio==1.3.1
+starlette==0.38.5
+tomlkit==0.12.0
+tqdm==4.66.5
+typer==0.12.5
+typing_extensions==4.12.2
+tzdata==2024.1
+urllib3==2.2.3
+uvicorn==0.30.6
+websockets==12.0