Spaces:

Lenylvt
/

SRT_Translation

Running

App Files Community

Lenylvt committed on Feb 16, 2024

Commit

2a618ec

verified ·

1 Parent(s): d112fe6

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -23

app.py CHANGED Viewed

@@ -1,20 +1,16 @@
-import io
-import os
-import requests
 import streamlit as st
 import pandas as pd
 import pysrt
 from transformers import MarianMTModel, MarianTokenizer
 import tempfile
-os.environ['CURL_CA_BUNDLE'] = ''
 def fetch_languages(url):
     response = requests.get(url)
     if response.status_code == 200:
-        # Convert bytes to a string using decode, then create a file-like object with io.StringIO
         csv_content = response.content.decode('utf-8')
-        df = pd.read_csv(io.StringIO(csv_content), delimiter="|", skiprows=2, header=None).dropna(axis=1, how='all')
         df.columns = ['ISO 639-1', 'ISO 639-2', 'Language Name', 'Native Name']
         df['ISO 639-1'] = df['ISO 639-1'].str.strip()
         language_options = [(row['ISO 639-1'], f"{row['ISO 639-1']} - {row['Language Name']}") for index, row in df.iterrows()]
@@ -42,19 +38,12 @@ def translate_text(text, source_language_code, target_language_code):
 def translate_srt(input_file, source_language_code, target_language_code):
     subs = pysrt.open(input_file)
     translated_subs = []
-    progress_bar = st.progress(0)
     for idx, sub in enumerate(subs):
         translated_text = translate_text(sub.text, source_language_code, target_language_code)
         translated_sub = pysrt.SubRipItem(index=idx+1, start=sub.start, end=sub.end, text=translated_text)
         translated_subs.append(translated_sub)
-        progress_bar.progress((idx + 1) / len(subs))
     translated_file = pysrt.SubRipFile(translated_subs)
-    # Use tempfile to create a temporary file path
-    with tempfile.NamedTemporaryFile(suffix=".srt", delete=False) as tmp_file:
-        translated_file.save(tmp_file.name)
-        translated_srt_path = tmp_file.name
-    progress_bar.empty()
-    return translated_srt_path
 st.title("SRT Translator")
 st.write("Translate subtitles from one language to another.")
@@ -63,14 +52,29 @@ st.write("Translate subtitles from one language to another.")
 url = "https://huggingface.co/Lenylvt/LanguageISO/resolve/main/iso.md"
 language_options = fetch_languages(url)
-source_language_code = st.selectbox("Select Source Language", options=language_options, format_func=lambda x: x[1])
-target_language_code = st.selectbox("Select Target Language", options=language_options, format_func=lambda x: x[1])
 file_input = st.file_uploader("Upload SRT File", type=["srt"])
-if file_input is not None:
-    with tempfile.NamedTemporaryFile(suffix=".srt", delete=False) as temp_file:
-        temp_file.write(file_input.read())
-        temp_file.seek(0)
-        translated_srt_path = translate_srt(temp_file.name, source_language_code, target_language_code)
-        st.success(f"Translation complete! You can download the translated SRT file from [here]({translated_srt_path})")

 import streamlit as st
 import pandas as pd
 import pysrt
 from transformers import MarianMTModel, MarianTokenizer
 import tempfile
+from io import BytesIO
+import requests
 def fetch_languages(url):
     response = requests.get(url)
     if response.status_code == 200:
         csv_content = response.content.decode('utf-8')
+        df = pd.read_csv(BytesIO(response.content), delimiter="|", skiprows=2, header=None).dropna(axis=1, how='all')
         df.columns = ['ISO 639-1', 'ISO 639-2', 'Language Name', 'Native Name']
         df['ISO 639-1'] = df['ISO 639-1'].str.strip()
         language_options = [(row['ISO 639-1'], f"{row['ISO 639-1']} - {row['Language Name']}") for index, row in df.iterrows()]
 def translate_srt(input_file, source_language_code, target_language_code):
     subs = pysrt.open(input_file)
     translated_subs = []
     for idx, sub in enumerate(subs):
         translated_text = translate_text(sub.text, source_language_code, target_language_code)
         translated_sub = pysrt.SubRipItem(index=idx+1, start=sub.start, end=sub.end, text=translated_text)
         translated_subs.append(translated_sub)
     translated_file = pysrt.SubRipFile(translated_subs)
+    return translated_file
 st.title("SRT Translator")
 st.write("Translate subtitles from one language to another.")
 url = "https://huggingface.co/Lenylvt/LanguageISO/resolve/main/iso.md"
 language_options = fetch_languages(url)
+source_language_code, target_language_code = None, None
+if language_options:
+    source_language_code = st.selectbox("Select Source Language", options=language_options, format_func=lambda x: x[1])[0]
+    target_language_code = st.selectbox("Select Target Language", options=language_options, format_func=lambda x: x[1])[0]
 file_input = st.file_uploader("Upload SRT File", type=["srt"])
+if file_input is not None and source_language_code and target_language_code:
+    translated_srt = translate_srt(file_input, source_language_code, target_language_code)
+    # Save the translated subtitles to an in-memory buffer
+    buffer = BytesIO()
+    translated_srt.save(buffer, encoding='utf-8')
+    buffer.seek(0)
+    # Convert the BytesIO buffer to bytes for the download button
+    translated_srt_bytes = buffer.getvalue()
+    # Create a download button and serve the translated subtitles as a downloadable file
+    st.download_button(
+        label="Download Translated SRT",
+        data=translated_srt_bytes,
+        file_name="translated_subtitles.srt",
+        mime="text/plain",
+    )