Update app.py
Browse files
app.py
CHANGED
@@ -73,15 +73,8 @@ def translate_text(text, source_lang, target_lang):
|
|
73 |
return translated_text
|
74 |
|
75 |
# Summarization function with multi-language support
|
76 |
-
def summarize_text(text, source_language="English", target_language="English"):
|
77 |
-
|
78 |
-
target_lang_code = LANGUAGES[target_language]
|
79 |
-
|
80 |
-
# If the input language is not English, translate to English
|
81 |
-
if source_lang_code != "en_XX":
|
82 |
-
text = translate_text(text, source_lang_code, "en_XX")
|
83 |
-
|
84 |
-
# Summarize the text using mBART
|
85 |
inputs = multilingual_summarization_tokenizer(text, return_tensors='pt', padding=True, truncation=True)
|
86 |
summary_ids = multilingual_summarization_model.generate(
|
87 |
inputs['input_ids'],
|
@@ -93,6 +86,8 @@ def summarize_text(text, source_language="English", target_language="English"):
|
|
93 |
)
|
94 |
summary = multilingual_summarization_tokenizer.decode(summary_ids[0], skip_special_tokens=True)
|
95 |
|
|
|
|
|
96 |
# Translate summary to the target language if needed
|
97 |
if target_lang_code != "en_XX":
|
98 |
summary = translate_text(summary, "en_XX", target_lang_code)
|
@@ -102,13 +97,12 @@ def summarize_text(text, source_language="English", target_language="English"):
|
|
102 |
# Streamlit interface
|
103 |
st.title("Multi-Language Text Summarization Tool")
|
104 |
|
105 |
-
text = st.text_area("Input Text")
|
106 |
-
|
107 |
-
target_language = st.selectbox("Target Language", options=list(LANGUAGES.keys()), index=list(LANGUAGES.keys()).index("English"))
|
108 |
|
109 |
if st.button("Summarize"):
|
110 |
if text:
|
111 |
-
summary = summarize_text(text,
|
112 |
st.subheader("Summary")
|
113 |
st.write(summary)
|
114 |
else:
|
|
|
73 |
return translated_text
|
74 |
|
75 |
# Summarization function with multi-language support
|
76 |
+
def summarize_text(text, target_language="English"):
|
77 |
+
# Summarize the text using mBART (assuming input text is in English)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
78 |
inputs = multilingual_summarization_tokenizer(text, return_tensors='pt', padding=True, truncation=True)
|
79 |
summary_ids = multilingual_summarization_model.generate(
|
80 |
inputs['input_ids'],
|
|
|
86 |
)
|
87 |
summary = multilingual_summarization_tokenizer.decode(summary_ids[0], skip_special_tokens=True)
|
88 |
|
89 |
+
target_lang_code = LANGUAGES[target_language]
|
90 |
+
|
91 |
# Translate summary to the target language if needed
|
92 |
if target_lang_code != "en_XX":
|
93 |
summary = translate_text(summary, "en_XX", target_lang_code)
|
|
|
97 |
# Streamlit interface
|
98 |
st.title("Multi-Language Text Summarization Tool")
|
99 |
|
100 |
+
text = st.text_area("Input Text (in English)")
|
101 |
+
target_language = st.selectbox("Target Language for Summary", options=list(LANGUAGES.keys()), index=list(LANGUAGES.keys()).index("English"))
|
|
|
102 |
|
103 |
if st.button("Summarize"):
|
104 |
if text:
|
105 |
+
summary = summarize_text(text, target_language)
|
106 |
st.subheader("Summary")
|
107 |
st.write(summary)
|
108 |
else:
|