Spaces:

pelinbalci
/

LanguageDetection

Sleeping

pelinbalci committed on May 21, 2023

Commit

5372fcc

•

1 Parent(s): 19f568a

initial commit

Files changed (4) hide show

main.py ADDED Viewed

+import streamlit as st
+import json
+import requests
+from model import predict_pipeline
+st.title("Language Detection Model")
+st.write("")
+st.write("Supported Languages:")
+col1, col2, col3, col4 = st.columns(4)
+with col1:
+    st.markdown("- Arabic")
+    st.markdown("- Danish")
+    st.markdown("- Dutch")
+    st.markdown("- English")
+    st.markdown("- French")
+with col2:
+    st.markdown("- German")
+    st.markdown("- Greek")
+    st.markdown("- Hindi")
+    st.markdown("- Italian")
+with col3:
+    st.markdown("- Kannada")
+    st.markdown("- Malayalam")
+    st.markdown("- Portugeese")
+    st.markdown("- Russian")
+with col4:
+    st.markdown("- Spanish")
+    st.markdown("- Sweedish")
+    st.markdown("- Tamil")
+    st.markdown("- Turkish")
+st.markdown('''
+<style>
+[data-testid="stMarkdownContainer"] ul{
+    list-style-position: inside;
+}
+</style>
+''', unsafe_allow_html=True)
+title = st.text_input('Input text', 'Please enter the text here')
+st.write('The current text is', title)
+inputs = {"text": title}
+if st.button("Detect Language"):
+    language = predict_pipeline(json.dumps(inputs))
+    st.write(f'Language: {language}')

model.py ADDED Viewed

+import pickle
+import re
+from pathlib import Path
+__version__ = "0.1.0"
+BASE_DIR = Path(__file__).resolve(strict=True).parent
+with open(f"{BASE_DIR}/trained_pipeline-{__version__}.pkl", "rb") as f:
+    model = pickle.load(f)
+classes = [
+    "Arabic",
+    "Danish",
+    "Dutch",
+    "English",
+    "French",
+    "German",
+    "Greek",
+    "Hindi",
+    "Italian",
+    "Kannada",
+    "Malayalam",
+    "Portugeese",
+    "Russian",
+    "Spanish",
+    "Sweedish",
+    "Tamil",
+    "Turkish",
+]
+def predict_pipeline(text):
+    text = re.sub(r'[!@#$(),\n"%^*?\:;~`0-9]', " ", text)
+    text = re.sub(r"[[]]", " ", text)
+    text = text.lower()
+    pred = model.predict([text])
+    return classes[pred[0]]

requirements.txt ADDED Viewed

+streamlit==1.22.0
+requests==2.30.0
+scikit-learn==1.2.2

trained_pipeline-0.1.0.pkl ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:0894da01a3536140440401b6623cb33fd13d6e9791129bf5830d3e0b57a22d16
+size 9982945