Spaces:

kambris
/

SoLProject

Runtime error

App Files Community

kambris committed on Nov 26, 2024

Commit

e9be7bd

verified ·

1 Parent(s): e8e9aaf

Update app.py

Browse files

Files changed (1) hide show

app.py +2 -11

app.py CHANGED Viewed

@@ -14,7 +14,6 @@ import pkg_resources
 current_dir = os.path.dirname(os.path.abspath(__file__))
 font_path = os.path.join(current_dir, "ArabicR2013-J25x.ttf")
-# Add Arabic stop words
 ARABIC_STOP_WORDS = {
     'في', 'من', 'إلى', 'على', 'عن', 'مع', 'خلال', 'حتى', 'إذا', 'ثم',
     'أو', 'و', 'ف', 'ل', 'ب', 'ك', 'لل', 'ال', 'هذا', 'هذه', 'ذلك',
@@ -31,7 +30,7 @@ ARABIC_STOP_WORDS = {
     'اول', 'ضمن', 'انها', 'جميع', 'الذي', 'قبل', 'بعد', 'حول', 'ايضا',
     'لازم', 'حاجة', 'علي', 'يجب', 'صار', 'صارت', 'تحت', 'ضد'
     }
-# Configure page
 st.set_page_config(
     page_title="Arabic Poem Analysis",
     page_icon="📚",
@@ -250,7 +249,6 @@ def process_and_summarize(df, bert_tokenizer, bert_model, emotion_classifier, to
         embedding_model=bert_model,
         **topic_model_params)
-    # Create vectorizer with stop words
     vectorizer = CountVectorizer(stop_words=list(ARABIC_STOP_WORDS),
                                 min_df=1,
                                 max_df=1.0)
@@ -316,7 +314,7 @@ def process_and_summarize(df, bert_tokenizer, bert_model, emotion_classifier, to
             continue
     return summaries, topic_model
-# Load models
 try:
     bert_tokenizer, bert_model, emotion_classifier = load_models()
     st.success("Models loaded successfully!")
@@ -328,28 +326,23 @@ except Exception as e:
 st.title("📚 Arabic Poem Analysis")
 st.write("Upload a CSV or Excel file containing Arabic poems with columns `country` and `poem`.")
-# File upload
 uploaded_file = st.file_uploader("Choose a file", type=["csv", "xlsx"])
 if uploaded_file is not None:
     try:
-        # Read the file
         if uploaded_file.name.endswith('.csv'):
             df = pd.read_csv(uploaded_file)
         else:
             df = pd.read_excel(uploaded_file)
-        # Validate columns
         required_columns = ['country', 'poem']
         if not all(col in df.columns for col in required_columns):
             st.error("File must contain 'country' and 'poem' columns.")
             st.stop()
-        # Clean data
         df['country'] = df['country'].str.strip()
         df = df.dropna(subset=['country', 'poem'])
-        # Add topic modeling controls
         st.subheader("Topic Modeling Settings")
         col1, col2 = st.columns(2)
@@ -404,7 +397,6 @@ if uploaded_file is not None:
                 if summaries:
                     st.success("Analysis complete!")
-                    # Display results in tabs
                     tab1, tab2 = st.tabs(["Country Summaries", "Global Topics"])
                     with tab1:
@@ -445,7 +437,6 @@ if uploaded_file is not None:
 else:
     st.info("👆 Upload a file to get started!")
-    # Example format
     st.write("### Expected File Format:")
     example_df = pd.DataFrame({
         'country': ['Egypt', 'Palestine'],

 current_dir = os.path.dirname(os.path.abspath(__file__))
 font_path = os.path.join(current_dir, "ArabicR2013-J25x.ttf")
 ARABIC_STOP_WORDS = {
     'في', 'من', 'إلى', 'على', 'عن', 'مع', 'خلال', 'حتى', 'إذا', 'ثم',
     'أو', 'و', 'ف', 'ل', 'ب', 'ك', 'لل', 'ال', 'هذا', 'هذه', 'ذلك',
     'اول', 'ضمن', 'انها', 'جميع', 'الذي', 'قبل', 'بعد', 'حول', 'ايضا',
     'لازم', 'حاجة', 'علي', 'يجب', 'صار', 'صارت', 'تحت', 'ضد'
     }
 st.set_page_config(
     page_title="Arabic Poem Analysis",
     page_icon="📚",
         embedding_model=bert_model,
         **topic_model_params)
     vectorizer = CountVectorizer(stop_words=list(ARABIC_STOP_WORDS),
                                 min_df=1,
                                 max_df=1.0)
             continue
     return summaries, topic_model
 try:
     bert_tokenizer, bert_model, emotion_classifier = load_models()
     st.success("Models loaded successfully!")
 st.title("📚 Arabic Poem Analysis")
 st.write("Upload a CSV or Excel file containing Arabic poems with columns `country` and `poem`.")
 uploaded_file = st.file_uploader("Choose a file", type=["csv", "xlsx"])
 if uploaded_file is not None:
     try:
         if uploaded_file.name.endswith('.csv'):
             df = pd.read_csv(uploaded_file)
         else:
             df = pd.read_excel(uploaded_file)
         required_columns = ['country', 'poem']
         if not all(col in df.columns for col in required_columns):
             st.error("File must contain 'country' and 'poem' columns.")
             st.stop()
         df['country'] = df['country'].str.strip()
         df = df.dropna(subset=['country', 'poem'])
         st.subheader("Topic Modeling Settings")
         col1, col2 = st.columns(2)
                 if summaries:
                     st.success("Analysis complete!")
                     tab1, tab2 = st.tabs(["Country Summaries", "Global Topics"])
                     with tab1:
 else:
     st.info("👆 Upload a file to get started!")
     st.write("### Expected File Format:")
     example_df = pd.DataFrame({
         'country': ['Egypt', 'Palestine'],