Spaces:

Cachoups
/

FinanceReport

Sleeping

App Files Files Community

Cachoups committed on Sep 20, 2024

Commit

d5ac762

verified ·

1 Parent(s): 3373145

Update app.py

Browse files

Files changed (1) hide show

app.py +67 -31

app.py CHANGED Viewed

@@ -324,70 +324,106 @@ with gr.Blocks() as demo:
         - For the selected topic (sheet name), find related sentences in the associated PDF text that mention the topic, and classify them by sentiment.
         - For a selected country and topic, describe the adverse growth rate trend over three years using the [**google/flan-t5-base**](https://huggingface.co/google/flan-t5-base).
         """)
-    with gr.Tab("Financial Report Text Analysis"):
-        gr.Markdown("## Paragraph Extraction and Analysis on Adverse Macro-Economy Scenarios")
         with gr.Row():
             with gr.Column():
-                gr.Markdown("### Step 1: Upload and Extract Paragraphs")
                 pdf1 = gr.Dropdown(choices=get_pdf_files(PDF_FOLDER), label="Select PDF 1")
                 pdf2 = gr.Dropdown(choices=get_pdf_files(PDF_FOLDER), label="Select PDF 2")
-                extract_button = gr.Button("Extract Paragraphs")
             with gr.Column():
-                gr.Markdown("### Step 2: Select Paragraphs for Analysis")
                 paragraph_1_dropdown = gr.Dropdown(label="Select Paragraph from PDF 1")
                 paragraph_2_dropdown = gr.Dropdown(label="Select Paragraph from PDF 2")
                 def update_paragraphs(pdf1, pdf2):
                     stored_paragraphs_1, stored_paragraphs_2 = extract_and_paragraph(pdf1, pdf2, True)
-                    return [f"Paragraph {i+1}: {p[:100]}..." for i, p in enumerate(stored_paragraphs_1)], \
-                           [f"Paragraph {i+1}: {p[:100]}..." for i, p in enumerate(stored_paragraphs_2)]
-                extract_button.click(update_paragraphs, inputs=[pdf1, pdf2], outputs=[paragraph_1_dropdown, paragraph_2_dropdown])
         with gr.Row():
             with gr.Column():
                 gr.Markdown("### PDF 1 Analysis")
                 summarize_btn1 = gr.Button("Summarize Text from PDF 1")
                 summary_textbox_1 = gr.Textbox(label="Summary for PDF 1", lines=2)
                 sentiment_btn1 = gr.Button("Classify Financial Tone from PDF 1")
-                sentiment_textbox_1 = gr.Textbox(label="Tone Classification for PDF 1", lines=1)
-                summarize_btn1.click(process_paragraph_1_sum, inputs=paragraph_1_dropdown, outputs=summary_textbox_1)
-                sentiment_btn1.click(process_paragraph_1_sent, inputs=paragraph_1_dropdown, outputs=sentiment_textbox_1)
             with gr.Column():
                 gr.Markdown("### PDF 2 Analysis")
                 summarize_btn2 = gr.Button("Summarize Text from PDF 2")
                 summary_textbox_2 = gr.Textbox(label="Summary for PDF 2", lines=2)
                 sentiment_btn2 = gr.Button("Classify Financial Tone from PDF 2")
-                sentiment_textbox_2 = gr.Textbox(label="Tone Classification for PDF 2", lines=1)
-                summarize_btn2.click(process_paragraph_2_sum, inputs=paragraph_2_dropdown, outputs=summary_textbox_2)
-                sentiment_btn2.click(process_paragraph_2_sent, inputs=paragraph_2_dropdown, outputs=sentiment_textbox_2)
     with gr.Tab("Financial Report Table Analysis"):
-        gr.Markdown("## Excel Data Comparison and Topic Analysis")
         with gr.Row():
             with gr.Column():
-                gr.Markdown("### Step 1: Upload Excel Files")
                 file1 = gr.Dropdown(choices=get_excel_files(PDF_FOLDER), label="Select Excel File 1")
                 file2 = gr.Dropdown(choices=get_excel_files(PDF_FOLDER), label="Select Excel File 2")
-                sheet = gr.Dropdown(choices=["GDP", "HICP", "RRE prices", "Unemployment", "CRE prices"], label="Select Sheet")
             with gr.Column():
-                gr.Markdown("### Step 2: Select a Country for Adverse Growth Analysis")
                 country_1_dropdown = gr.Dropdown(label="Select Country from Excel File 1")
                 country_2_dropdown = gr.Dropdown(label="Select Country from Excel File 2")
-        with gr.Row():
-            gr.Markdown("### Step 3: Compare Data and Generate Reports")
-            comparison_button = gr.Button("Compare Data")
-            text_result_df1 = gr.Textbox(label="Adverse Growth Report for Excel File 1", lines=4)
-            text_result_df2 = gr.Textbox(label="Adverse Growth Report for Excel File 2", lines=4)
-            comparison_button.click(fn=process_and_compare, inputs=[file1, sheet, file2], outputs=[text_result_df1, text_result_df2])
-demo.launch()

         - For the selected topic (sheet name), find related sentences in the associated PDF text that mention the topic, and classify them by sentiment.
         - For a selected country and topic, describe the adverse growth rate trend over three years using the [**google/flan-t5-base**](https://huggingface.co/google/flan-t5-base).
         """)
+     with gr.Tab("Financial Report Text Analysis"):
+        gr.Markdown("## Financial Report Paragraph Selection and Analysis on adverse macro-economy scenario")
         with gr.Row():
+            # Upload PDFs
             with gr.Column():
                 pdf1 = gr.Dropdown(choices=get_pdf_files(PDF_FOLDER), label="Select PDF 1")
                 pdf2 = gr.Dropdown(choices=get_pdf_files(PDF_FOLDER), label="Select PDF 2")
             with gr.Column():
+                b1 = gr.Button("Extract and Display Paragraphs")
                 paragraph_1_dropdown = gr.Dropdown(label="Select Paragraph from PDF 1")
                 paragraph_2_dropdown = gr.Dropdown(label="Select Paragraph from PDF 2")
                 def update_paragraphs(pdf1, pdf2):
+                    global stored_paragraphs_1, stored_paragraphs_2
                     stored_paragraphs_1, stored_paragraphs_2 = extract_and_paragraph(pdf1, pdf2, True)
+                    updated_dropdown_1 = [f"Paragraph {i+1}: {p[:100]}..." for i, p in enumerate(stored_paragraphs_1)]
+                    updated_dropdown_2 = [f"Paragraph {i+1}: {p[:100]}..." for i, p in enumerate(stored_paragraphs_2)]
+                    return gr.update(choices=updated_dropdown_1), gr.update(choices=updated_dropdown_2)
+                b1.click(fn=update_paragraphs, inputs=[pdf1, pdf2], outputs=[paragraph_1_dropdown, paragraph_2_dropdown])
         with gr.Row():
+            # Process the selected paragraph from PDF 1
             with gr.Column():
                 gr.Markdown("### PDF 1 Analysis")
+                selected_paragraph_1 = gr.Textbox(label="Selected Paragraph 1 Content", lines=4)
                 summarize_btn1 = gr.Button("Summarize Text from PDF 1")
                 summary_textbox_1 = gr.Textbox(label="Summary for PDF 1", lines=2)
+                summarize_btn1.click(fn=lambda p: process_paragraph_1_sum(p), inputs=paragraph_1_dropdown, outputs=summary_textbox_1)
                 sentiment_btn1 = gr.Button("Classify Financial Tone from PDF 1")
+                sentiment_textbox_1 = gr.Textbox(label="Classification for PDF 1", lines=1)
+                sentiment_btn1.click(fn=lambda p: process_paragraph_1_sent(p), inputs=paragraph_1_dropdown, outputs=sentiment_textbox_1)
+                analyze_btn1 = gr.Button("Analyze Financial Tone on each sentence with yiyanghkust/finbert-tone")
+                fin_spans_1 = gr.HighlightedText(label="Financial Tone Analysis for PDF 1")
+                analyze_btn1.click(fn=lambda p: process_paragraph_1_sent_tone(p), inputs=paragraph_1_dropdown, outputs=fin_spans_1)
+                analyze_btn1_ = gr.Button("Analyze Financial Tone on each sentence with ProsusAI/finbert")
+                fin_spans_1_ = gr.HighlightedText(label="Financial Tone Analysis for PDF 1 bis")
+                analyze_btn1_.click(fn=lambda p: process_paragraph_1_sent_tone_bis(p), inputs=paragraph_1_dropdown, outputs=fin_spans_1_)
+            # Process the selected paragraph from PDF 2
             with gr.Column():
                 gr.Markdown("### PDF 2 Analysis")
+                selected_paragraph_2 = gr.Textbox(label="Selected Paragraph 2 Content", lines=4)
+                selected_paragraph_2.change(show, paragraph_2_dropdown, selected_paragraph_2)
                 summarize_btn2 = gr.Button("Summarize Text from PDF 2")
                 summary_textbox_2 = gr.Textbox(label="Summary for PDF 2", lines=2)
+                summarize_btn2.click(fn=lambda p: process_paragraph_2_sum(p), inputs=paragraph_2_dropdown, outputs=summary_textbox_2)
                 sentiment_btn2 = gr.Button("Classify Financial Tone from PDF 2")
+                sentiment_textbox_2 = gr.Textbox(label="Classification for PDF 2", lines=1)
+                sentiment_btn2.click(fn=lambda p: process_paragraph_2_sent(p), inputs=paragraph_2_dropdown, outputs=sentiment_textbox_2)
+                analyze_btn2 = gr.Button("Analyze Financial Tone on each sentence with yiyanghkust/finbert-tone")
+                fin_spans_2 = gr.HighlightedText(label="Financial Tone Analysis for PDF 2")
+                analyze_btn2.click(fn=lambda p: process_paragraph_2_sent_tone(p), inputs=paragraph_2_dropdown, outputs=fin_spans_2)
+                analyze_btn2_ = gr.Button("Analyze Financial Tone on each sentence with ProsusAI/finbert")
+                fin_spans_2_ = gr.HighlightedText(label="Financial Tone Analysis for PDF 2 bis")
+                analyze_btn2_.click(fn=lambda p: process_paragraph_2_sent_tone_bis(p), inputs=paragraph_2_dropdown, outputs=fin_spans_2_)
     with gr.Tab("Financial Report Table Analysis"):
+        # New tab content goes here
+        gr.Markdown("## Excel Data Comparison")
         with gr.Row():
             with gr.Column():
                 file1 = gr.Dropdown(choices=get_excel_files(PDF_FOLDER), label="Select Excel File 1")
                 file2 = gr.Dropdown(choices=get_excel_files(PDF_FOLDER), label="Select Excel File 2")
+                sheet = gr.Dropdown(choices=["GDP", "HICP", "RRE prices", "Unemployment", "CRE prices"], label="Select Sheet for File 1 and 2")
             with gr.Column():
+                result = gr.Image(label="Comparison pLot")
+        def update_sheets(file):
+            return get_sheet_names(file)
+        b1 = gr.Button("Compare Data")
+        b2 = gr.Button("Extract text information")
+        with gr.Row():
+            with gr.Column():
+                sentiment_results_pdf1 = gr.HighlightedText(label="Sentiment Analysis - PDF 1")
                 country_1_dropdown = gr.Dropdown(label="Select Country from Excel File 1")
+                summarize_btn1_country = gr.Button("Summary for the selected country")
+                text_result_df1 = gr.Textbox(label="Sentence for excel file 1", lines=2)
+                summarize_btn1_country.click(fn=lambda country, theme: generate_text(stored_df1, country, theme),
+                             inputs=[country_1_dropdown, sheet],
+                             outputs=text_result_df1)
+            with gr.Column():
+                sentiment_results_pdf2 = gr.HighlightedText(label="Sentiment Analysis - PDF 2")
                 country_2_dropdown = gr.Dropdown(label="Select Country from Excel File 2")
+                summarize_btn2_country = gr.Button("Summary for the selected country")
+                text_result_df2 = gr.Textbox(label="Sentence for excel file 2", lines=2)
+                summarize_btn2_country.click(fn=lambda country, theme: generate_text(stored_df2, country, theme),
+                             inputs=[country_2_dropdown, sheet],
+                             outputs=text_result_df2)
+        # Button to extract text from PDFs and perform sentiment analysis
+        b1.click(fn=process_and_compare, inputs=[file1, sheet, file2, sheet], outputs=[result,country_1_dropdown, country_2_dropdown])
+        b2.click(fn=process_pdfs_and_analyze_sentiment, inputs=[file1, file2, sheet], outputs=[sentiment_results_pdf1, sentiment_results_pdf2])
+demo.launch()