Spaces:

walaa2022
/

financial_analysis

Sleeping

App Files Community

walaa2022 committed on Dec 5, 2024

Commit

cd3edfb

verified ·

1 Parent(s): db53aac

Update app.py

Browse files

Files changed (1) hide show

app.py +106 -66

app.py CHANGED Viewed

@@ -25,9 +25,7 @@ class FinancialAnalyzer:
         """Clean and convert numerical values"""
         try:
             if isinstance(value, str):
-                # Remove currency symbols, commas, spaces
                 value = value.replace('$', '').replace(',', '').strip()
-                # Handle parentheses for negative numbers
                 if '(' in value and ')' in value:
                     value = '-' + value.replace('(', '').replace(')', '')
             return float(value or 0)
@@ -39,7 +37,6 @@ class FinancialAnalyzer:
         try:
             with open(file_path, 'r') as f:
                 content = f.read()
-            # Simple check for Markdown structure
             return any(line.startswith('#') or '|' in line for line in content.split('\n'))
         except:
             return False
@@ -60,14 +57,13 @@ class FinancialAnalyzer:
                     current_table = []
                     headers = None
                 elif '|' in line:
-                    if '-|-' not in line:  # Skip separator lines
                         row = [cell.strip() for cell in line.split('|')[1:-1]]
                         if not headers:
                             headers = row
                         else:
                             current_table.append(row)
-            # Process last table
             if current_table and headers:
                 data[current_section] = self.process_table(headers, current_table)
@@ -91,69 +87,122 @@ class FinancialAnalyzer:
             print(f"Error processing table: {str(e)}")
             return {}
     def extract_metrics(self, income_data, balance_data):
         """Extract and calculate key financial metrics"""
         try:
-            # Get current and previous year values for growth calculations
             metrics = {
-            "Revenue": {
-                "2025": self.get_nested_value(income_data, "Revenue", "Total Net Revenue", "2025"),
-                "2024": self.get_nested_value(income_data, "Revenue", "Total Net Revenue", "2024"),
-                "2021": self.get_nested_value(income_data, "Revenue", "Total Net Revenue", "2021")
-            },
-            "Profitability": {
-                "Gross_Profit_2025": self.get_nested_value(income_data, "Cost and Gross Profit", "Gross Profit", "2025"),
-                "EBIT_2025": self.get_nested_value(income_data, "Profit Summary", "EBIT", "2025"),
-                "Net_Earnings_2025": self.get_nested_value(income_data, "Profit Summary", "Net Earnings", "2025"),
-                "Operating_Expenses_2025": self.get_nested_value(income_data, "Operating Expenses", "Total Operating Expenses", "2025")
-            },
-            "Balance_Sheet": {
-                "Total_Assets_2025": self.get_nested_value(balance_data, "Key Totals", "Total_Assets", "2025"),
-                "Current_Assets_2025": self.get_nested_value(balance_data, "Key Totals", "Total_Current_Assets", "2025"),
-                "Total_Liabilities_2025": self.get_nested_value(balance_data, "Key Totals", "Total_Liabilities", "2025"),
-                "Current_Liabilities_2025": self.get_nested_value(balance_data, "Key Totals", "Total_Current_Liabilities", "2025"),
-                "Equity_2025": self.get_nested_value(balance_data, "Key Totals", "Total_Shareholders_Equity", "2025"),
-                "Inventory_2025": self.get_nested_value(balance_data, "Balance Sheet Data 2021-2025", "Inventory", "2025"),
-                "Accounts_Receivable_2025": self.get_nested_value(balance_data, "Balance Sheet Data 2021-2025", "Accounts_Receivable", "2025"),
-                "Long_Term_Debt_2025": self.get_nested_value(balance_data, "Balance Sheet Data 2021-2025", "Long_Term_Debt", "2025")
-            },
-            "Cash_Flow": {
-                "Depreciation_2025": self.get_nested_value(income_data, "Operating Expenses", "Depreciation & Amortization", "2025"),
-                "Interest_Expense_2025": self.get_nested_value(income_data, "Profit Summary", "Interest Expense", "2025")
             }
-        }
-        # Calculate financial ratios
             revenue_2025 = metrics["Revenue"]["2025"]
             if revenue_2025 != 0:
-            # Profitability Ratios
                 metrics["Ratios"] = {
-                "Gross_Margin": (metrics["Profitability"]["Gross_Profit_2025"] / revenue_2025) * 100,
-                "Operating_Margin": (metrics["Profitability"]["EBIT_2025"] / revenue_2025) * 100,
-                "Net_Margin": (metrics["Profitability"]["Net_Earnings_2025"] / revenue_2025) * 100,
-                # Liquidity Ratios
-                "Current_Ratio": metrics["Balance_Sheet"]["Current_Assets_2025"] / metrics["Balance_Sheet"]["Current_Liabilities_2025"],
-                "Quick_Ratio": (metrics["Balance_Sheet"]["Current_Assets_2025"] - metrics["Balance_Sheet"]["Inventory_2025"]) / metrics["Balance_Sheet"]["Current_Liabilities_2025"],
-                # Efficiency Ratios
-                "Asset_Turnover": revenue_2025 / metrics["Balance_Sheet"]["Total_Assets_2025"],
-                "Receivables_Turnover": revenue_2025 / metrics["Balance_Sheet"]["Accounts_Receivable_2025"],
-                # Solvency Ratios
-                "Debt_to_Equity": metrics["Balance_Sheet"]["Total_Liabilities_2025"] / metrics["Balance_Sheet"]["Equity_2025"],
-                "Interest_Coverage": metrics["Profitability"]["EBIT_2025"] / metrics["Cash_Flow"]["Interest_Expense_2025"] if metrics["Cash_Flow"]["Interest_Expense_2025"] != 0 else 0,
-                # Growth Rates
-                "Revenue_Growth": ((metrics["Revenue"]["2025"] / metrics["Revenue"]["2024"]) - 1) * 100,
-                "5Year_Revenue_CAGR": ((metrics["Revenue"]["2025"] / metrics["Revenue"]["2021"]) ** (1/4) - 1) * 100
                 }
             return metrics
         except Exception as e:
             print(f"Error extracting metrics: {str(e)}")
             return {}
     def generate_analysis(self, prompt):
         """Generate analysis using TinyLlama"""
         try:
@@ -161,7 +210,7 @@ class FinancialAnalyzer:
             outputs = self.model.generate(
                 inputs["input_ids"],
-                max_new_tokens=800,  # Increased from 500 to 800 for more detailed analysis
                 temperature=0.7,
                 top_p=0.9,
                 do_sample=True,
@@ -170,7 +219,6 @@ class FinancialAnalyzer:
             )
             analysis = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
-            # Clean up the response
             analysis = analysis.split("<human>")[-1].strip()
             return analysis
         except Exception as e:
@@ -179,28 +227,20 @@ class FinancialAnalyzer:
     def analyze_financials(self, balance_sheet_file, income_stmt_file):
         """Main analysis function"""
         try:
-            # Validate files
             if not (self.is_valid_markdown(balance_sheet_file) and self.is_valid_markdown(income_stmt_file)):
                 return "Error: One or both files are invalid or not in Markdown format."
-            # Read files
             with open(balance_sheet_file, 'r') as f:
                 balance_sheet = f.read()
             with open(income_stmt_file, 'r') as f:
                 income_stmt = f.read()
-            # Parse financial data
             income_data = self.parse_financial_data(income_stmt)
             balance_data = self.parse_financial_data(balance_sheet)
-            # Extract key metrics
             metrics = self.extract_metrics(income_data, balance_data)
-            # Generate and get analysis
-            prompt = self.generate_analysis_prompt(metrics)
             analysis = self.generate_analysis(prompt)
-            # Prepare results
             results = {
                 "Financial Analysis": {
                     "Key Metrics": metrics,
@@ -233,4 +273,4 @@ def create_interface():
 if __name__ == "__main__":
     iface = create_interface()
-    iface.launch()

         """Clean and convert numerical values"""
         try:
             if isinstance(value, str):
                 value = value.replace('$', '').replace(',', '').strip()
                 if '(' in value and ')' in value:
                     value = '-' + value.replace('(', '').replace(')', '')
             return float(value or 0)
         try:
             with open(file_path, 'r') as f:
                 content = f.read()
             return any(line.startswith('#') or '|' in line for line in content.split('\n'))
         except:
             return False
                     current_table = []
                     headers = None
                 elif '|' in line:
+                    if '-|-' not in line:
                         row = [cell.strip() for cell in line.split('|')[1:-1]]
                         if not headers:
                             headers = row
                         else:
                             current_table.append(row)
             if current_table and headers:
                 data[current_section] = self.process_table(headers, current_table)
             print(f"Error processing table: {str(e)}")
             return {}
+    def get_nested_value(self, data, section, key, year):
+        """Safely get nested dictionary value"""
+        try:
+            return data.get(section, {}).get(key, {}).get(str(year), 0)
+        except:
+            return 0
     def extract_metrics(self, income_data, balance_data):
         """Extract and calculate key financial metrics"""
         try:
             metrics = {
+                "Revenue": {
+                    "2025": self.get_nested_value(income_data, "Revenue", "Total Net Revenue", "2025"),
+                    "2024": self.get_nested_value(income_data, "Revenue", "Total Net Revenue", "2024"),
+                    "2021": self.get_nested_value(income_data, "Revenue", "Total Net Revenue", "2021")
+                },
+                "Profitability": {
+                    "Gross_Profit_2025": self.get_nested_value(income_data, "Cost and Gross Profit", "Gross Profit", "2025"),
+                    "EBIT_2025": self.get_nested_value(income_data, "Profit Summary", "EBIT", "2025"),
+                    "Net_Earnings_2025": self.get_nested_value(income_data, "Profit Summary", "Net Earnings", "2025"),
+                    "Operating_Expenses_2025": self.get_nested_value(income_data, "Operating Expenses", "Total Operating Expenses", "2025")
+                },
+                "Balance_Sheet": {
+                    "Total_Assets_2025": self.get_nested_value(balance_data, "Key Totals", "Total_Assets", "2025"),
+                    "Current_Assets_2025": self.get_nested_value(balance_data, "Key Totals", "Total_Current_Assets", "2025"),
+                    "Total_Liabilities_2025": self.get_nested_value(balance_data, "Key Totals", "Total_Liabilities", "2025"),
+                    "Current_Liabilities_2025": self.get_nested_value(balance_data, "Key Totals", "Total_Current_Liabilities", "2025"),
+                    "Equity_2025": self.get_nested_value(balance_data, "Key Totals", "Total_Shareholders_Equity", "2025"),
+                    "Inventory_2025": self.get_nested_value(balance_data, "Balance Sheet Data 2021-2025", "Inventory", "2025"),
+                    "Accounts_Receivable_2025": self.get_nested_value(balance_data, "Balance Sheet Data 2021-2025", "Accounts_Receivable", "2025"),
+                    "Long_Term_Debt_2025": self.get_nested_value(balance_data, "Balance Sheet Data 2021-2025", "Long_Term_Debt", "2025")
+                },
+                "Cash_Flow": {
+                    "Depreciation_2025": self.get_nested_value(income_data, "Operating Expenses", "Depreciation & Amortization", "2025"),
+                    "Interest_Expense_2025": self.get_nested_value(income_data, "Profit Summary", "Interest Expense", "2025")
+                }
             }
             revenue_2025 = metrics["Revenue"]["2025"]
             if revenue_2025 != 0:
                 metrics["Ratios"] = {
+                    "Gross_Margin": (metrics["Profitability"]["Gross_Profit_2025"] / revenue_2025) * 100,
+                    "Operating_Margin": (metrics["Profitability"]["EBIT_2025"] / revenue_2025) * 100,
+                    "Net_Margin": (metrics["Profitability"]["Net_Earnings_2025"] / revenue_2025) * 100,
+                    "Current_Ratio": metrics["Balance_Sheet"]["Current_Assets_2025"] / metrics["Balance_Sheet"]["Current_Liabilities_2025"] if metrics["Balance_Sheet"]["Current_Liabilities_2025"] != 0 else 0,
+                    "Quick_Ratio": (metrics["Balance_Sheet"]["Current_Assets_2025"] - metrics["Balance_Sheet"]["Inventory_2025"]) / metrics["Balance_Sheet"]["Current_Liabilities_2025"] if metrics["Balance_Sheet"]["Current_Liabilities_2025"] != 0 else 0,
+                    "Asset_Turnover": revenue_2025 / metrics["Balance_Sheet"]["Total_Assets_2025"] if metrics["Balance_Sheet"]["Total_Assets_2025"] != 0 else 0,
+                    "Receivables_Turnover": revenue_2025 / metrics["Balance_Sheet"]["Accounts_Receivable_2025"] if metrics["Balance_Sheet"]["Accounts_Receivable_2025"] != 0 else 0,
+                    "Debt_to_Equity": metrics["Balance_Sheet"]["Total_Liabilities_2025"] / metrics["Balance_Sheet"]["Equity_2025"] if metrics["Balance_Sheet"]["Equity_2025"] != 0 else 0,
+                    "Interest_Coverage": metrics["Profitability"]["EBIT_2025"] / metrics["Cash_Flow"]["Interest_Expense_2025"] if metrics["Cash_Flow"]["Interest_Expense_2025"] != 0 else 0,
+                    "Revenue_Growth": ((metrics["Revenue"]["2025"] / metrics["Revenue"]["2024"]) - 1) * 100 if metrics["Revenue"]["2024"] != 0 else 0,
+                    "5Year_Revenue_CAGR": ((metrics["Revenue"]["2025"] / metrics["Revenue"]["2021"]) ** (1/4) - 1) * 100 if metrics["Revenue"]["2021"] != 0 else 0
                 }
             return metrics
         except Exception as e:
             print(f"Error extracting metrics: {str(e)}")
             return {}
+    def generate_prompt(self, metrics):
+        """Create analysis prompt from metrics"""
+        try:
+            return f"""<human>
+Please provide a comprehensive financial analysis for 2025 with detailed insights on:
+1. Revenue and Growth:
+   - Total Revenue: ${metrics['Revenue']['2025']:,.1f}M
+   - YoY Growth Rate: {metrics['Ratios'].get('Revenue_Growth', 0):,.1f}%
+   - 5-Year CAGR: {metrics['Ratios'].get('5Year_Revenue_CAGR', 0):,.1f}%
+2. Profitability Analysis:
+   - Gross Profit: ${metrics['Profitability']['Gross_Profit_2025']:,.1f}M
+   - EBIT: ${metrics['Profitability']['EBIT_2025']:,.1f}M
+   - Net Earnings: ${metrics['Profitability']['Net_Earnings_2025']:,.1f}M
+   - Margin Analysis:
+     * Gross Margin: {metrics['Ratios'].get('Gross_Margin', 0):,.1f}%
+     * Operating Margin: {metrics['Ratios'].get('Operating_Margin', 0):,.1f}%
+     * Net Margin: {metrics['Ratios'].get('Net_Margin', 0):,.1f}%
+3. Balance Sheet Strength:
+   - Total Assets: ${metrics['Balance_Sheet']['Total_Assets_2025']:,.1f}M
+   - Total Liabilities: ${metrics['Balance_Sheet']['Total_Liabilities_2025']:,.1f}M
+   - Shareholders' Equity: ${metrics['Balance_Sheet']['Equity_2025']:,.1f}M
+4. Key Financial Ratios:
+   - Liquidity:
+     * Current Ratio: {metrics['Ratios'].get('Current_Ratio', 0):,.2f}
+     * Quick Ratio: {metrics['Ratios'].get('Quick_Ratio', 0):,.2f}
+   - Efficiency:
+     * Asset Turnover: {metrics['Ratios'].get('Asset_Turnover', 0):,.2f}
+     * Receivables Turnover: {metrics['Ratios'].get('Receivables_Turnover', 0):,.2f}
+   - Solvency:
+     * Debt-to-Equity: {metrics['Ratios'].get('Debt_to_Equity', 0):,.2f}
+     * Interest Coverage: {metrics['Ratios'].get('Interest_Coverage', 0):,.2f}
+Please provide:
+1. An assessment of overall financial health and performance trends
+2. Key strengths and potential areas of concern
+3. Analysis of operational efficiency and working capital management
+4. Evaluation of capital structure and debt management
+5. Specific recommendations for:
+   - Improving operational efficiency
+   - Optimizing capital structure
+   - Enhancing shareholder value
+   - Managing key risks identified
+Include quantitative support for your analysis and recommendations.
+</human>"""
+        except Exception as e:
+            print(f"Error generating prompt: {str(e)}")
+            return ""
     def generate_analysis(self, prompt):
         """Generate analysis using TinyLlama"""
         try:
             outputs = self.model.generate(
                 inputs["input_ids"],
+                max_new_tokens=800,
                 temperature=0.7,
                 top_p=0.9,
                 do_sample=True,
             )
             analysis = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
             analysis = analysis.split("<human>")[-1].strip()
             return analysis
         except Exception as e:
     def analyze_financials(self, balance_sheet_file, income_stmt_file):
         """Main analysis function"""
         try:
             if not (self.is_valid_markdown(balance_sheet_file) and self.is_valid_markdown(income_stmt_file)):
                 return "Error: One or both files are invalid or not in Markdown format."
             with open(balance_sheet_file, 'r') as f:
                 balance_sheet = f.read()
             with open(income_stmt_file, 'r') as f:
                 income_stmt = f.read()
             income_data = self.parse_financial_data(income_stmt)
             balance_data = self.parse_financial_data(balance_sheet)
             metrics = self.extract_metrics(income_data, balance_data)
+            prompt = self.generate_prompt(metrics)
             analysis = self.generate_analysis(prompt)
             results = {
                 "Financial Analysis": {
                     "Key Metrics": metrics,
 if __name__ == "__main__":
     iface = create_interface()
+    iface.launch()