AnilNiraula committed (verified)
Commit: f7cc8c3 · 1 Parent(s): 948f3a8

Update app.py

Files changed (1):
  1. app.py (+312 -1)
app.py CHANGED
@@ -192,4 +192,315 @@ try:
     logger.info(f"Successfully loaded model: {model_name}")
 except Exception as e:
     logger.error(f"Error loading model/tokenizer: {e}")
-    raise RuntimeError(f"Failed
+    raise RuntimeError(f"Failed to load model: {str(e)}")
+
+# Prompt prefix
+prompt_prefix = (
+    "You are FinChat, a financial advisor with expertise in stock market performance. Provide detailed, numbered list advice with clear reasoning for investing prompts, "
+    "including precise historical data when relevant (e.g., TSLA or S&P 500 returns for specific years or periods). For investment return queries, use compound interest calculations "
+    "based on historical averages. Avoid repetition and incomplete answers. Explain why each step or choice is beneficial.\n\n"
+    "Example 1:\n"
+    "Q: What is the S&P 500’s average annual return?\n"
+    "A: The S&P 500’s average annual return is ~10–12% over the long term (1927–2025), including dividends.\n"
+    "1. This reflects historical data adjusted for inflation and dividends.\n"
+    "2. Returns vary yearly (e.g., 16.3% in 2020) due to market conditions.\n"
+    "3. ETFs like SPY track this index for broad market exposure.\n\n"
+    "Example 2:\n"
+    "Q: What will $5,000 be worth in 10 years if invested in TSLA?\n"
+    "A: Assuming a 10% average annual return, a $5,000 investment in TSLA would grow to approximately $12,969 in 10 years with annual compounding.\n"
+    "1. This uses the historical average return of 10–12% for stocks.\n"
+    "2. Future returns vary and are not guaranteed.\n\n"
+    "Example 3:\n"
+    "Q: What was the average annual return of MSFT between 2010 and 2020?\n"
+    "A: The MSFT average annual return from 2010 to 2020 was approximately 16.8%, including dividends.\n"
+    "1. This period includes strong growth in tech stocks.\n"
+    "2. Dividends contribute significantly to total returns.\n\n"
+    "Q: "
+)
+prefix_tokens = tokenizer(prompt_prefix, return_tensors="pt", truncation=True, max_length=512).to(device)
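+# NOTE: prefix_tokens is precomputed here but does not appear to be reused in this hunk;
+# chat_with_model re-tokenizes the full prompt on each call.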
+
+# Substring matching for cache
+def get_closest_cache_key(message, cache_keys):
+    message = message.lower().strip()
+    matches = difflib.get_close_matches(message, cache_keys, n=1, cutoff=0.8)
+    return matches[0] if matches else None
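+# difflib.get_close_matches ranks candidates with SequenceMatcher ratios; cutoff=0.8 means
+# only near-identical phrasings reuse a cached answer.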
+
+# Parse period from user input
+def parse_period(query):
+    query = query.lower()
+    # Match symbol (TSLA, MSFT, NVDA, GOOG, AMZN, S&P 500)
+    symbol_match = re.search(r'(tsla|msft|nvda|goog|amzn|s&p\s*500)', query)
+    symbol = symbol_match.group(1).upper() if symbol_match else "SPY"
+    if symbol.startswith("S&P"):
+        symbol = "SPY"
+    # Match specific year ranges
+    match = re.search(r'(?:between|from)\s*(\d{4})\s*(?:and|to|-|–)\s*(\d{4})', query)
+    if match:
+        start_year, end_year = map(int, match.groups())
+        if start_year <= end_year:
+            return start_year, end_year, None, symbol
+    # Match duration-based queries
+    match = re.search(r'(\d+)-year.*from\s*(\d{4})', query)
+    if match:
+        duration, start_year = map(int, match.groups())
+        end_year = start_year + duration - 1
+        return start_year, end_year, duration, symbol
+    # Match past X years
+    match = re.search(r'(?:past\s*(\d+)-year|\b(\d+)-year.*(?:return|growth\s*rate))', query)
+    if match:
+        duration = int(match.group(1) or match.group(2))
+        max_year = df_yearly['Year'].max() if df_yearly is not None else 2025
+        start_year = max_year - duration + 1
+        end_year = max_year
+        return start_year, end_year, duration, symbol
+    # Match single year
+    match = re.search(r'return\s*(?:in|for)\s*(\d{4})', query)
+    if match:
+        year = int(match.group(1))
+        return year, year, 1, symbol
+    return None, None, None, symbol
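+# Example (illustrative): parse_period("average annual return of msft between 2010 and 2020")
+#   -> (2010, 2020, None, "MSFT")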
+
+# Calculate average growth rate
+def calculate_growth_rate(start_year, end_year, duration=None, symbol="SPY"):
+    if df_yearly is None or start_year is None or end_year is None:
+        return None, "Data not available or invalid period."
+    df_period = df_yearly[(df_yearly['Year'] >= start_year) & (df_yearly['Year'] <= end_year)]
+    if df_period.empty:
+        return None, f"No data available for {symbol} from {start_year} to {end_year}."
+    avg_return = df_period[f"Return_{symbol}"].mean()
+    if np.isnan(avg_return):
+        return None, f"Insufficient data for {symbol} from {start_year} to {end_year}."
+    symbol_name = "S&P 500" if symbol == "SPY" else symbol
+    if duration == 1 and start_year == end_year:
+        response = f"The {symbol_name} returned approximately {avg_return:.1f}% in {start_year}, including dividends."
+    elif duration:
+        response = f"The {symbol_name} {duration}-year average annual return from {start_year} to {end_year} was approximately {avg_return:.1f}%, including dividends."
+    else:
+        response = f"The {symbol_name} average annual return from {start_year} to {end_year} was approximately {avg_return:.1f}%, including dividends."
+    return avg_return, response
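+# Assumes df_yearly (loaded earlier in app.py) has a 'Year' column plus per-symbol
+# 'Return_<SYMBOL>' columns expressed in percent.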
+
+# Parse investment return query
+def parse_investment_query(query):
+    # Allow thousands separators such as "$5,000"
+    match = re.search(r'\$([\d,]+).*\s(\d+)\s*years?.*\b(tsla|msft|nvda|goog|amzn|s&p\s*500)\b', query, re.IGNORECASE)
+    if match:
+        amount = float(match.group(1).replace(",", ""))
+        years = int(match.group(2))
+        symbol = match.group(3).upper()
+        if symbol.startswith("S&P"):
+            symbol = "SPY"
+        return amount, years, symbol
+    return None, None, None
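+# Example (illustrative): parse_investment_query("What will $5,000 be worth in 10 years if invested in TSLA?")
+#   -> (5000.0, 10, "TSLA")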
+
+# Calculate future value
+def calculate_future_value(amount, years, symbol):
+    if df_yearly is None or amount is None or years is None:
+        return None, "Data not available or invalid input."
+    avg_annual_return = 10.0
+    future_value = amount * (1 + avg_annual_return / 100) ** years
+    symbol_name = "S&P 500" if symbol == "SPY" else symbol
+    return future_value, (
+        f"Assuming a 10% average annual return, a ${amount:,.0f} investment in {symbol_name} would grow to approximately ${future_value:,.0f} "
+        f"in {years} years with annual compounding. This is based on the historical average return of 10–12% for stocks. "
+        "Future returns vary and are not guaranteed. Consult a financial planner."
+    )
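+# Compound interest: FV = P * (1 + r) ** n with r fixed at 10%,
+# e.g., $5,000 over 10 years -> 5000 * 1.1 ** 10 ≈ $12,969.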
+
+# Chat function
+def chat_with_model(user_input, history=None, is_processing=False):
+    try:
+        start_time = time.time()
+        logger.info(f"Processing user input: {user_input}")
+        is_processing = True
+        logger.info("Showing loading animation")
+
+        # Normalize and check cache
+        cache_key = user_input.lower().strip()
+        cache_keys = list(response_cache.keys())
+        closest_key = cache_key if cache_key in response_cache else get_closest_cache_key(cache_key, cache_keys)
+        if closest_key:
+            logger.info(f"Cache hit for: {closest_key}")
+            response = response_cache[closest_key]
+            logger.info(f"Chatbot response: {response}")
+            history = history or []
+            history.append({"role": "user", "content": user_input})
+            history.append({"role": "assistant", "content": response})
+            end_time = time.time()
+            logger.info(f"Response time: {end_time - start_time:.2f} seconds")
+            return response, history, False, ""
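+        # The four return values map to (assistant response, chat history, is_processing flag, cleared textbox value).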
+
+        # Check for investment return query
+        amount, years, symbol = parse_investment_query(user_input)
+        if amount and years:
+            future_value, response = calculate_future_value(amount, years, symbol)
+            if future_value is not None:
+                response_cache[cache_key] = response
+                logger.info(f"Investment query: ${amount} for {years} years in {symbol}, added to cache")
+                logger.info(f"Chatbot response: {response}")
+                history = history or []
+                history.append({"role": "user", "content": user_input})
+                history.append({"role": "assistant", "content": response})
+                end_time = time.time()
+                logger.info(f"Response time: {end_time - start_time:.2f} seconds")
+                return response, history, False, ""
+
+        # Check for period-specific query
+        start_year, end_year, duration, symbol = parse_period(user_input)
+        if start_year and end_year:
+            avg_return, response = calculate_growth_rate(start_year, end_year, duration, symbol)
+            if avg_return is not None:
+                response_cache[cache_key] = response
+                logger.info(f"Dynamic period query for {symbol}: {start_year}–{end_year}, added to cache")
+                logger.info(f"Chatbot response: {response}")
+                history = history or []
+                history.append({"role": "user", "content": user_input})
+                history.append({"role": "assistant", "content": response})
+                end_time = time.time()
+                logger.info(f"Response time: {end_time - start_time:.2f} seconds")
+                return response, history, False, ""
+
+        # Handle short prompts
+        if len(user_input.strip()) <= 5:
+            logger.info("Short prompt, returning default response")
+            response = "Hello! I'm FinChat, your financial advisor. Ask about investing in TSLA, MSFT, NVDA, GOOG, AMZN, or S&P 500!"
+            logger.info(f"Chatbot response: {response}")
+            history = history or []
+            history.append({"role": "user", "content": user_input})
+            history.append({"role": "assistant", "content": response})
+            end_time = time.time()
+            logger.info(f"Response time: {end_time - start_time:.2f} seconds")
+            return response, history, False, ""
+
+        # Construct and generate response
+        full_prompt = prompt_prefix + user_input + "\nA:"
+        try:
+            inputs = tokenizer(full_prompt, return_tensors="pt", truncation=True, max_length=512).to(device)
+        except Exception as e:
+            logger.error(f"Error tokenizing input: {e}")
+            response = f"Error: Failed to process input: {str(e)}"
+            logger.info(f"Chatbot response: {response}")
+            history = history or []
+            history.append({"role": "user", "content": user_input})
+            history.append({"role": "assistant", "content": response})
+            end_time = time.time()
+            logger.info(f"Response time: {end_time - start_time:.2f} seconds")
+            return response, history, False, ""
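+        # NOTE: truncation to 512 tokens can clip long user questions, since the few-shot prefix is part of full_prompt.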
+
+        with torch.inference_mode():
+            logger.info("Generating response with model")
+            gen_start_time = time.time()
+            outputs = model.generate(
+                **inputs,
+                max_new_tokens=40,
+                min_length=20,
+                do_sample=False,
+                repetition_penalty=2.0,
+                pad_token_id=tokenizer.eos_token_id
+            )
+            gen_end_time = time.time()
+            logger.info(f"Generation time: {gen_end_time - gen_start_time:.2f} seconds")
+        response = tokenizer.decode(outputs[0], skip_special_tokens=True)
+        response = response[len(full_prompt):].strip() if response.startswith(full_prompt) else response
+        logger.info(f"Chatbot response: {response}")
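+        # Greedy decoding (do_sample=False) with repetition_penalty=2.0 keeps answers deterministic;
+        # decode() returns prompt + continuation, so the prefix is stripped when present.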
+
+        # Update cache
+        response_cache[cache_key] = response
+        logger.info("Cache miss, added to in-memory cache")
+
+        # Update history
+        history = history or []
+        history.append({"role": "user", "content": user_input})
+        history.append({"role": "assistant", "content": response})
+        torch.cuda.empty_cache()
+        end_time = time.time()
+        logger.info(f"Response time: {end_time - start_time:.2f} seconds")
+        return response, history, False, ""
+
+    except Exception as e:
+        logger.error(f"Error generating response: {e}")
+        response = f"Error: {str(e)}"
+        logger.info(f"Chatbot response: {response}")
+        history = history or []
+        history.append({"role": "user", "content": user_input})
+        history.append({"role": "assistant", "content": response})
+        end_time = time.time()
+        logger.info(f"Response time: {end_time - start_time:.2f} seconds")
+        return response, history, False, ""
+
+# Save cache
+def save_cache():
+    try:
+        with open(cache_file, 'w') as f:
+            json.dump(response_cache, f, indent=2)
+        logger.info("Saved cache to cache.json")
+    except Exception as e:
+        logger.warning(f"Failed to save cache.json: {e}")
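+# cache_file and response_cache are assumed to be defined earlier in app.py, outside this hunk.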
+
+# Gradio interface
+logger.info("Initializing Gradio interface")
+try:
+    with gr.Blocks(
+        title="FinChat: An LLM based on the distilgpt2 model",
+        css="""
+        .loader {
+            border: 5px solid #f3f3f3;
+            border-top: 5px solid #3498db;
+            border-radius: 50%;
+            width: 30px;
+            height: 30px;
+            animation: spin 1s linear infinite;
+            margin: 10px auto;
+            display: block;
+        }
+        @keyframes spin {
+            0% { transform: rotate(0deg); }
+            100% { transform: rotate(360deg); }
+        }
+        .hidden { display: none; }
+        """
+    ) as interface:
+        gr.Markdown(
+            """
+            # FinChat: An LLM based on the distilgpt2 model
+            FinChat provides financial advice using the lightweight distilgpt2 model, optimized for fast, detailed responses.
+            Ask about investing strategies, ETFs, or stocks like TSLA, MSFT, NVDA, GOOG, AMZN, or S&P 500 to get started!
+            """
+        )
+        chatbot = gr.Chatbot(type="messages")
+        msg = gr.Textbox(label="Your message")
+        submit = gr.Button("Send")
+        clear = gr.Button("Clear")
+        loading = gr.HTML('<div class="loader hidden"></div>', label="Loading")
+        is_processing = gr.State(value=False)
+
+        def submit_message(user_input, history, is_processing):
+            response, updated_history, new_processing, clear_input = chat_with_model(user_input, history, is_processing)
+            loader_html = '<div class="loader"></div>' if new_processing else '<div class="loader hidden"></div>'
+            return clear_input, updated_history, loader_html, new_processing
+
+        submit.click(
+            fn=submit_message,
+            inputs=[msg, chatbot, is_processing],
+            outputs=[msg, chatbot, loading, is_processing]
+        )
+        clear.click(
+            fn=lambda: ("", [], '<div class="loader hidden"></div>', False),
+            outputs=[msg, chatbot, loading, is_processing]
+        )
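+        # Output order matters: submit_message returns (textbox value, chat history, loader HTML, processing flag)
+        # to match outputs=[msg, chatbot, loading, is_processing].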
+    logger.info("Gradio interface initialized successfully")
+except Exception as e:
+    logger.error(f"Error initializing Gradio interface: {e}")
+    raise
+
+# Launch interface
+if __name__ == "__main__" and not os.getenv("HF_SPACE"):
+    logger.info("Launching Gradio interface locally")
+    try:
+        interface.launch(share=False, debug=True)
+    except Exception as e:
+        logger.error(f"Error launching interface: {e}")
+        raise
+    finally:
+        save_cache()
+else:
+    logger.info("Running in Hugging Face Spaces, interface defined but not launched")
+    import atexit
+    atexit.register(save_cache)
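+    # atexit.register ensures save_cache runs when the interpreter exits; the HF_SPACE environment
+    # variable is presumably set in the Spaces runtime so this branch is taken there.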