Spaces:

point9
/

finryver-dev

Sleeping

App Files Files Community

Sahil Garg committed on Sep 18, 2025

Commit

c00e175

1 Parent(s): 6611563

openrouter replaced by mistral

Browse files

Files changed (4) hide show

notes/llm_notes_generator.py +15 -17
notes/utils/__init__.py +0 -0
notes/utils/utils.py +0 -57
notes/utils/utils_normalize.py +0 -60

notes/llm_notes_generator.py CHANGED Viewed

@@ -34,8 +34,8 @@ logger = logging.getLogger(__name__)
 class Settings(BaseSettings):
 	"""Application settings loaded from environment variables or .env file."""
-	openrouter_api_key: str = os.getenv('OPENROUTER_API_KEY', '')
-	api_url: str = "https://openrouter.ai/api/v1/chat/completions"
 	output_dir: str = "data/generated_notes"
 	trial_balance_json: str = "data/output1/parsed_trial_balance.json"
@@ -61,22 +61,20 @@ class GeneratedNote(BaseModel):
 class FlexibleFinancialNoteGenerator:
     def __init__(self):
-        self.openrouter_api_key = settings.openrouter_api_key
-        if not self.openrouter_api_key:
-            logger.error("OPENROUTER_API_KEY not found in .env file")
-            raise ValueError("OPENROUTER_API_KEY not found in .env file")
         self.api_url = settings.api_url
         self.headers = {
-            "Authorization": f"Bearer {self.openrouter_api_key}",
-            "Content-Type": "application/json",
-            "HTTP-Referer": "https://localhost:3000",
-            "X-Title": "Financial Note Generator"
         }
         self.note_templates = self.load_note_templates()
         self.account_patterns = self._init_account_patterns()
         self.recommended_models = [
-            "mistralai/mixtral-8x7b-instruct",
-            "mistralai/mistral-7b-instruct-v0.2"
         ]
     def _init_account_patterns(self) -> Dict[str, Dict[str, Any]]:
@@ -340,8 +338,8 @@ class FlexibleFinancialNoteGenerator:
         return prompt
-    def call_openrouter_api(self, prompt: str) -> Optional[str]:
-        """Make API call to OpenRouter with model fallback"""
         for model in self.recommended_models:
             logger.info(f"Trying model: {model}")
             payload = {
@@ -359,7 +357,7 @@ class FlexibleFinancialNoteGenerator:
                     self.api_url,
                     headers=self.headers,
                     json=payload,
-                    timeout=30  # <-- Add timeout here!
                 )
                 response.raise_for_status()
                 result = response.json()
@@ -450,7 +448,7 @@ class FlexibleFinancialNoteGenerator:
             logger.error("Failed to build prompt")
             return False
-        response = self.call_openrouter_api(prompt)
         if not response:
             logger.error("Failed to get API response")
             return False
@@ -475,7 +473,7 @@ class FlexibleFinancialNoteGenerator:
             if not prompt:
                 results[note_number] = False
                 continue
-            response = self.call_openrouter_api(prompt)
             if not response:
                 results[note_number] = False
                 continue

 class Settings(BaseSettings):
 	"""Application settings loaded from environment variables or .env file."""
+	mistral_api_key: str = os.getenv('MISTRAL_API_KEY', '')
+	api_url: str = "https://api.mistral.ai/v1/chat/completions"
 	output_dir: str = "data/generated_notes"
 	trial_balance_json: str = "data/output1/parsed_trial_balance.json"
 class FlexibleFinancialNoteGenerator:
     def __init__(self):
+        self.mistral_api_key = settings.mistral_api_key
+        if not self.mistral_api_key:
+            logger.error("MISTRAL_API_KEY not found in .env file")
+            raise ValueError("MISTRAL_API_KEY not found in .env file")
         self.api_url = settings.api_url
         self.headers = {
+            "Authorization": f"Bearer {self.mistral_api_key}",
+            "Content-Type": "application/json"
         }
         self.note_templates = self.load_note_templates()
         self.account_patterns = self._init_account_patterns()
         self.recommended_models = [
+            "mistral-large-latest",
+            "mistral-medium-latest"
         ]
     def _init_account_patterns(self) -> Dict[str, Dict[str, Any]]:
         return prompt
+    def call_mistral_api(self, prompt: str) -> Optional[str]:
+        """Make API call to Mistral with model fallback"""
         for model in self.recommended_models:
             logger.info(f"Trying model: {model}")
             payload = {
                     self.api_url,
                     headers=self.headers,
                     json=payload,
+                    timeout=30
                 )
                 response.raise_for_status()
                 result = response.json()
             logger.error("Failed to build prompt")
             return False
+        response = self.call_mistral_api(prompt)
         if not response:
             logger.error("Failed to get API response")
             return False
             if not prompt:
                 results[note_number] = False
                 continue
+            response = self.call_mistral_api(prompt)
             if not response:
                 results[note_number] = False
                 continue

notes/utils/__init__.py DELETED Viewed

File without changes

notes/utils/utils.py DELETED Viewed

@@ -1,57 +0,0 @@
-import logging
-from typing import Any, Union
-# Configure logging
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-def clean_value(value: Union[str, float, int, None]) -> float:
-	"""
-	Clean and convert a value to float.
-	Removes commas from strings and strips whitespace.
-	Returns 0.0 if conversion fails.
-	"""
-	try:
-		if isinstance(value, str):
-			value = value.replace(',', '').strip()
-		return float(value) if value else 0.0
-	except (ValueError, TypeError):
-		logger.debug(f"Could not clean value: {value}")
-		return 0.0
-def to_lakhs(value: Union[float, int, str]) -> float:
-	"""
-	Convert a numeric value to lakhs (divide by 100,000 and round to 2 decimals).
-	Accepts int, float, or numeric string.
-	"""
-	try:
-		if isinstance(value, str):
-			value = float(value.replace(',', '').strip())
-		return round(float(value) / 100000, 2)
-	except (ValueError, TypeError):
-		logger.debug(f"Could not convert to lakhs: {value}")
-		return 0.0
-def convert_note_json_to_lakhs(note_json: Any) -> Any:
-	"""
-	Recursively convert all numeric values in a note JSON to lakhs.
-	Returns the converted object.
-	"""
-	def convert(obj: Any) -> Any:
-		if isinstance(obj, dict):
-			for k, v in obj.items():
-				if isinstance(v, (int, float)):
-					obj[k] = to_lakhs(v)
-				elif isinstance(v, str):
-					try:
-						obj[k] = to_lakhs(float(v.replace(',', '')))
-					except Exception:
-						obj[k] = v
-				else:
-					obj[k] = convert(v)
-		elif isinstance(obj, list):
-			for i in range(len(obj)):
-				obj[i] = convert(obj[i])
-		return obj
-	return convert(note_json)

notes/utils/utils_normalize.py DELETED Viewed

@@ -1,60 +0,0 @@
-import logging
-from typing import Any, Dict, List, Optional
-from pydantic import BaseModel, ValidationError
-# Configure logging
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-class NormalizedNote(BaseModel):
-	note_number: Optional[str]
-	note_title: Optional[str]
-	full_title: Optional[str]
-	table_data: List[Dict[str, Any]]
-	breakdown: Dict[str, Any] = {}
-	matched_accounts: List[Any] = []
-	total_amount: Optional[float] = None
-	total_amount_lakhs: Optional[float] = None
-	matched_accounts_count: Optional[int] = None
-	comparative_data: Dict[str, Any] = {}
-	notes_and_disclosures: List[str] = []
-	markdown_content: Optional[str] = ""
-def is_date_label(label: str) -> bool:
-	"""Check if a label is a date string."""
-	import re
-	return bool(re.match(r"^(March|April|May|June|July|August|September|October|November|December)\s+\d{1,2},\s+\d{4}$", label)) \
-		or bool(re.match(r"^\d{4}-\d{2}-\d{2}$", label))
-def normalize_llm_note_json(llm_json: Dict[str, Any]) -> Dict[str, Any]:
-	"""
-	Normalize a single LLM-generated note JSON to standard format.
-	Returns a dict compatible with NormalizedNote.
-	"""
-	note_number = llm_json.get("note_number") or llm_json.get("metadata", {}).get("note_number", "")
-	note_title = llm_json.get("note_title") or llm_json.get("title", "")
-	full_title = llm_json.get("full_title") or (f"{note_number}. {note_title}" if note_number else note_title)
-	table_data: List[Dict[str, Any]] = []
-	if "structure" in llm_json and llm_json["structure"]:
-		for item in llm_json["structure"]:
-			if "subcategories" in item and item["subcategories"]:
-				for sub in item["subcategories"]:
-					label = sub.get("label", "")
-					if not is_date_label(label):
-						row = {
-							"particulars": label,
-							"current_year": sub.get("value", ""),
-							"previous_year": sub.get("previous_value", "-"),
-						}
-						table_data.append(row)
-			if "category" in item and ("total" in item or "previous_total" in item):
-				row = {
-					"particulars": f"Total {item.get('category', '')}",
-					"current_year": item.get("total", ""),
-					"previous_year": item.get("previous_total", "-"),
-				}
-				table_data.append(row)
-	# Optionally, add a header row