danulr05 committed on
Commit
af234c7
·
verified ·
1 Parent(s): 6f7b77d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -334,7 +334,8 @@ def search_budget_proposals(query: str) -> str:
334
  if not language_specific_matches:
335
  language_specific_matches = matches[:3]
336
  else:
337
- language_specific_matches = language_specific_matches[:3] # Limit to top 3
 
338
 
339
  logger.info(f"Using {len(language_specific_matches)} language-specific matches for {detected_language}")
340
 
@@ -706,9 +707,9 @@ def get_document_language(filename: str) -> str:
706
  """Determine the language of a document from its filename"""
707
  filename_lower = filename.lower()
708
 
709
- if '_sin_' in filename_lower or '_sinhala_' in filename_lower:
710
  return 'si'
711
- elif '_tam_' in filename_lower or '_tamil_' in filename_lower:
712
  return 'ta'
713
  elif '_raj_' in filename_lower:
714
  return 'en' # Treat Raj as English/default
 
334
  if not language_specific_matches:
335
  language_specific_matches = matches[:3]
336
  else:
337
+ # Prioritize by relevance - take only the first (most relevant) language-specific match
338
+ language_specific_matches = language_specific_matches[:1]
339
 
340
  logger.info(f"Using {len(language_specific_matches)} language-specific matches for {detected_language}")
341
 
 
707
  """Determine the language of a document from its filename"""
708
  filename_lower = filename.lower()
709
 
710
+ if any(indicator in filename_lower for indicator in ['_sin_', '-sin', 'sinhala', 'si/', '- sinhala']):
711
  return 'si'
712
+ elif any(indicator in filename_lower for indicator in ['_tam_', '-tam', 'tamil', 'ta/']):
713
  return 'ta'
714
  elif '_raj_' in filename_lower:
715
  return 'en' # Treat Raj as English/default