LexGuard MCP

lexguard-mcp
src
services

smart_search_service.py•60.1 KiB

""" Smart Search Service - 사용자 질문을 분석하여 적절한 API를 자동 선택 """ import re from datetime import datetime, timedelta from typing import Optional, Dict, List, Tuple from .api_router import APIRouter, DomainType, APICategory from ..repositories.law_repository import LawRepository from ..repositories.law_detail import LawDetailRepository from ..repositories.precedent_repository import PrecedentRepository from ..repositories.law_interpretation_repository import LawInterpretationRepository from ..repositories.administrative_appeal_repository import AdministrativeAppealRepository from ..repositories.constitutional_decision_repository import ConstitutionalDecisionRepository from ..repositories.committee_decision_repository import CommitteeDecisionRepository from ..repositories.special_administrative_appeal_repository import SpecialAdministrativeAppealRepository from ..repositories.local_ordinance_repository import LocalOrdinanceRepository from ..repositories.administrative_rule_repository import AdministrativeRuleRepository from ..repositories.law_comparison_repository import LawComparisonRepository class SmartSearchService: """ 사용자 질문을 분석하여 적절한 법적 정보 소스를 자동으로 선택하는 서비스 LLM이 사용자 질문을 받으면: 1. 질문 의도 분석 (법령, 판례, 법령해석, 행정심판 등) 2. 적절한 검색 타입 선택 3. 파라미터 자동 추출 4. 통합 검색 실행 """ def __init__(self): self.law_search_repo = LawRepository() self.law_detail_repo = LawDetailRepository() self.precedent_repo = PrecedentRepository() self.interpretation_repo = LawInterpretationRepository() self.appeal_repo = AdministrativeAppealRepository() self.constitutional_repo = ConstitutionalDecisionRepository() self.committee_repo = CommitteeDecisionRepository() self.special_appeal_repo = SpecialAdministrativeAppealRepository() self.ordinance_repo = LocalOrdinanceRepository() self.rule_repo = AdministrativeRuleRepository() self.comparison_repo = LawComparisonRepository() # 완벽한 API 라우터 (172개 API 관리) self.api_router = APIRouter() # 의도 분류 키워드 (세분화됨) self.intent_keywords = { "law": { "keywords": ["법령", "법", "조문", "조항", "법률", "시행령", "시행규칙", "법 제", "법률 제"], "patterns": [r"법\s*제?\s*\d+조", r"법령\s*제?\s*\d+조", r"\w+법\s*제?\s*\d+조"] }, "precedent": { "keywords": ["판례", "대법원", "판결", "선고", "사건", "재판", "법원", "관련 판례", "관련사례"], "patterns": [r"판례", r"대법원\s*\d+", r"사건번호", r"관련\s*판례", r"관련\s*사례"] }, # 노동 세분화 "labor_worker_status": { "keywords": ["근로자성", "사용종속", "지휘감독", "위장도급", "프리랜서", "근로자 인정", "4대보험", "근로자 판단"], "patterns": [r"근로자성", r"위장도급", r"사용종속", r"프리랜서.*근로자"] }, "labor_termination": { "keywords": ["해고", "부당해고", "정리해고", "계약해지", "해고 사유", "일방적 해지"], "patterns": [r"부당해고", r"해고.*사유", r"계약.*해지"] }, "labor_wage": { "keywords": ["임금", "퇴직금", "체불", "임금체불", "보수", "급여", "미지급", "연장근로수당"], "patterns": [r"임금체불", r"퇴직금.*계산", r"급여.*미지급"] }, "interpretation": { "keywords": ["법령해석", "해석", "의견", "해석례", "법제처", "부처 해석"], "patterns": [r"법령해석", r"해석\s*의견"] }, "administrative_appeal": { "keywords": ["행정심판", "심판", "재결", "행정심판위원회"], "patterns": [r"행정심판", r"재결례"] }, "constitutional": { "keywords": ["헌법재판소", "헌재", "위헌", "헌법", "헌법재판"], "patterns": [r"헌법재판소", r"헌재", r"위헌"] }, "committee": { "keywords": ["위원회", "결정문", "개인정보보호위원회", "금융위원회", "노동위원회"], "patterns": [r"\w+위원회", r"결정문"] }, "special_appeal": { "keywords": ["조세심판원", "해양안전심판원", "특별행정심판"], "patterns": [r"조세심판원", r"해양안전심판원", r"특별행정심판"] }, "ordinance": { "keywords": ["조례", "규칙", "지방자치", "시조례", "도조례"], "patterns": [r"\w+조례", r"지방자치"] }, "rule": { "keywords": ["행정규칙", "훈령", "예규", "고시"], "patterns": [r"행정규칙", r"훈령", r"예규"] }, "comparison": { "keywords": ["비교", "신구법", "연혁", "변경", "개정"], "patterns": [r"신구법", r"연혁", r"비교"] } } def analyze_intent(self, query: str) -> List[Tuple[str, float]]: """ 사용자 질문의 의도를 분석하여 검색 타입과 신뢰도를 반환 Returns: [(search_type, confidence), ...] - 신뢰도 순으로 정렬 """ query_lower = query.lower() scores = {} for search_type, config in self.intent_keywords.items(): score = 0.0 # 키워드 매칭 for keyword in config["keywords"]: if keyword in query_lower: score += 1.0 # 패턴 매칭 for pattern in config.get("patterns", []): if re.search(pattern, query, re.IGNORECASE): score += 2.0 # 패턴 매칭이 더 높은 가중치 if score > 0: scores[search_type] = score # 신뢰도 순으로 정렬 sorted_scores = sorted(scores.items(), key=lambda x: x[1], reverse=True) # 신뢰도를 0-1 범위로 정규화 if sorted_scores: max_score = sorted_scores[0][1] normalized = [(st, min(score / max_score, 1.0)) for st, score in sorted_scores] # 여러 의도 동시 감지: 신뢰도 0.5 이상인 모든 의도 반환 # 예: "형법 제250조와 관련 판례" → ["law", "precedent"] high_confidence = [(st, conf) for st, conf in normalized if conf >= 0.5] if len(high_confidence) > 1: # 여러 의도가 감지되면 모두 반환 return high_confidence elif high_confidence: # 단일 의도지만 신뢰도가 높으면 반환 return high_confidence else: # 신뢰도가 낮으면 최상위 1개만 반환 return normalized[:1] # 기본값: 법령 검색 return [("law", 0.5)] def parse_time_condition(self, query: str) -> Optional[Dict[str, str]]: """ 질문에서 시간 조건을 파싱하여 date_from, date_to 반환 Examples: "최근 5년 판례" → {"date_from": "20210115", "date_to": "20260115"} "2023년 이후 판례" → {"date_from": "20230101", "date_to": "20260115"} "2020년부터 2023년까지" → {"date_from": "20200101", "date_to": "20231231"} "예전 판례와 요즘 판례" → {"date_from": "20210115", "date_to": "20260115"} Returns: {"date_from": "YYYYMMDD", "date_to": "YYYYMMDD"} or None """ today = datetime.now() time_filter = None # 패턴 1: "최근 N년" match = re.search(r"최근\s*(\d+)\s*년", query) if match: years = int(match.group(1)) date_from = (today - timedelta(days=years*365)).strftime("%Y%m%d") date_to = today.strftime("%Y%m%d") return {"date_from": date_from, "date_to": date_to} # 패턴 2: "YYYY년 이후" match = re.search(r"(\d{4})\s*년\s*이후", query) if match: year = int(match.group(1)) date_from = f"{year}0101" date_to = today.strftime("%Y%m%d") return {"date_from": date_from, "date_to": date_to} # 패턴 3: "YYYY년부터 YYYY년까지" match = re.search(r"(\d{4})\s*년\s*부터\s*(\d{4})\s*년\s*까지", query) if match: year_from = int(match.group(1)) year_to = int(match.group(2)) date_from = f"{year_from}0101" date_to = f"{year_to}1231" return {"date_from": date_from, "date_to": date_to} # 패턴 4: "예전/과거" vs "요즘/최근" (기본 5년) if re.search(r"예전.*요즘|과거.*최근|예전.*최근", query): date_from = (today - timedelta(days=5*365)).strftime("%Y%m%d") date_to = today.strftime("%Y%m%d") return {"date_from": date_from, "date_to": date_to} # 패턴 5: "최신", "요즘" (3년) if re.search(r"최신|요즘|근래", query): date_from = (today - timedelta(days=3*365)).strftime("%Y%m%d") date_to = today.strftime("%Y%m%d") return {"date_from": date_from, "date_to": date_to} return None def plan_queries(self, query: str, intent: str) -> List[str]: """ Intent별로 다단계 검색 쿼리 생성 Args: query: 원본 질문 intent: analyze_intent에서 분류된 intent Returns: 검색 쿼리 리스트 (넓게 → 좁게) """ # 노동-근로자성/위장도급 if intent == "labor_worker_status": base_keywords = ["근로자성", "사용종속관계", "프리랜서"] if "프리랜서" in query or "용역" in query: return [ "근로자성 판단 기준", "사용종속관계", "프리랜서 근로자 인정 판례", "위장도급 판단 기준" ] else: return [ "근로자성", "사용종속관계 판례", "지휘감독 근로자성" ] # 노동-해고/해지 elif intent == "labor_termination": return [ "부당해고", "정당한 해고 사유", "해고 절차 위반", "계약해지 손해배상" ] # 노동-임금/퇴직금 elif intent == "labor_wage": if "퇴직금" in query: return [ "퇴직금 계산", "퇴직금 지급 기준", "근속연수 퇴직금" ] elif "체불" in query or "미지급" in query: return [ "임금체불", "임금 미지급 신고", "지연이자 임금" ] else: return [ "임금", "통상임금", "임금 전액지급 원칙" ] # 기본값: 원본 query return [query] async def comprehensive_search_v2( self, query: str, max_results_per_type: int = 3, arguments: Optional[dict] = None, document_text: Optional[str] = None ) -> Dict: """ 완벽한 다단계 검색 파이프라인 (v2) - API Router 기반으로 172개 API 활용 - 도메인 감지 → Intent 분류 → API 순서 계획 → 다단계 검색 Args: query: 사용자 질문 max_results_per_type: 타입당 최대 결과 수 arguments: 추가 인자 document_text: 문서 전문 (옵션) Returns: 통합 검색 결과 (모든 API 결과 포함) """ import asyncio import logging logger = logging.getLogger("lexguard-mcp") start_time = datetime.now() # 1단계: 도메인 감지 domain = self.api_router.detect_domain(query, document_text) logger.info(f"Domain detected | domain={domain.value} query={query[:50]}") # 2단계: Intent 분류 intent_results = self.analyze_intent(query) primary_intent = intent_results[0][0] if intent_results else "general" logger.info(f"Intent analyzed | intent={primary_intent}") # 3단계: 시간 조건 파싱 time_condition = self.parse_time_condition(query) # 4단계: API 호출 순서 계획 api_sequence = self.api_router.plan_api_sequence(query, domain, primary_intent, document_text) logger.info(f"API sequence planned | steps={len(api_sequence)}") # 5단계: 다단계 검색 실행 all_results = {} sources_count = {} for i, (api_category, params) in enumerate(api_sequence[:5], 1): # 최대 5단계 try: if api_category == APICategory.LAW: target_laws = params.get("target_laws", []) if target_laws: for law_name in target_laws[:2]: result = await asyncio.to_thread( self.law_detail_repo.get_law, None, law_name, "detail", None, None, None, None, arguments ) if result and not result.get("error"): all_results.setdefault("laws", []).append(result) else: result = await asyncio.to_thread( self.law_search_repo.search_law, query, 1, max_results_per_type, arguments ) if result and result.get("laws"): all_results["laws"] = result["laws"] sources_count["law"] = len(all_results.get("laws", [])) elif api_category == APICategory.PRECEDENT: result = await asyncio.to_thread( self.precedent_repo.search_precedent, query, 1, max_results_per_type, time_condition.get("date_from") if time_condition else None, time_condition.get("date_to") if time_condition else None, None, arguments ) if result and result.get("precedents"): all_results["precedents"] = result["precedents"] sources_count["precedent"] = len(result["precedents"]) except Exception as e: logger.error(f"API call failed | category={api_category.value} error={e}") continue # 6단계: 결과 통합 total_sources = sum(sources_count.values()) has_legal_basis = total_sources > 0 elapsed = (datetime.now() - start_time).total_seconds() return { "success": True, "success_transport": True, "success_search": has_legal_basis, "has_legal_basis": has_legal_basis, "query": query, "domain": domain.value, "detected_intent": primary_intent, "results": all_results, "sources_count": sources_count, "total_sources": total_sources, "missing_reason": None if has_legal_basis else "NO_MATCH", "elapsed_seconds": elapsed, "pipeline_version": "v2_complete_coverage" } def extract_parameters(self, query: str, search_type: str) -> Dict: """ 질문에서 검색 파라미터를 자동 추출 Args: query: 사용자 질문 search_type: 검색 타입 Returns: 추출된 파라미터 딕셔너리 """ params = {"query": query} # 법령명 추출 (예: "형법", "민법", "개인정보보호법") law_name_pattern = r"([가-힣]+법)" law_matches = re.findall(law_name_pattern, query) if law_matches: params["law_name"] = law_matches[0] # 조문 번호 추출 (예: "제250조", "250조") article_pattern = r"제?\s*(\d+)\s*조" article_matches = re.findall(article_pattern, query) if article_matches: # 정규화 유틸리티 사용 from ..utils.parameter_normalizer import normalize_article_number params["article_number"] = normalize_article_number(article_matches[0]) # 항(項) 번호 추출 (예: "제1항", "1항", "첫 번째 항") hang_patterns = [ r"제?\s*(\d+)\s*항", # "제1항", "1항" r"(\d+)\s*번째\s*항", # "첫 번째 항" (숫자만) r"제?\s*(\d+)\s*번\s*항", # "제1번 항" ] for pattern in hang_patterns: hang_matches = re.findall(pattern, query) if hang_matches: from ..utils.parameter_normalizer import normalize_hang params["hang"] = normalize_hang(hang_matches[0]) break # 호(號) 번호 추출 (예: "제2호", "2호", "둘째 호") ho_patterns = [ r"제?\s*(\d+)\s*호", # "제2호", "2호" r"(\d+)\s*번째\s*호", # "둘째 호" (숫자만) r"제?\s*(\d+)\s*번\s*호", # "제2번 호" ] for pattern in ho_patterns: ho_matches = re.findall(pattern, query) if ho_matches: from ..utils.parameter_normalizer import normalize_ho params["ho"] = normalize_ho(ho_matches[0]) break # 목(目) 문자 추출 (예: "가목", "나목", "다목") mok_pattern = r"([가-힣])\s*목" mok_matches = re.findall(mok_pattern, query) if mok_matches: from ..utils.parameter_normalizer import normalize_mok params["mok"] = normalize_mok(mok_matches[0] + "목") # 비교 타입 추출 (법령 비교용) if search_type == "comparison": if "연혁" in query or "변경사항" in query or "개정" in query: params["compare_type"] = "연혁" elif "3단" in query or "세단계" in query: params["compare_type"] = "3단비교" else: params["compare_type"] = "신구법" # 기본값 # 날짜 추출 (예: "2023년", "2023.01.01") date_pattern = r"(\d{4})[년\.]?\s*(\d{1,2})[월\.]?\s*(\d{1,2})[일]?" date_matches = re.findall(date_pattern, query) if date_matches: year, month, day = date_matches[0] params["date"] = f"{year}{month.zfill(2)}{day.zfill(2)}" if day else f"{year}{month.zfill(2)}01" # 기관명 추출 (위원회, 특별행정심판원, 부처) # 위원회 (11개) committee_patterns = { "개인정보보호위원회": "개인정보보호위원회", "금융위원회": "금융위원회", "노동위원회": "노동위원회", "고용보험심사위원회": "고용보험심사위원회", "국민권익위원회": "국민권익위원회", "방송미디어통신위원회": "방송미디어통신위원회", "산업재해보상보험재심사위원회": "산업재해보상보험재심사위원회", "중앙토지수용위원회": "중앙토지수용위원회", "중앙환경분쟁조정위원회": "중앙환경분쟁조정위원회", "증권선물위원회": "증권선물위원회", "국가인권위원회": "국가인권위원회", } # 특별행정심판원 (4개) tribunal_patterns = { "조세심판원": "조세심판원", "해양안전심판원": "해양안전심판원", "국민권익위원회": "국민권익위원회", "인사혁신처 소청심사위원회": "인사혁신처 소청심사위원회", } # 부처 (39개) - 법령해석/행정규칙 검색용 agency_patterns = { "기획재정부": "기획재정부", "국세청": "국세청", "관세청": "관세청", "고용노동부": "고용노동부", "교육부": "교육부", "보건복지부": "보건복지부", "질병관리청": "질병관리청", "식품의약품안전처": "식품의약품안전처", "법무부": "법무부", "외교부": "외교부", "국방부": "국방부", "방위사업청": "방위사업청", "병무청": "병무청", "행정안전부": "행정안전부", "경찰청": "경찰청", "소방청": "소방청", "해양경찰청": "해양경찰청", "문화체육관광부": "문화체육관광부", "농림축산식품부": "농림축산식품부", "농촌진흥청": "농촌진흥청", "산림청": "산림청", "산업통상부": "산업통상부", "중소벤처기업부": "중소벤처기업부", "과학기술정보통신부": "과학기술정보통신부", "국가데이터처": "국가데이터처", "지식재산처": "지식재산처", "기상청": "기상청", "해양수산부": "해양수산부", "국토교통부": "국토교통부", "행정중심복합도시건설청": "행정중심복합도시건설청", "기후에너지환경부": "기후에너지환경부", "통일부": "통일부", "국가보훈부": "국가보훈부", "성평등가족부": "성평등가족부", "재외동포청": "재외동포청", "인사혁신처": "인사혁신처", "법제처": "법제처", "조달청": "조달청", "국가유산청": "국가유산청", } # 위원회 매칭 if search_type == "committee": for agency_name, agency_key in committee_patterns.items(): if agency_name in query: params["committee_type"] = agency_key break # 특별행정심판원 매칭 elif search_type == "special_appeal": for agency_name, agency_key in tribunal_patterns.items(): if agency_name in query: params["tribunal_type"] = agency_key break # 부처 매칭 (법령해석/행정규칙 검색용) elif search_type in ["interpretation", "rule"]: for agency_name, agency_key in agency_patterns.items(): if agency_name in query: params["agency"] = agency_key break # 지방자치단체 매칭 (자치법규 검색용) elif search_type == "ordinance": # 주요 지방자치단체명 패턴 local_gov_patterns = { "서울": "서울특별시", "부산": "부산광역시", "대구": "대구광역시", "인천": "인천광역시", "광주": "광주광역시", "대전": "대전광역시", "울산": "울산광역시", "세종": "세종특별자치시", "경기": "경기도", "강원": "강원특별자치도", "충북": "충청북도", "충남": "충청남도", "전북": "전북특별자치도", "전남": "전라남도", "경북": "경상북도", "경남": "경상남도", "제주": "제주특별자치도", } for pattern, full_name in local_gov_patterns.items(): if pattern in query: params["local_government"] = full_name break return params async def smart_search( self, query: str, search_types: Optional[List[str]] = None, max_results_per_type: int = 5, arguments: Optional[dict] = None ) -> Dict: """ 사용자 질문을 분석하여 적절한 검색을 자동으로 수행 Args: query: 사용자 질문 search_types: 강제로 검색할 타입 목록 (None이면 자동 분석) max_results_per_type: 타입당 최대 결과 수 arguments: 추가 인자 (API 키 등) Returns: 통합 검색 결과 """ import asyncio # 의도 분석 clarification_needed = False possible_intents = [] # 매우 모호한 질문인지 먼저 확인 (의도 분석 전에) query_stripped = query.strip() very_ambiguous_keywords = ["법", "법률", "정보", "찾아줘", "알려줘", "확인", "검색", "알려주세요", "찾아주세요"] very_ambiguous = ( len(query_stripped) <= 3 or query_stripped in very_ambiguous_keywords ) if very_ambiguous: clarification_needed = True possible_intents = [ {"type": "law", "description": "법령 검색", "example": "형법 제250조"}, {"type": "precedent", "description": "판례 검색", "example": "손해배상 판례"}, {"type": "interpretation", "description": "법령해석 검색", "example": "개인정보보호법 해석"}, {"type": "administrative_appeal", "description": "행정심판 검색", "example": "행정심판 사례"}, {"type": "constitutional", "description": "헌재결정 검색", "example": "위헌 결정례"} ] if search_types is None and not clarification_needed: intent_results = self.analyze_intent(query) # 여러 의도 동시 감지: 신뢰도 0.3 이상인 모든 의도 포함 # 예: "형법 제250조와 관련 판례" → ["law", "precedent"] search_types = [st for st, conf in intent_results if conf > 0.3] # 모호한 질문 처리: 의도가 명확하지 않으면 법령 검색 기본값 if not search_types: # 매우 모호한 질문인 경우 clarification 필요 # 단일 단어이거나 매우 짧은 질문인 경우 query_stripped = query.strip() very_ambiguous_keywords = ["법", "법률", "정보", "찾아줘", "알려줘", "확인", "검색", "알려주세요", "찾아주세요"] very_ambiguous = ( len(query_stripped) <= 3 or query_stripped in very_ambiguous_keywords ) if very_ambiguous: clarification_needed = True # 가능한 의도 후보 생성 possible_intents = [ {"type": "law", "description": "법령 검색", "example": "형법 제250조"}, {"type": "precedent", "description": "판례 검색", "example": "손해배상 판례"}, {"type": "interpretation", "description": "법령해석 검색", "example": "개인정보보호법 해석"}, {"type": "administrative_appeal", "description": "행정심판 검색", "example": "행정심판 사례"}, {"type": "constitutional", "description": "헌재결정 검색", "example": "위헌 결정례"} ] # clarification이 필요한 경우 search_types를 설정하지 않음 else: # "관련" 같은 키워드가 있으면 법령 검색 # 단, "찾아줘", "알려줘" 같은 단독 키워드는 이미 very_ambiguous에서 처리됨 if "관련" in query: search_types = ["law"] else: search_types = ["law"] # 기본값 # clarification이 필요한 경우 조기 반환 (search_types 설정 전에) if clarification_needed: return { "success": False, "clarification_needed": True, "query": query, "possible_intents": possible_intents, "suggestion": "더 구체적인 질문을 해주시면 정확한 정보를 찾아드릴 수 있습니다. 예: '형법 제250조', '손해배상 판례', '개인정보보호법 해석' 등" } # search_types가 없으면 기본값 설정 if not search_types: search_types = ["law"] # 기본값 # 시간 조건 파싱 (공통) time_condition = self.parse_time_condition(query) # 파라미터 추출 all_params = {} for st in search_types: params = self.extract_parameters(query, st) # 시간 조건 추가 (판례/헌재결정/행정심판 등에 적용) if time_condition and st in ["precedent", "constitutional", "administrative_appeal", "committee", "special_appeal"]: params.update(time_condition) all_params[st] = params # 쿼리 전처리: 긴 문장에서 핵심 키워드만 추출 (API 에러 방지) def extract_keywords(text: str) -> str: """긴 문장에서 핵심 키워드만 추출""" # 법령명 패턴 제거 (이미 extract_parameters에서 처리) # 질문어 제거 question_words = ["인가", "인지", "인가요", "인지요", "인가?", "인지?", "뭐야", "뭐야?", "알려줘", "알려줘요", "찾아줘", "찾아줘요"] cleaned = text for qw in question_words: cleaned = cleaned.replace(qw, "") # 핵심 키워드 추출 (2-4글자 명사 위주) import re # 한글 명사 패턴 (2글자 이상) keywords = re.findall(r'[가-힣]{2,}', cleaned) # 중복 제거하고 길이 순 정렬 keywords = sorted(set(keywords), key=len, reverse=True) # 상위 3-5개만 선택 return " ".join(keywords[:5]) # 키워드 추출 keyword_query = extract_keywords(query) # 병렬 검색 실행 results = {} for search_type in search_types[:3]: # 최대 3개 타입만 검색 try: params = all_params.get(search_type, {"query": query}) params["per_page"] = max_results_per_type params["page"] = 1 if search_type == "law": if "law_name" in params: # get_law 시그니처: get_law(law_id=None, law_name=None, mode="detail", article_number=None, ...) mode = "single" if "article_number" in params else "detail" # 항, 호, 목 파라미터도 전달 (복잡한 파라미터 자동 추출 강화) result = await asyncio.to_thread( self.law_detail_repo.get_law, None, # law_id params["law_name"], # law_name mode, # mode params.get("article_number"), # article_number params.get("hang"), # hang (자동 추출) params.get("ho"), # ho (자동 추출) params.get("mok"), # mok (자동 추출) arguments ) else: # 첫 시도: 원본 query result = await asyncio.to_thread( self.law_search_repo.search_law, query, 1, max_results_per_type, arguments ) # 실패 시 Fallback: 키워드만으로 재시도 if result and "error" in result and not result.get("laws"): if keyword_query and keyword_query != query: import logging logger = logging.getLogger("lexguard-mcp") logger.info(f"Law search fallback: using keywords '{keyword_query}' instead of full query") result = await asyncio.to_thread( self.law_search_repo.search_law, keyword_query, 1, max_results_per_type, arguments ) # 여전히 실패 시: 도메인별 직접 법령명 검색 if result and "error" in result and not result.get("laws"): # 노동 관련 키워드가 있으면 "근로기준법" 직접 검색 if any(k in query for k in ["근로", "노동", "해고", "퇴직", "임금", "프리랜서", "근로자"]): import logging logger = logging.getLogger("lexguard-mcp") logger.info("Law search fallback: directly searching '근로기준법'") result = await asyncio.to_thread( self.law_detail_repo.get_law, None, "근로기준법", "detail", None, None, None, None, arguments ) elif search_type == "precedent": # 첫 시도: 원본 query result = await asyncio.to_thread( self.precedent_repo.search_precedent, query, 1, max_results_per_type, None, None, None, arguments ) # 실패 시 Fallback: 키워드만으로 재시도 if result and "error" in result and not result.get("precedents"): if keyword_query and keyword_query != query: import logging logger = logging.getLogger("lexguard-mcp") logger.info(f"Precedent search fallback: using keywords '{keyword_query}' instead of full query") result = await asyncio.to_thread( self.precedent_repo.search_precedent, keyword_query, 1, max_results_per_type, None, None, None, arguments ) # 여전히 실패 시: 핵심 키워드 1-2개만으로 재시도 if result and "error" in result and not result.get("precedents"): keywords = keyword_query.split() if len(keywords) >= 2: # 가장 긴 키워드 2개만 사용 short_query = " ".join(keywords[:2]) import logging logger = logging.getLogger("lexguard-mcp") logger.info(f"Precedent search fallback: using short query '{short_query}'") result = await asyncio.to_thread( self.precedent_repo.search_precedent, short_query, 1, max_results_per_type, None, None, None, arguments ) elif search_type == "interpretation": # 첫 시도: 원본 query result = await asyncio.to_thread( self.interpretation_repo.search_law_interpretation, query, 1, max_results_per_type, params.get("agency"), # 부처명 전달 arguments ) # 실패 시 Fallback: 키워드만으로 재시도 if result and "error" in result and not result.get("interpretations"): if keyword_query and keyword_query != query: import logging logger = logging.getLogger("lexguard-mcp") logger.info(f"Interpretation search fallback: using keywords '{keyword_query}' instead of full query") result = await asyncio.to_thread( self.interpretation_repo.search_law_interpretation, keyword_query, 1, max_results_per_type, params.get("agency"), arguments ) elif search_type == "administrative_appeal": result = await asyncio.to_thread( self.appeal_repo.search_administrative_appeal, query, 1, max_results_per_type, None, None, arguments ) elif search_type == "constitutional": result = await asyncio.to_thread( self.constitutional_repo.search_constitutional_decision, query, 1, max_results_per_type, None, None, arguments ) elif search_type == "committee" and "committee_type" in params: result = await asyncio.to_thread( self.committee_repo.search_committee_decision, params["committee_type"], query, 1, max_results_per_type, arguments ) elif search_type == "special_appeal" and "tribunal_type" in params: result = await asyncio.to_thread( self.special_appeal_repo.search_special_administrative_appeal, params["tribunal_type"], query, 1, max_results_per_type, arguments ) elif search_type == "ordinance": result = await asyncio.to_thread( self.ordinance_repo.search_local_ordinance, query, None, 1, max_results_per_type, arguments ) elif search_type == "rule": result = await asyncio.to_thread( self.rule_repo.search_administrative_rule, query, params.get("agency"), # 부처명 전달 1, max_results_per_type, arguments ) elif search_type == "comparison" and "law_name" in params: # 법령 비교는 law_name이 필요 compare_type = params.get("compare_type", "신구법") result = await asyncio.to_thread( self.comparison_repo.compare_laws, params["law_name"], compare_type, arguments ) else: continue # 결과가 있으면 추가 if result: # 에러가 없으면 무조건 추가 if "error" not in result: results[search_type] = result # 에러가 있어도 부분 결과가 있으면 추가 elif (result.get("laws") or result.get("precedents") or result.get("interpretations") or result.get("appeals") or result.get("decisions") or result.get("law_name") or result.get("law_id") or result.get("detail") or result.get("precedent") or result.get("interpretation")): results[search_type] = result else: # 에러만 있고 결과가 없으면 로깅만 하고 추가하지 않음 logger.debug(f"Result for {search_type} has error and no data: {result.get('error', 'Unknown error')}") except Exception as e: logger.exception(f"Error in smart_search for {search_type}: {e}") # 에러도 결과에 포함하여 디버깅 가능하게 results[search_type] = { "error": str(e), "recovery_guide": "시스템 오류가 발생했습니다. 서버 로그를 확인하거나 관리자에게 문의하세요." } # 부분 실패 처리 개선 successful_types = [] failed_types = [] partial_success = False for search_type, result in results.items(): # result가 딕셔너리인지 확인 if not isinstance(result, dict): continue # 에러가 없는 경우 if "error" not in result: successful_types.append(search_type) else: # 에러가 있지만 부분 결과가 있는지 확인 has_partial_data = False # 다양한 결과 필드 확인 data_fields = [ "laws", "precedents", "interpretations", "appeals", "decisions", "law_name", "law_id", "detail", "precedent", "interpretation", "total", "count", "items", "data" ] for field in data_fields: if field in result and result[field]: has_partial_data = True break # 리스트나 딕셔너리 타입의 결과 확인 if not has_partial_data: for key, value in result.items(): if key != "error" and key != "recovery_guide": if isinstance(value, (list, dict)) and len(value) > 0: has_partial_data = True break elif value and not isinstance(value, str): has_partial_data = True break if has_partial_data: partial_success = True successful_types.append(search_type) else: failed_types.append(search_type) # sources_count 계산 sources_count = { "law": 0, "precedent": 0, "interpretation": 0, "administrative_appeal": 0, "constitutional": 0, "committee": 0, "special_appeal": 0, "ordinance": 0, "rule": 0 } for search_type, result in results.items(): if isinstance(result, dict): if search_type == "law": if "laws" in result: sources_count["law"] = len(result.get("laws", [])) elif "law_name" in result: sources_count["law"] = 1 elif search_type == "precedent" and "precedents" in result: sources_count["precedent"] = len(result.get("precedents", [])) elif search_type == "interpretation" and "interpretations" in result: sources_count["interpretation"] = len(result.get("interpretations", [])) elif search_type == "administrative_appeal" and "appeals" in result: sources_count["administrative_appeal"] = len(result.get("appeals", [])) elif search_type == "constitutional" and "decisions" in result: sources_count["constitutional"] = len(result.get("decisions", [])) elif search_type == "committee" and "decisions" in result: sources_count["committee"] = len(result.get("decisions", [])) elif search_type == "special_appeal" and "appeals" in result: sources_count["special_appeal"] = len(result.get("appeals", [])) elif search_type == "ordinance" and "ordinances" in result: sources_count["ordinance"] = len(result.get("ordinances", [])) elif search_type == "rule" and "rules" in result: sources_count["rule"] = len(result.get("rules", [])) # has_legal_basis 판단 total_sources = sum(sources_count.values()) has_legal_basis = total_sources > 0 # missing_reason 판단 missing_reason = None if not has_legal_basis: # API 에러 여부 확인 (api_error / error+api_url / text/html) api_error_found = False html_error_found = False auth_error_found = False timeout_error_found = False other_error_found = False for _, result in results.items(): if isinstance(result, dict): content_type = result.get("content_type") or result.get("api_error", {}).get("content_type") error_code = result.get("error_code") or result.get("api_error", {}).get("error_code") if error_code == "API_ERROR_HTML": html_error_found = True if error_code == "API_ERROR_AUTH": auth_error_found = True if error_code == "API_ERROR_TIMEOUT": timeout_error_found = True if error_code == "API_ERROR_OTHER": other_error_found = True if (error_code in {"API_ERROR_HTML", "API_ERROR_AUTH", "API_ERROR_TIMEOUT", "API_ERROR_OTHER"} or "api_error" in result or ("error" in result and "api_url" in result) or (isinstance(content_type, str) and content_type.lower().startswith("text/html"))): api_error_found = True break if api_error_found: if html_error_found: missing_reason = "API_ERROR_HTML" elif auth_error_found: missing_reason = "API_ERROR_AUTH" elif timeout_error_found: missing_reason = "API_ERROR_TIMEOUT" else: missing_reason = "API_ERROR_OTHER" if other_error_found else "API_ERROR_OTHER" else: from ..repositories.base import BaseLawRepository api_key = BaseLawRepository.get_api_key(None) if BaseLawRepository.is_placeholder_key(api_key): missing_reason = "API_ERROR_AUTH" else: missing_reason = "NO_MATCH" # API 에러 시 기본 법적 근거(정적) 제공 fallback_legal_basis = None if missing_reason == "API_ERROR": fallback_items = [] if any(k in query for k in ["근로자", "근로기준법", "프리랜서", "임금", "출퇴근", "지휘", "감독"]): fallback_items.append({ "type": "law", "title": "근로기준법 제2조 제1항 제1호(근로자 정의)", "summary": "근로자는 임금을 목적으로 사업 또는 사업장에 근로를 제공하는 자를 말합니다.", "source": "static_reference" }) fallback_items.append({ "type": "precedent", "title": "근로자성 판단 기준(대법원 판례 취지)", "summary": "계약 명칭보다 실질을 중시하고, 근무시간·장소 지정, 지휘·감독, 고정급 여부, 전속성 등을 종합 고려합니다.", "source": "static_reference" }) if any(k in query for k in ["임대차", "전세", "보증금", "임대인", "임차인", "계약서"]): fallback_items.append({ "type": "law", "title": "주택임대차보호법(보증금 반환·임차인 보호 규정)", "summary": "보증금 반환 및 임차인 보호를 위한 규정이 있으며, 계약 해지·보증금 반환 관련 쟁점이 발생할 수 있습니다.", "source": "static_reference" }) fallback_items.append({ "type": "law", "title": "민법 임대차 규정(해지·특약 효력)", "summary": "임대차 계약의 해지 요건과 특약 효력은 민법 규정 및 판례에 따라 판단됩니다.", "source": "static_reference" }) if fallback_items: fallback_legal_basis = { "items": fallback_items, "note": "API 오류로 실시간 근거를 조회하지 못해 일반적 법적 근거를 제공합니다. 실제 적용 전 확인이 필요합니다." } # 에러 정보 보존 errors = {} for search_type, result in results.items(): if isinstance(result, dict): content_type = result.get("content_type") or result.get("api_error", {}).get("content_type") if "error" in result or "api_error" in result: errors[search_type] = result elif isinstance(content_type, str) and content_type.lower().startswith("text/html"): errors[search_type] = result # citations 생성 citations = [] for search_type, result in results.items(): if isinstance(result, dict): if search_type == "law" and "law_name" in result: citations.append({ "type": "law", "id": result.get("law_id"), "name": result.get("law_name"), "source": "국가법령정보센터" }) elif search_type == "precedent" and "precedents" in result: for prec in result.get("precedents", [])[:3]: citations.append({ "type": "precedent", "id": prec.get("precedent_id"), "case_number": prec.get("case_number"), "court": prec.get("court_name"), "date": prec.get("judgment_date"), "source": "대법원/법원" }) elif search_type == "interpretation" and "interpretations" in result: for interp in result.get("interpretations", [])[:3]: citations.append({ "type": "interpretation", "id": interp.get("interpretation_id"), "agency": interp.get("agency_name"), "date": interp.get("issue_date"), "source": "정부 부처" }) # one_line_answer 생성 (근거 있을 때만) one_line_answer = None if has_legal_basis: if "law" in results and results["law"]: law_result = results["law"] if "article" in law_result: article = law_result["article"] one_line_answer = f"{law_result.get('law_name', '법령')} {article.get('article_number', '')}: {article.get('content', '')[:100]}..." elif "law_name" in law_result: one_line_answer = f"{law_result.get('law_name', '법령')} 관련 정보를 찾았습니다." elif "precedent" in results and results["precedent"]: prec_result = results["precedent"] if "precedents" in prec_result and prec_result["precedents"]: prec = prec_result["precedents"][0] one_line_answer = f"{prec.get('case_number', '')} 사건: {prec.get('case_name', '')[:100]}..." # next_questions 생성 (사실관계 질문 5개) # smart_search는 domain 정보를 직접 모르므로, query 키워드 기반으로 간단 추론 next_questions = [] query_lower = query.lower() if any(k in query for k in ["근로", "해고", "퇴직", "임금", "노동"]): # 노동/근로 관련 next_questions = [ "근로 기간은 얼마나 되나요?", "해고 사유는 무엇인가요?", "퇴직금 지급 여부는 어떻게 되나요?", "근로계약서에 명시된 내용은 무엇인가요?", "노동위원회에 신고하셨나요?" ] elif any(k in query for k in ["개인정보", "프라이버시", "신용정보"]): # 개인정보 관련 next_questions = [ "개인정보 유출 경로는 무엇인가요?", "유출된 정보의 종류는 무엇인가요?", "유출 사실을 언제 알게 되셨나요?", "개인정보보호위원회에 신고하셨나요?", "피해 규모는 어느 정도인가요?" ] elif any(k in query for k in ["세금", "소득세", "부가가치세", "종합소득세", "조세"]): # 세금/조세 관련 next_questions = [ "부과된 세금의 종류는 무엇인가요?", "세금 부과 근거는 무엇인가요?", "이의신청 기간은 언제까지인가요?", "조세심판원에 심판을 제기하셨나요?", "관련 서류는 준비되어 있나요?" ] else: # 일반적인 기본 질문 next_questions = [ "구체적인 상황을 더 자세히 설명해주세요.", "관련 서류나 증거가 있나요?", "언제부터 문제가 시작되었나요?", "관련 기관에 신고하셨나요?", "피해 규모는 어느 정도인가요?" ] legal_basis_summary = { "has_legal_basis": has_legal_basis, "types": [k for k, v in sources_count.items() if v > 0], "counts": sources_count, "missing_reason": missing_reason } # legal_basis_block_text 생성 (상단 요약용) citations_titles = [] for c in citations[:5]: if isinstance(c, dict): title = c.get("name") or c.get("case_number") or c.get("id") if title: citations_titles.append(str(title)) fallback_titles = [] if fallback_legal_basis and isinstance(fallback_legal_basis, dict): for item in fallback_legal_basis.get("items", [])[:3]: if isinstance(item, dict) and item.get("title"): fallback_titles.append(item.get("title")) if has_legal_basis: legal_basis_block_text = ( "법적 근거 요약: " f"유형={','.join(legal_basis_summary.get('types', [])) or '없음'}, " f"근거 수={sum(sources_count.values())}. " f"주요 근거={', '.join(citations_titles) if citations_titles else '없음'}" ) else: legal_basis_block_text = ( "법적 근거 요약: " f"근거를 찾지 못했습니다({missing_reason}). " f"대체 근거={', '.join(fallback_titles) if fallback_titles else '없음'}" ) response = { "success": True, "has_legal_basis": has_legal_basis, "query": query, "detected_intents": search_types, "results": results, "total_types": len(results), "successful_types": successful_types, "failed_types": failed_types if failed_types else None, "partial_success": partial_success or (successful_types and failed_types), "sources_count": sources_count, "missing_reason": missing_reason, "legal_basis_summary": legal_basis_summary, "fallback_legal_basis": fallback_legal_basis, "errors": errors, "citations": citations[:10], # 최대 10개 "one_line_answer": one_line_answer, "next_questions": next_questions[:5], # 최대 5개 "legal_basis_block_text": legal_basis_block_text, "response_policy": { "must_include": ["legal_basis_block_text", "legal_basis_block", "legal_basis_summary", "citations"], "preferred_order": ["legal_basis_block_text", "legal_basis_block", "one_line_answer"], "if_has_legal_basis_false": "no_conclusions", "when_api_error": "explain_api_error_and_request_retry" } } # 안내 메시지 추가 if partial_success or (successful_types and failed_types): if failed_types: response["note"] = f"일부 검색 타입({', '.join(failed_types)})에서 오류가 발생했지만, 다른 타입({', '.join(successful_types)})에서는 결과를 찾았습니다." else: response["note"] = f"모든 검색 타입({', '.join(successful_types)})에서 결과를 찾았습니다." elif successful_types and not failed_types: response["note"] = f"모든 검색 타입({', '.join(successful_types)})에서 성공적으로 결과를 찾았습니다." elif not successful_types and failed_types: response["note"] = f"모든 검색 타입({', '.join(failed_types)})에서 오류가 발생했습니다." return response

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/SeoNaRu/lexguard-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

smart_search_service.py•60.1 KiB