opencode 로 바꾸고 작업전 커밋

2026-05-08 17:22:10 +09:00
parent 15c17522c8
commit e923aab43b
202 changed files with 1336027 additions and 115 deletions
--- a/mcp-server/worker/nl2sql_worker.py
+++ b/mcp-server/worker/nl2sql_worker.py
@@ -73,6 +73,39 @@ PostgreSQL 시계열 데이터베이스 스키마
  livevalue   TEXT         - 현재값
  timestamp   TIMESTAMPTZ  - 최종 갱신 시각

+테이블: tag_metadata  (태그 메타데이터 - 변경 드묾)
+  base_tag    TEXT         - 기본 태그명 (예: 'ficq-6101', 'xv-6124')
+  attribute   TEXT         - 속성명 ('desc', 'area', 'state0descriptor', ...)
+  value       TEXT         - 메타데이터 값
+  node_id     TEXT         - OPC UA 노드 ID
+  loaded_at   TIMESTAMPTZ  - 마지막 로드 시각
+
+뷰: v_tag_summary  (실시간값 + 메타데이터 통합 뷰)
+  base_tag          TEXT   - 기본 태그명
+  pv                TEXT   - 현재 프로세스 값
+  sp                TEXT   - 설정값
+  op                TEXT   - 출력값
+  instate0          TEXT   - 상태 비트 0 (true/false)
+  instate1          TEXT   - 상태 비트 1 (true/false)
+  instate2          TEXT   - 상태 비트 2 (true/false)
+  description       TEXT   - 장비 설명 (tag_metadata.desc)
+  area              TEXT   - 소속 플랜트 (tag_metadata.area)
+  state0_descriptor TEXT   - 비트 0 의미 (예: "Run/Stop")
+  state1_descriptor TEXT   - 비트 1 의미 (예: "Remote/Local")
+  state2_descriptor TEXT   - 비트 2 의미 (예: "Trip/Normal")
+
+새로운 태그 타입:
+  - 아날로그: ficq-6101.pv/sp/op (Double)
+  - 디지털 XV: xv-6124.pv/op (Int32), xv-6124.instate0~7 (Boolean)
+  - Pump: p-6102.pv/op (Int32), p-6102.instate0~7 (Boolean)
+  - 메타데이터: desc (String), area (Enum), state0descriptor~7 (String)
+
+BCD 상태 조회 팁:
+  - instate0~7은 Boolean (true/false)
+  - state0descriptor~7은 해당 비트의 의미 설명
+  - instate0=true이고 state0descriptor="Run/Stop"이면 → "Run" 상태
+  - v_tag_summary 뷰를 사용하면 실시간값+메타데이터 한 번에 조회 가능
+
 N분 간격 집계 공식 (time_bucket 금지, date_trunc 사용):
  1분 버킷: date_trunc('minute', recorded_at) AS bucket
  2분 버킷: to_timestamp(FLOOR(EXTRACT(EPOCH FROM recorded_at)/120)*120) AS bucket
@@ -121,7 +154,7 @@ async def _generate_sql(natural_language: str) -> str:
    )
    
    response = await client.chat.completions.create(
-        model=VLLM_MODEL,
+        model="Qwen3.6-27B-FP8",
        messages=[
            {"role": "system", "content": system},
            {"role": "user", "content": natural_language},
--- a/mcp-server/worker/pid_extract_gauge.py
+++ b/mcp-server/worker/pid_extract_gauge.py
@@ -0,0 +1,62 @@
+#!/usr/bin/env python3
+"""P&ID 게이지 추출기
+
+PG, TG, LG 등 게이지 전용 추출.
+
+사용법:
+    python pid_extract_gauge.py --input full_text.txt --output gauge.json
+"""
+
+import sys
+import os
+
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+
+from pid_extract_template import call_llm
+from pid_extract_prompts import _GAUGE_PROMPT
+import argparse
+import json
+import logging
+import time
+
+logger = logging.getLogger("pid_extractor.gauge")
+
+def extract(input_text: str, max_tokens: int = 65536) -> list:
+    """게이지 태그 추출."""
+    return call_llm(_GAUGE_PROMPT, input_text, max_tokens=max_tokens)
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="P&ID 게이지 추출기")
+    parser.add_argument("--input", required=True, help="입력 텍스트 파일 경로")
+    parser.add_argument("--output", required=True, help="출력 JSON 파일 경로")
+    parser.add_argument("--max-tokens", type=int, default=65536, help="최대 토큰 수")
+    
+    args = parser.parse_args()
+    
+    with open(args.input, "r", encoding="utf-8") as f:
+        input_text = f.read()
+    
+    logger.info(f"입력 파일 읽기 완료: {len(input_text)}자")
+    
+    t0 = time.time()
+    tags = extract(input_text, max_tokens=args.max_tokens)
+    elapsed = time.time() - t0
+    
+    logger.info(f"추출 완료: {len(tags)}개 태그, 소요 시간: {elapsed:.1f}초")
+    
+    output_dir = os.path.dirname(args.output)
+    if output_dir:
+        os.makedirs(output_dir, exist_ok=True)
+    
+    result = {
+        "success": True,
+        "count": len(tags),
+        "tags": tags,
+        "processing_time_sec": round(elapsed, 1),
+    }
+    
+    with open(args.output, "w", encoding="utf-8") as f:
+        json.dump(result, f, ensure_ascii=False, indent=2)
+    
+    logger.info(f"결과 저장 완료: {args.output}")
+    print(json.dumps({"success": True, "count": len(tags), "time": round(elapsed, 1)}, ensure_ascii=False))
--- a/mcp-server/worker/pid_extract_prompts.py
+++ b/mcp-server/worker/pid_extract_prompts.py
@@ -0,0 +1,78 @@
+"""P&ID 추출기용 계측기 유형별 프롬프트 정의"""
+
+# 공통 프롬프트 헤더
+_PROMPT_HEADER = """You are a P&ID (Piping and Instrumentation Diagram) expert.
+Extract ONLY the specified instrument types from the provided DXF text.
+Return ONLY a valid JSON array. Each element must have exactly these fields:
+{"tagNo":"FCV-101","equipmentName":null,"instrumentType":"FCV","lineNumber":null,"pidDrawingNo":null,"confidence":0.95}
+
+Rules:
+- tagNo: any token matching [LETTERS]-[DIGITS] or [LETTERS]-[DIGITS]-[SUFFIX]
+- instrumentType: leading letters of tagNo
+- equipmentName: descriptive name if present near tag, else null
+- lineNumber/pidDrawingNo: null unless explicitly associated
+- confidence: 0.95 for clear tags, lower for ambiguous
+- Output ONLY the JSON array, no markdown, no explanation.
+- If no tags found, return: []
+"""
+
+# 센서/계측기: FT, FIT, LT, PT, TE, PG, LG, TG
+_SENSOR_PROMPT = _PROMPT_HEADER + """
+Extract ONLY flow transmitters (FT/FIT), level transmitters (LT), 
+pressure transmitters (PT), temperature elements (TE), 
+pressure gauges (PG), level gauges (LG), temperature gauges (TG).
+
+Target instrument types: FT, FIT, FIC, LIC, PIC, TIC, LT, PT, TE, PG, LG, TG, 
+and their variants (e.g., FIT-XXXX, FT-XXXX).
+
+Examples: FT-101, FIT-10115, PT-201, LT-301, TE-401, PG-501, LG-601, TG-701
+"""
+
+# 밸브: FCV, TCV, LCV, PCV, XV, FV, LV, PV, TV
+_VALVE_PROMPT = _PROMPT_HEADER + """
+Extract ONLY control valves and on/off valves.
+
+Target instrument types: FCV, TCV, LCV, PCV, XV, FV, LV, PV, TV,
+BCV, GV, and their variants (e.g., FCV-XXXX, PCV-XXXX, XV-XXXX).
+
+Examples: FCV-101, TCV-201, LCV-301, PCV-401, XV-501, FV-601, LV-701, PV-801
+"""
+
+# 시스템/제어기: LI, PI, TI, FIQ, FICQ, TICA, PICA, LICA
+_SYSTEM_PROMPT = _PROMPT_HEADER + """
+Extract ONLY indicating instruments, recorders, and controllers.
+
+Target instrument types: LI, PI, TI, SI, HI, FIQ, FICQ, TICA, PICA, LICA,
+FIC, LIC, PIC, TIC, and their variants.
+
+Examples: LI-101, PI-201, TI-301, FIQ-401, FICQ-501, TICA-601, PICA-701, LICA-801
+"""
+
+# 게이지: PG, TG, LG
+_GAUGE_PROMPT = _PROMPT_HEADER + """
+Extract ONLY gauges (pressure, temperature, level).
+
+Target instrument types: PG, TG, LG, SG, HG, and their variants.
+
+Examples: PG-101, TG-201, LG-301, PG-10101, TG-10201
+"""
+
+# 펌프: P-10101, VP-10117, DP-10101 등
+_PUMP_PROMPT = _PROMPT_HEADER + """
+Extract ONLY pumps and compressors.
+
+Target equipment types: P (pump), VP (vertical pump), DP (dual pump), 
+C (compressor), CP (centrifugal pump), BP (booster pump), 
+and their variants.
+
+Examples: P-10101, VP-10117, DP-10101, C-10201, CP-10301, BP-10401
+"""
+
+# 프롬프트 매핑
+PROMPTS = {
+    "sensor": _SENSOR_PROMPT,
+    "valve": _VALVE_PROMPT,
+    "system": _SYSTEM_PROMPT,
+    "gauge": _GAUGE_PROMPT,
+    "pump": _PUMP_PROMPT,
+}
--- a/mcp-server/worker/pid_extract_pump.py
+++ b/mcp-server/worker/pid_extract_pump.py
@@ -0,0 +1,62 @@
+#!/usr/bin/env python3
+"""P&ID 펌프 추출기
+
+P-10101, VP-10117, DP-10101 등 펌프/압축기 전용 추출.
+
+사용법:
+    python pid_extract_pump.py --input full_text.txt --output pump.json
+"""
+
+import sys
+import os
+
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+
+from pid_extract_template import call_llm
+from pid_extract_prompts import _PUMP_PROMPT
+import argparse
+import json
+import logging
+import time
+
+logger = logging.getLogger("pid_extractor.pump")
+
+def extract(input_text: str, max_tokens: int = 65536) -> list:
+    """펌프/압축기 태그 추출."""
+    return call_llm(_PUMP_PROMPT, input_text, max_tokens=max_tokens)
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="P&ID 펌프 추출기")
+    parser.add_argument("--input", required=True, help="입력 텍스트 파일 경로")
+    parser.add_argument("--output", required=True, help="출력 JSON 파일 경로")
+    parser.add_argument("--max-tokens", type=int, default=65536, help="최대 토큰 수")
+    
+    args = parser.parse_args()
+    
+    with open(args.input, "r", encoding="utf-8") as f:
+        input_text = f.read()
+    
+    logger.info(f"입력 파일 읽기 완료: {len(input_text)}자")
+    
+    t0 = time.time()
+    tags = extract(input_text, max_tokens=args.max_tokens)
+    elapsed = time.time() - t0
+    
+    logger.info(f"추출 완료: {len(tags)}개 태그, 소요 시간: {elapsed:.1f}초")
+    
+    output_dir = os.path.dirname(args.output)
+    if output_dir:
+        os.makedirs(output_dir, exist_ok=True)
+    
+    result = {
+        "success": True,
+        "count": len(tags),
+        "tags": tags,
+        "processing_time_sec": round(elapsed, 1),
+    }
+    
+    with open(args.output, "w", encoding="utf-8") as f:
+        json.dump(result, f, ensure_ascii=False, indent=2)
+    
+    logger.info(f"결과 저장 완료: {args.output}")
+    print(json.dumps({"success": True, "count": len(tags), "time": round(elapsed, 1)}, ensure_ascii=False))
--- a/mcp-server/worker/pid_extract_sensor.py
+++ b/mcp-server/worker/pid_extract_sensor.py
@@ -0,0 +1,67 @@
+#!/usr/bin/env python3
+"""P&ID 센서/계측기 추출기
+
+FT, FIT, LT, PT, TE, PG, LG, TG 등 센서/계측기 전용 추출.
+
+사용법:
+    python pid_extract_sensor.py --input full_text.txt --output sensor.json
+"""
+
+import sys
+import os
+
+# mcp-server/worker 디렉토리를 경로에 추가
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+
+from pid_extract_template import parse_json_array, call_llm, main as template_main
+from pid_extract_prompts import _SENSOR_PROMPT
+import argparse
+import json
+import logging
+import time
+
+logger = logging.getLogger("pid_extractor.sensor")
+
+def extract(input_text: str, max_tokens: int = 65536) -> list:
+    """센서/계측기 태그 추출."""
+    return call_llm(_SENSOR_PROMPT, input_text, max_tokens=max_tokens)
+
+if __name__ == "__main__":
+    # --prompt를 자동으로 _SENSOR_PROMPT로 설정
+    parser = argparse.ArgumentParser(description="P&ID 센서/계측기 추출기")
+    parser.add_argument("--input", required=True, help="입력 텍스트 파일 경로")
+    parser.add_argument("--output", required=True, help="출력 JSON 파일 경로")
+    parser.add_argument("--max-tokens", type=int, default=65536, help="최대 토큰 수")
+    
+    args = parser.parse_args()
+    
+    # 입력 읽기
+    with open(args.input, "r", encoding="utf-8") as f:
+        input_text = f.read()
+    
+    logger.info(f"입력 파일 읽기 완료: {len(input_text)}자")
+    
+    # LLM 호출
+    t0 = time.time()
+    tags = extract(input_text, max_tokens=args.max_tokens)
+    elapsed = time.time() - t0
+    
+    logger.info(f"추출 완료: {len(tags)}개 태그, 소요 시간: {elapsed:.1f}초")
+    
+    # 결과 저장
+    output_dir = os.path.dirname(args.output)
+    if output_dir:
+        os.makedirs(output_dir, exist_ok=True)
+    
+    result = {
+        "success": True,
+        "count": len(tags),
+        "tags": tags,
+        "processing_time_sec": round(elapsed, 1),
+    }
+    
+    with open(args.output, "w", encoding="utf-8") as f:
+        json.dump(result, f, ensure_ascii=False, indent=2)
+    
+    logger.info(f"결과 저장 완료: {args.output}")
+    print(json.dumps({"success": True, "count": len(tags), "time": round(elapsed, 1)}, ensure_ascii=False))
--- a/mcp-server/worker/pid_extract_system.py
+++ b/mcp-server/worker/pid_extract_system.py
@@ -0,0 +1,62 @@
+#!/usr/bin/env python3
+"""P&ID 시스템/제어기 추출기
+
+LI, PI, TI, FIQ, FICQ, TICA, PICA, LICA 등 시스템/제어기 전용 추출.
+
+사용법:
+    python pid_extract_system.py --input full_text.txt --output system.json
+"""
+
+import sys
+import os
+
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+
+from pid_extract_template import call_llm
+from pid_extract_prompts import _SYSTEM_PROMPT
+import argparse
+import json
+import logging
+import time
+
+logger = logging.getLogger("pid_extractor.system")
+
+def extract(input_text: str, max_tokens: int = 65536) -> list:
+    """시스템/제어기 태그 추출."""
+    return call_llm(_SYSTEM_PROMPT, input_text, max_tokens=max_tokens)
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="P&ID 시스템/제어기 추출기")
+    parser.add_argument("--input", required=True, help="입력 텍스트 파일 경로")
+    parser.add_argument("--output", required=True, help="출력 JSON 파일 경로")
+    parser.add_argument("--max-tokens", type=int, default=65536, help="최대 토큰 수")
+    
+    args = parser.parse_args()
+    
+    with open(args.input, "r", encoding="utf-8") as f:
+        input_text = f.read()
+    
+    logger.info(f"입력 파일 읽기 완료: {len(input_text)}자")
+    
+    t0 = time.time()
+    tags = extract(input_text, max_tokens=args.max_tokens)
+    elapsed = time.time() - t0
+    
+    logger.info(f"추출 완료: {len(tags)}개 태그, 소요 시간: {elapsed:.1f}초")
+    
+    output_dir = os.path.dirname(args.output)
+    if output_dir:
+        os.makedirs(output_dir, exist_ok=True)
+    
+    result = {
+        "success": True,
+        "count": len(tags),
+        "tags": tags,
+        "processing_time_sec": round(elapsed, 1),
+    }
+    
+    with open(args.output, "w", encoding="utf-8") as f:
+        json.dump(result, f, ensure_ascii=False, indent=2)
+    
+    logger.info(f"결과 저장 완료: {args.output}")
+    print(json.dumps({"success": True, "count": len(tags), "time": round(elapsed, 1)}, ensure_ascii=False))
--- a/mcp-server/worker/pid_extract_template.py
+++ b/mcp-server/worker/pid_extract_template.py
@@ -0,0 +1,187 @@
+#!/usr/bin/env python3
+"""P&ID 태그 추출기 공통 템플릿
+
+독립 프로세스로서 CLI에서 실행되며, 
+입력 텍스트 파일에서 P&ID 태그를 추출하여 JSON 파일로 출력합니다.
+
+사용법:
+    python pid_extract_template.py --input full_text.txt --output result.json --prompt "system prompt text"
+    python pid_extract_template.py --input full_text.txt --output result.json --prompt-file prompt.txt
+
+환경 변수:
+    VLLM_BASE_URL: vLLM 엔드포인트 (기본: http://localhost:8000/v1)
+    VLLM_MODEL: 모델명 (기본: Qwen3.6-27B-FP8)
+"""
+
+import argparse
+import json
+import logging
+import os
+import re
+import sys
+import time
+from typing import List
+
+logging.basicConfig(
+    level=logging.INFO,
+    format="%(asctime)s [%(name)s] %(levelname)s %(message)s",
+)
+logger = logging.getLogger("pid_extractor")
+
+
+def parse_json_array(raw: str, finish_reason: str = "") -> list:
+    """LLM 출력에서 JSON 배열 추출. finish_reason=length 잘림 복구 포함."""
+    if raw.startswith("```"):
+        lines = raw.splitlines()
+        raw = "\n".join(lines[1:-1] if lines and lines[-1].strip() == "```" else lines[1:]).strip()
+
+    if finish_reason == "length":
+        last_close = raw.rfind("}")
+        if last_close != -1:
+            raw = raw[:last_close + 1] + "]"
+
+    # 가장 긴 균형 잡힌 [...] 추출
+    depth = 0
+    start = -1
+    best = ""
+    for i, c in enumerate(raw):
+        if c == "[":
+            if depth == 0:
+                start = i
+            depth += 1
+        elif c == "]":
+            depth -= 1
+            if depth == 0 and start >= 0:
+                cand = raw[start:i + 1]
+                if len(cand) > len(best):
+                    best = cand
+    raw = best if best else "[]"
+
+    try:
+        return json.loads(raw)
+    except json.JSONDecodeError:
+        data = []
+        for obj in re.findall(r"\{[^{}]*\}", raw, re.DOTALL):
+            try:
+                data.append(json.loads(obj))
+            except json.JSONDecodeError:
+                pass
+        return data
+
+
+def call_llm(system_prompt: str, user_text: str, max_tokens: int = 65536) -> List[dict]:
+    """
+    vLLM에 LLM 호출하여 태그 목록 추출.
+    
+    Args:
+        system_prompt: 시스템 프롬프트
+        user_text: 입력 텍스트
+        max_tokens: 최대 토큰 수
+    
+    Returns:
+        추출된 태그 목록 (JSON 배열)
+    """
+    from openai import OpenAI
+    
+    base_url = os.environ.get("VLLM_BASE_URL", "http://localhost:8000/v1")
+    model = os.environ.get("VLLM_MODEL", "Qwen3.6-27B-FP8")
+    
+    client = OpenAI(base_url=base_url, api_key="dummy")
+    
+    logger.info(f"vLLM 호출: {base_url}, 모델: {model}, max_tokens: {max_tokens}")
+    logger.info(f"입력 텍스트 길이: {len(user_text)}자")
+    
+    resp = client.chat.completions.create(
+        model=model,
+        messages=[
+            {"role": "system", "content": system_prompt},
+            {"role": "user", "content": user_text},
+        ],
+        max_tokens=max_tokens,
+        temperature=0.1,
+        extra_body={"chat_template_kwargs": {"enable_thinking": False}},
+    )
+    
+    raw = (resp.choices[0].message.content or "").strip()
+    finish_reason = resp.choices[0].finish_reason
+    
+    logger.info(f"LLM 응답: finish_reason={finish_reason}, 응답 길이={len(raw)}자")
+    
+    data = parse_json_array(raw, finish_reason)
+    
+    if finish_reason == "length":
+        logger.warning(f"finish_reason=length: 응답이 잘렸습니다. 복구 시도됨. 추출된 태그 수: {len(data)}")
+    
+    return data
+
+
+def main():
+    parser = argparse.ArgumentParser(description="P&ID 태그 추출기")
+    parser.add_argument("--input", required=True, help="입력 텍스트 파일 경로")
+    parser.add_argument("--output", required=True, help="출력 JSON 파일 경로")
+    parser.add_argument("--prompt", type=str, default=None, help="시스템 프롬프트 (인라인)")
+    parser.add_argument("--prompt-file", type=str, default=None, help="시스템 프롬프트 파일 경로")
+    parser.add_argument("--max-tokens", type=int, default=65536, help="최대 토큰 수 (기본: 65536)")
+    
+    args = parser.parse_args()
+    
+    # 1. 입력 텍스트 읽기
+    if not os.path.exists(args.input):
+        logger.error(f"입력 파일을 찾을 수 없습니다: {args.input}")
+        sys.exit(1)
+    
+    with open(args.input, "r", encoding="utf-8") as f:
+        input_text = f.read()
+    
+    logger.info(f"입력 파일 읽기 완료: {len(input_text)}자")
+    
+    # 2. 시스템 프롬프트 읽기
+    system_prompt = None
+    if args.prompt:
+        system_prompt = args.prompt
+    elif args.prompt_file:
+        if not os.path.exists(args.prompt_file):
+            logger.error(f"프롬프트 파일을 찾을 수 없습니다: {args.prompt_file}")
+            sys.exit(1)
+        with open(args.prompt_file, "r", encoding="utf-8") as f:
+            system_prompt = f.read()
+    else:
+        logger.error("--prompt 또는 --prompt-file 중 하나를 지정해야 합니다.")
+        sys.exit(1)
+    
+    logger.info(f"시스템 프롬프트: {len(system_prompt)}자")
+    
+    # 3. LLM 호출
+    t0 = time.time()
+    tags = call_llm(system_prompt, input_text, max_tokens=args.max_tokens)
+    elapsed = time.time() - t0
+    
+    logger.info(f"추출 완료: {len(tags)}개 태그, 소요 시간: {elapsed:.1f}초")
+    
+    # 4. 결과 JSON 쓰기
+    output_dir = os.path.dirname(args.output)
+    if output_dir:
+        os.makedirs(output_dir, exist_ok=True)
+    
+    result = {
+        "success": True,
+        "count": len(tags),
+        "tags": tags,
+        "processing_time_sec": round(elapsed, 1),
+    }
+    
+    with open(args.output, "w", encoding="utf-8") as f:
+        json.dump(result, f, ensure_ascii=False, indent=2)
+    
+    logger.info(f"결과 저장 완료: {args.output}")
+    
+    # 5. 요약 출력
+    print(json.dumps({
+        "success": True,
+        "count": len(tags),
+        "time": round(elapsed, 1)
+    }, ensure_ascii=False))
+
+
+if __name__ == "__main__":
+    main()
--- a/mcp-server/worker/pid_extract_valve.py
+++ b/mcp-server/worker/pid_extract_valve.py
@@ -0,0 +1,62 @@
+#!/usr/bin/env python3
+"""P&ID 밸브 추출기
+
+FCV, TCV, LCV, PCV, XV, FV, LV, PV, TV 등 밸브 전용 추출.
+
+사용법:
+    python pid_extract_valve.py --input full_text.txt --output valve.json
+"""
+
+import sys
+import os
+
+sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
+
+from pid_extract_template import call_llm
+from pid_extract_prompts import _VALVE_PROMPT
+import argparse
+import json
+import logging
+import time
+
+logger = logging.getLogger("pid_extractor.valve")
+
+def extract(input_text: str, max_tokens: int = 65536) -> list:
+    """밸브 태그 추출."""
+    return call_llm(_VALVE_PROMPT, input_text, max_tokens=max_tokens)
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="P&ID 밸브 추출기")
+    parser.add_argument("--input", required=True, help="입력 텍스트 파일 경로")
+    parser.add_argument("--output", required=True, help="출력 JSON 파일 경로")
+    parser.add_argument("--max-tokens", type=int, default=65536, help="최대 토큰 수")
+    
+    args = parser.parse_args()
+    
+    with open(args.input, "r", encoding="utf-8") as f:
+        input_text = f.read()
+    
+    logger.info(f"입력 파일 읽기 완료: {len(input_text)}자")
+    
+    t0 = time.time()
+    tags = extract(input_text, max_tokens=args.max_tokens)
+    elapsed = time.time() - t0
+    
+    logger.info(f"추출 완료: {len(tags)}개 태그, 소요 시간: {elapsed:.1f}초")
+    
+    output_dir = os.path.dirname(args.output)
+    if output_dir:
+        os.makedirs(output_dir, exist_ok=True)
+    
+    result = {
+        "success": True,
+        "count": len(tags),
+        "tags": tags,
+        "processing_time_sec": round(elapsed, 1),
+    }
+    
+    with open(args.output, "w", encoding="utf-8") as f:
+        json.dump(result, f, ensure_ascii=False, indent=2)
+    
+    logger.info(f"결과 저장 완료: {args.output}")
+    print(json.dumps({"success": True, "count": len(tags), "time": round(elapsed, 1)}, ensure_ascii=False))
--- a/mcp-server/worker/pid_worker.py
+++ b/mcp-server/worker/pid_worker.py
@@ -173,7 +173,7 @@ def _extract_pid_tags(text: str, source_type: str) -> str:
    )
    truncated = text[:100000]
    resp = _llm().chat.completions.create(
-        model=VLLM_MODEL,
+        model="Qwen3.6-27B-FP8",
        messages=[
            {"role": "system", "content": system},
            {"role": "user", "content": f"Source: {source_type}\n\nText:\n{truncated}"},
@@ -202,7 +202,7 @@ def _match_pid_tags(pid_tags: list, experion_tags: list) -> str:
        "- Output ONLY the JSON array.\n"
    )
    resp = _llm().chat.completions.create(
-        model=VLLM_MODEL,
+        model="Qwen3.6-27B-FP8",
        messages=[
            {"role": "system", "content": system},
            {"role": "user", "content": (
@@ -247,7 +247,7 @@ def _parse_pid_dxf(filepath: str) -> str:
                          ensure_ascii=False, indent=2)

    resp = _llm().chat.completions.create(
-        model=VLLM_MODEL,
+        model="Qwen3.6-27B-FP8",
        messages=[
            {"role": "system", "content": _TAG_EXTRACT_SYSTEM},
            {"role": "user", "content": f"Source: dxf\n\nText:\n{text[:8000]}"},
@@ -273,7 +273,7 @@ def _parse_pid_pdf(filepath: str, use_ocr: bool = True) -> str:
                          ensure_ascii=False, indent=2)

    resp = _llm().chat.completions.create(
-        model=VLLM_MODEL,
+        model="Qwen3.6-27B-FP8",
        messages=[
            {"role": "system", "content": _TAG_EXTRACT_SYSTEM},
            {"role": "user", "content": f"Source: pdf\n\nText:\n{text[:12000]}"},
@@ -313,92 +313,211 @@ def _parse_pid_drawing(filepath: str) -> str:

 # ── 그래프 도구 ───────────────────────────────────────────────────────────────

+import time
+
 async def _build_pid_graph_parallel(filepath: str) -> str:
+    """
+    P&ID 그래프 빌드 — 독립 프로세스 병렬 아키텍처.
+
+    Phase 1: 도면 분할 + 기하 추출
+    Phase 2: 전체 텍스트 1회 추출
+    Phase 3: 5개 독립 추출 프로세스 병렬 실행 (subprocess.Popen)
+    Phase 4: 결과 통합 + tagNo 기준 중복 제거
+    Phase 5: 위상 그래프 빌드 + 저장
+    """
    from pipeline.extractor import PidGeometricExtractor
    from pipeline.topology import PidTopologyBuilder
-    from pipeline.mapper import IntelligentMapper
-    from openai import AsyncOpenAI
+
+    import subprocess
+    import tempfile
+    import shutil

    os.makedirs(STORAGE_DIR, exist_ok=True)
+    t0 = time.time()
+    basename = os.path.basename(filepath)
+    worker_dir = os.path.dirname(os.path.abspath(__file__))
+    logging.info(f"[{basename}] === 독립 프로세스 병렬 아키텍처 시작 ===")

-    # Phase 1: 기하 추출
+    # ── Phase 1: 도면 분할 + 기하 추출 ──────────────────────────────
+    logging.info(f"[{basename}] Phase 1: 도면 분할 + 기하 추출 시작")
    extractor = PidGeometricExtractor(filepath)
-    geo_data_path = os.path.join(STORAGE_DIR, os.path.basename(filepath) + "_geo.json")
+    regions = extractor.split_drawings()
+    logging.info(f"[{basename}] 도면 분할: {len(regions)}개 영역")
+
+    geo_data_path = os.path.join(STORAGE_DIR, basename + "_geo.json")
    extractor.extract_and_save(geo_data_path)
    with open(geo_data_path, "r", encoding="utf-8") as f:
        geo_data = json.load(f)
+    logging.info(f"[{basename}] Phase 1 완료 ({time.time()-t0:.1f}s) - {len(geo_data)}개 엔티티")

-    # 시스템 태그 조회
-    system_tags: list[str] = []
-    try:
-        conn = _get_db_connection()
-        with conn.cursor() as cur:
-            cur.execute("SELECT tagname FROM realtime_table")
-            system_tags = [r[0] for r in cur.fetchall()]
-    except Exception as e:
-        logging.warning(f"시스템 태그 조회 실패: {e}")
+    # ── Phase 2: 전체 텍스트 1회 추출 ───────────────────────────────
+    t2 = time.time()
+    logging.info(f"[{basename}] Phase 2: 전체 텍스트 1회 추출")
+    full_text = _extract_text_from_dxf(filepath)
+
+    # 임시 디렉토리 생성 (프로세스 간 통신용)
+    temp_dir = tempfile.mkdtemp(prefix=f"pid_{basename.replace('.dxf', '')}_")
+    text_path = os.path.join(temp_dir, "full_text.txt")
+    with open(text_path, "w", encoding="utf-8") as f:
+        f.write(full_text)
+    logging.info(f"[{basename}] Phase 2 완료 ({time.time()-t2:.1f}s) - {len(full_text)}자")
+
+    # ── Phase 3: 5개 독립 추출 프로세스 병렬 실행 ───────────────────
+    t3 = time.time()
+    logging.info(f"[{basename}] Phase 3: 5개 독립 추출 프로세스 병렬 실행")
+
+    extractors = [
+        ("sensor", "pid_extract_sensor.py"),
+        ("valve",  "pid_extract_valve.py"),
+        ("system", "pid_extract_system.py"),
+        ("gauge",  "pid_extract_gauge.py"),
+        ("pump",   "pid_extract_pump.py"),
+    ]
+
+    results_dir = os.path.join(temp_dir, "results")
+    os.makedirs(results_dir, exist_ok=True)
+
+    processes = []
+    for name, script in extractors:
+        output_path = os.path.join(results_dir, f"{name}.json")
+        script_path = os.path.join(worker_dir, script)
+        cmd = [
+            sys.executable, script_path,
+            "--input", text_path,
+            "--output", output_path,
+        ]
+        try:
+            proc = subprocess.Popen(
+                cmd,
+                stdout=subprocess.PIPE,
+                stderr=subprocess.PIPE,
+                text=True,
+            )
+            processes.append((name, proc, output_path))
+            logging.info(f"[{basename}]   시작: {name} (pid={proc.pid})")
+        except Exception as e:
+            logging.error(f"[{basename}]   실행 실패 {name}: {e}")
+
+    # 모든 프로세스 대기 (timeout=300초)
+    for name, proc, output_path in processes:
+        try:
+            stdout, stderr = proc.communicate(timeout=300)
+            if proc.returncode != 0:
+                logging.error(f"[{basename}]   {name} 실패 (rc={proc.returncode}): {stderr[:200]}")
+            else:
+                logging.info(f"[{basename}]   {name} 완료: {stdout.strip()[:100]}")
+        except subprocess.TimeoutExpired:
+            proc.kill()
+            logging.error(f"[{basename}]   {name} 타임아웃 (300초)")
+
+    logging.info(f"[{basename}] Phase 3 완료 ({time.time()-t3:.1f}s)")
+
+    # ── Phase 4: 결과 JSON 통합 + tagNo 기준 중복 제거 ──────────────
+    t4 = time.time()
+    logging.info(f"[{basename}] Phase 4: 결과 통합 + 중복 제거")
+
+    all_tags = []
+    seen_tagnos = set()
+
+    for name, _, output_path in processes:
+        if not os.path.exists(output_path):
+            logging.warning(f"[{basename}]   결과 없음: {name}")
+            continue
+        try:
+            with open(output_path, "r", encoding="utf-8") as f:
+                result = json.load(f)
+            tags = result.get("tags", [])
+            count_new = 0
+            for tag in tags:
+                tag_no = tag.get("tagNo", "")
+                if tag_no and tag_no not in seen_tagnos:
+                    seen_tagnos.add(tag_no)
+                    all_tags.append(tag)
+                    count_new += 1
+            logging.info(f"[{basename}]   {name}: {len(tags)}개 중 {count_new}개 신규")
+        except Exception as e:
+            logging.error(f"[{basename}]   결과 로드 실패 {name}: {e}")
+
+    logging.info(f"[{basename}] Phase 4 완료 ({time.time()-t4:.1f}s) - 총 {len(all_tags)}개 태그")
+
+    # ── Phase 5: 위상 그래프 빌드 + 저장 ────────────────────────────
+    t5 = time.time()
+    logging.info(f"[{basename}] Phase 5: 위상 그래프 빌드")

-    # Phase 2: 1차 위상 빌더 (Mapper용 그래프)
    builder = PidTopologyBuilder(geo_data)
    builder.build_graph()

-    # Phase 3: 병렬 LLM 매핑
-    api_client = AsyncOpenAI(base_url=VLLM_BASE_URL, api_key="dummy")
-    mapper = IntelligentMapper(builder.G, system_tags, api_client=api_client)
+    # 추출된 태그를 그래프에 추가
+    from shapely.geometry import box as shapely_box
+    for tag in all_tags:
+        tag_no = tag.get("tagNo", "UNKNOWN")
+        eq_name = tag.get("equipmentName")
+        inst_type = tag.get("instrumentType")
+        confidence = tag.get("confidence", 0.5)

-    transmitter_nodes = [
-        n for n, d in builder.G.nodes(data=True)
-        if (d.get("value") or "").upper() in {"FIT", "FT", "LT", "PT", "TE"}
-    ]
-    valve_nodes = [
-        n for n, d in builder.G.nodes(data=True)
-        if (d.get("value") or "").upper() in {"FCV", "LCV", "TCV", "PCV", "XV"}
-    ]
-    equipment_nodes = [
-        n for n, d in builder.G.nodes(data=True)
-        if d.get("type") not in {"TEXT", "LINE", "LWPOLYLINE"}
-    ]
+        # 해당 태그의 bbox 찾기 (geo_data에서 clean_value 매칭)
+        matched_bbox = None
+        for entity in geo_data:
+            if entity.get("clean_value", "").upper() == tag_no.upper():
+                bbox = entity.get("bbox", {})
+                matched_bbox = (
+                    bbox.get("min_x"), bbox.get("min_y"),
+                    bbox.get("max_x"), bbox.get("max_y")
+                )
+                break

-    extracted_results = await asyncio.gather(
-        mapper.extract_transmitters(transmitter_nodes),
-        mapper.extract_valves(valve_nodes),
-        mapper.extract_equipment(equipment_nodes),
-    )
+        node_id = f"tag_{tag_no}"
+        if matched_bbox:
+            bbox_geom = shapely_box(matched_bbox[0], matched_bbox[1],
+                                     matched_bbox[2], matched_bbox[3])
+            builder.G.add_node(node_id,
+                               type="TEXT",
+                               bbox=bbox_geom,
+                               value=tag_no,
+                               equipment_name=eq_name,
+                               instrument_type=inst_type,
+                               confidence=confidence)
+        else:
+            builder.G.add_node(node_id,
+                               type="TEXT",
+                               bbox=shapely_box(0, 0, 1, 1),
+                               value=tag_no,
+                               equipment_name=eq_name,
+                               instrument_type=inst_type,
+                               confidence=confidence)

-    # 매핑 결과 통합
-    all_mapped_tags = []
-    for res_dict in extracted_results:
-        for node_id, mapping in res_dict.items():
-            if mapping.resolved_tag != "UNKNOWN":
-                node_data = builder.G.nodes[node_id]
-                all_mapped_tags.append({
-                    "entity_id": node_id,
-                    "tagName": mapping.resolved_tag,
-                    "bbox": (
-                        node_data["bbox"].bounds
-                        if hasattr(node_data["bbox"], "bounds")
-                        else node_data["bbox"]
-                    ),
-                    "clean_value": mapping.resolved_tag,
-                })
+    # 태그-설비 연결
+    equipments = [n for n, d in builder.G.nodes(data=True)
+                  if d.get("type") not in ("TEXT", "LINE", "LWPOLYLINE")]
+    if equipments:
+        eq_grid = builder._build_spatial_grid(equipments)
+        tag_ids = [f"tag_{t.get('tagNo', '')}" for t in all_tags]
+        for tag_id in tag_ids:
+            if tag_id in builder.G:
+                best_match = builder._find_nearest_equipment(tag_id, eq_grid)
+                if best_match:
+                    builder.G.add_edge(tag_id, best_match, relation="associated_with")

-    # Phase 4: 최종 위상 모델링 + 저장
-    final_builder = PidTopologyBuilder(geo_data, all_extracted_tags=all_mapped_tags)
-    final_builder.build_graph()
-
-    graph_id = os.path.basename(filepath).replace(".dxf", "_graph.json")
+    graph_id = basename.replace(".dxf", "_graph.json")
    graph_path = os.path.join(STORAGE_DIR, graph_id)
-    final_builder.save_graph(graph_path)
+    builder.save_graph(graph_path)

-    logging.info(f"build_pid_graph_parallel graph_id={graph_id} "
-                 f"nodes={final_builder.G.number_of_nodes()} "
-                 f"edges={final_builder.G.number_of_edges()}")
+    # 임시 디렉토리 정리
+    shutil.rmtree(temp_dir, ignore_errors=True)
+
+    total_time = time.time() - t0
+    logging.info(f"[{basename}] 전체 완료 ({total_time:.1f}s) - graph_id={graph_id} "
+                 f"nodes={builder.G.number_of_nodes()} "
+                 f"edges={builder.G.number_of_edges()} "
+                 f"tags={len(all_tags)}")
    return json.dumps({
        "success": True,
        "graph_id": graph_id,
        "graph_path": graph_path,
-        "nodes": final_builder.G.number_of_nodes(),
-        "edges": final_builder.G.number_of_edges(),
+        "nodes": builder.G.number_of_nodes(),
+        "edges": builder.G.number_of_edges(),
+        "tags_extracted": len(all_tags),
+        "processing_time_sec": round(total_time, 1)
    }, ensure_ascii=False)


--- a/mcp-server/worker/pid_worker_test.py
+++ b/mcp-server/worker/pid_worker_test.py
@@ -0,0 +1,609 @@
+#!/usr/bin/env python3
+"""P&ID 파싱 전용 워커 프로세스 (테스트용 - 절대 경로 지원)
+
+Usage: python pid_worker_test.py <port>
+
+담당 도구:
+  extract_pid_tags, match_pid_tags,
+  parse_pid_dxf, parse_pid_pdf, parse_pid_drawing,
+  build_pid_graph_parallel, analyze_pid_impact
+"""
+
+from __future__ import annotations
+import sys
+import os
+
+# 프로젝트 루트를 Python 경로에 추가
+PROJECT_ROOT = os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+sys.path.insert(0, PROJECT_ROOT)
+
+import io
+import json
+import asyncio
+import signal
+import logging
+import re
+from functools import lru_cache
+
+from fastapi import FastAPI, Request, BackgroundTasks
+import uvicorn
+
+# ── 설정 ─────────────────────────────────────────────────────────────────────
+
+VLLM_BASE_URL        = os.environ.get("VLLM_BASE_URL", "http://localhost:8000/v1")
+VLLM_MODEL           = os.environ.get("VLLM_MODEL", "Qwen3.6-27B-FP8")
+DB_CONNECTION_STRING = os.environ.get("DB_CONNECTION_STRING", "postgresql://postgres:postgres@localhost:5432/iiot_platform")
+DB_TIMEOUT           = int(os.environ.get("DB_TIMEOUT", "10"))
+
+_SERVER_DIR = PROJECT_ROOT
+STORAGE_DIR = os.path.join(_SERVER_DIR, "storage")
+
+logging.basicConfig(
+    level=logging.INFO,
+    stream=sys.stderr,
+    format="%(asctime)s [pid_worker] %(levelname)s %(message)s",
+)
+
+app = FastAPI()
+
+# ── 싱글톤 ───────────────────────────────────────────────────────────────────
+
+@lru_cache(maxsize=1)
+def _llm():
+    from openai import OpenAI
+    return OpenAI(base_url=VLLM_BASE_URL, api_key="dummy")
+
+
+@lru_cache(maxsize=1)
+def _ocr():
+    from paddleocr import PaddleOCR
+    use_gpu = os.environ.get("PADDLE_USE_GPU", "true").lower() == "true"
+    try:
+        return PaddleOCR(use_angle_cls=True, lang="korean", use_gpu=use_gpu, show_log=False)
+    except Exception:
+        if use_gpu:
+            os.environ["PADDLE_USE_GPU"] = "false"
+            return _ocr()
+        raise
+
+# ── DB ───────────────────────────────────────────────────────────────────────
+
+def _get_db_connection():
+    import psycopg
+    return psycopg.connect(DB_CONNECTION_STRING, connect_timeout=DB_TIMEOUT)
+
+# ── 텍스트 추출 ──────────────────────────────────────────────────────────────
+
+def _extract_text_from_dxf(filepath: str) -> str:
+    import ezdxf
+    from ezdxf.tools.text import plain_mtext
+    doc = ezdxf.readfile(filepath)
+    msp = doc.modelspace()
+    texts = []
+    for entity in msp:
+        if entity.dxftype() == "TEXT":
+            texts.append(entity.dxf.text)
+        elif entity.dxftype() == "MTEXT":
+            try:
+                plain = plain_mtext(entity.dxf.text)
+                if plain.strip():
+                    texts.append(plain)
+            except Exception:
+                pass
+    return "\n".join(texts)
+
+
+def _extract_text_from_pdf(filepath: str) -> str:
+    import fitz
+    doc = fitz.open(filepath)
+    return "\n".join(page.get_text() for page in doc)
+
+
+def _extract_text_from_pdf_ocr(filepath: str) -> str:
+    import fitz
+    from PIL import Image
+    import numpy as np
+    doc = fitz.open(filepath)
+    all_texts = []
+    for page in doc:
+        mat = fitz.Matrix(300 / 72)
+        pix = page.get_pixmap(matrix=mat)
+        img = Image.open(io.BytesIO(pix.tobytes("png")))
+        result = _ocr().ocr(np.array(img), cls=True)
+        if result and result[0]:
+            all_texts.extend(line[1][0] for line in result[0])
+    return "\n".join(all_texts)
+
+# ── JSON 배열 파싱 유틸 ───────────────────────────────────────────────────────
+
+def _parse_json_array(raw: str, finish_reason: str = "") -> list:
+    """LLM 출력에서 JSON 배열 추출. finish_reason=length 잘림 복구 포함."""
+    if raw.startswith("```"):
+        lines = raw.splitlines()
+        raw = "\n".join(lines[1:-1] if lines and lines[-1].strip() == "```" else lines[1:]).strip()
+
+    if finish_reason == "length":
+        last_close = raw.rfind("}")
+        if last_close != -1:
+            raw = raw[:last_close + 1] + "]"
+
+    # 가장 긴 균형 잡힌 [...] 추출
+    depth = 0; start = -1; best = ""
+    for i, c in enumerate(raw):
+        if c == "[":
+            if depth == 0:
+                start = i
+            depth += 1
+        elif c == "]":
+            depth -= 1
+            if depth == 0 and start >= 0:
+                cand = raw[start:i + 1]
+                if len(cand) > len(best):
+                    best = cand
+    raw = best if best else "[]"
+
+    try:
+        return json.loads(raw)
+    except json.JSONDecodeError:
+        data = []
+        for obj in re.findall(r"\{[^{}]*\}", raw, re.DOTALL):
+            try:
+                data.append(json.loads(obj))
+            except json.JSONDecodeError:
+                pass
+        return data
+
+# ── 태그 추출/매핑 도구 ───────────────────────────────────────────────────────
+
+def _extract_pid_tags(text: str, source_type: str) -> str:
+    system = (
+        "You are a P&ID (Piping and Instrumentation Diagram) expert.\n"
+        "Extract all instrument and equipment tags from the provided text.\n"
+        "Return ONLY a valid JSON array. Each element must have exactly these fields:\n"
+        '{"tagNo":"FCV-101","equipmentName":null,"instrumentType":"FCV",'
+        '"lineNumber":null,"pidDrawingNo":null,"confidence":0.95}\n'
+        "Rules:\n"
+        "- tagNo: any token matching [LETTERS]-[DIGITS] or [LETTERS]-[DIGITS]-[SUFFIX]\n"
+        "  Examples: FCV-101, P-10101, T-10100, VG-6203-15A-F1A-n, BT-6200, DP-10101\n"
+        "- instrumentType: leading letters of tagNo\n"
+        "- equipmentName: descriptive name if present near tag, else null\n"
+        "- lineNumber/pidDrawingNo: null unless explicitly associated\n"
+        "- confidence: 0.95 for clear tags, lower for ambiguous\n"
+        "- Output ONLY the JSON array, no markdown, no explanation.\n"
+        "- If no tags found, return: []\n"
+    )
+    truncated = text[:100000]
+    resp = _llm().chat.completions.create(
+        model="Qwen3.6-27B-FP8",
+        messages=[
+            {"role": "system", "content": system},
+            {"role": "user", "content": f"Source: {source_type}\n\nText:\n{truncated}"},
+        ],
+        max_tokens=32768,
+        temperature=0.1,
+        extra_body={"chat_template_kwargs": {"enable_thinking": False}},
+    )
+    raw = (resp.choices[0].message.content or "").strip()
+    data = _parse_json_array(raw, resp.choices[0].finish_reason)
+    logging.info(f"extract_pid_tags source={source_type} count={len(data)}")
+    return json.dumps({
+        "success": True,
+        "data": {"count": len(data), "tags": data},
+        "message": "태그 추출 완료"
+    }, ensure_ascii=False, indent=2)
+
+
+def _match_pid_tags(pid_tags: list, experion_tags: list) -> str:
+    system = (
+        "You are a P&ID to Experion tag matching expert.\n"
+        "Match P&ID tags to Experion tags based on similarity.\n"
+        "Return ONLY a JSON array:\n"
+        '[{"pidTag":"FT-101","experionTag":"ft-101.pv","confidence":0.92},...]\n'
+        "- If no good match: confidence < 0.5, experionTag null\n"
+        "- Output ONLY the JSON array.\n"
+    )
+    resp = _llm().chat.completions.create(
+        model="Qwen3.6-27B-FP8",
+        messages=[
+            {"role": "system", "content": system},
+            {"role": "user", "content": (
+                f"P&ID Tags:\n{chr(10).join(pid_tags)}\n\n"
+                f"Experion Tags:\n{chr(10).join(experion_tags)}"
+            )},
+        ],
+        max_tokens=16384,
+        temperature=0.1,
+        extra_body={"chat_template_kwargs": {"enable_thinking": False}},
+    )
+    raw = (resp.choices[0].message.content or "").strip()
+    data = _parse_json_array(raw, resp.choices[0].finish_reason)
+    return json.dumps({
+        "success": True,
+        "data": {"count": len(data), "mappings": data},
+        "message": "태그 매핑 완료"
+    }, ensure_ascii=False, indent=2)
+
+# ── 도면 파싱 도구 ────────────────────────────────────────────────────────────
+
+_TAG_EXTRACT_SYSTEM = (
+    "You are a P&ID (Piping and Instrumentation Diagram) expert.\n"
+    "Extract instrument and equipment tags from the provided text.\n"
+    "Return ONLY a JSON array:\n"
+    '[{"tagNo":"FIT-10115","equipmentName":"Flow Transmitter","instrumentType":"FIT",'
+    '"lineNumber":"L-101","pidDrawingNo":"P&ID-001","confidence":0.95},...]\n'
+    "Rules:\n"
+    "- tagNo: Instrument [Function]-[Number], Equipment [Type]-[Number]\n"
+    "- instrumentType: first 2-4 letters of tagNo\n"
+    "- equipmentName/lineNumber/pidDrawingNo: null if not present\n"
+    "- confidence: 0.0 to 1.0\n"
+    "- Output ONLY the JSON array, no markdown.\n"
+    "- If no tags found, return: []\n"
+)
+
+
+def _parse_pid_dxf(filepath: str) -> str:
+    text = _extract_text_from_dxf(filepath)
+    if not text.strip():
+        return json.dumps({"success": True, "text": "", "count": 0, "tags": []},
+                          ensure_ascii=False, indent=2)
+
+    resp = _llm().chat.completions.create(
+        model="Qwen3.6-27B-FP8",
+        messages=[
+            {"role": "system", "content": _TAG_EXTRACT_SYSTEM},
+            {"role": "user", "content": f"Source: dxf\n\nText:\n{text[:8000]}"},
+        ],
+        max_tokens=8192,
+        temperature=0.1,
+    )
+    raw = (resp.choices[0].message.content or "").strip()
+    data = _parse_json_array(raw, resp.choices[0].finish_reason)
+    if not isinstance(data, list):
+        data = []
+    return json.dumps({
+        "success": True,
+        "data": {"text": text[:10000], "count": len(data), "tags": data},
+        "message": "DXF 파싱 완료"
+    }, ensure_ascii=False, indent=2)
+
+
+def _parse_pid_pdf(filepath: str, use_ocr: bool = True) -> str:
+    text = _extract_text_from_pdf_ocr(filepath) if use_ocr else _extract_text_from_pdf(filepath)
+    if not text.strip():
+        return json.dumps({"success": True, "text": "", "count": 0, "tags": []},
+                          ensure_ascii=False, indent=2)
+
+    resp = _llm().chat.completions.create(
+        model="Qwen3.6-27B-FP8",
+        messages=[
+            {"role": "system", "content": _TAG_EXTRACT_SYSTEM},
+            {"role": "user", "content": f"Source: pdf\n\nText:\n{text[:12000]}"},
+        ],
+        max_tokens=4096,
+        temperature=0.1,
+    )
+    raw = (resp.choices[0].message.content or "").strip()
+    data = _parse_json_array(raw, resp.choices[0].finish_reason)
+    if not isinstance(data, list):
+        data = []
+    return json.dumps({
+        "success": True,
+        "data": {"text": text[:10000], "count": len(data), "tags": data},
+        "message": "PDF 파싱 완료"
+    }, ensure_ascii=False, indent=2)
+
+
+def _parse_pid_drawing(filepath: str) -> str:
+    ext = os.path.splitext(filepath)[1].lower()
+    if ext == ".dxf":
+        return _parse_pid_dxf(filepath)
+    elif ext == ".pdf":
+        return _parse_pid_pdf(filepath)
+    elif ext == ".dwg":
+        return json.dumps({
+            "success": False,
+            "data": None,
+            "error": "DWG 파일은 직접 파싱할 수 없습니다. DXF로 변환 후 사용하세요.",
+            "message": "지원하지 않는 파일 형식"
+        }, ensure_ascii=False)
+    else:
+        return json.dumps({
+            "success": False,
+            "error": f"지원하지 않는 형식: {ext}. 지원: .dxf, .pdf",
+        }, ensure_ascii=False)
+
+# ── 그래프 도구 ───────────────────────────────────────────────────────────────
+
+import time
+
+async def _build_pid_graph_parallel(filepath: str) -> str:
+    """
+    P&ID 그래프 빌드 — 독립 프로세스 병렬 아키텍처.
+
+    Phase 1: 도면 분할 + 기하 추출
+    Phase 2: 전체 텍스트 1회 추출
+    Phase 3: 5개 독립 추출 프로세스 병렬 실행 (subprocess.Popen)
+    Phase 4: 결과 통합 + tagNo 기준 중복 제거
+    Phase 5: 위상 그래프 빌드 + 저장
+    """
+    from pipeline.extractor import PidGeometricExtractor
+    from pipeline.topology import PidTopologyBuilder
+
+    import subprocess
+    import tempfile
+    import shutil
+
+    os.makedirs(STORAGE_DIR, exist_ok=True)
+    t0 = time.time()
+    # 절대 경로로 변환하여 파일 경로 문제 해결
+    if not os.path.isabs(filepath):
+        filepath = os.path.join(PROJECT_ROOT, filepath)
+    filepath = os.path.abspath(filepath)
+    basename = os.path.basename(filepath)
+    worker_dir = os.path.join(PROJECT_ROOT, "mcp-server", "worker")
+    logging.info(f"[{basename}] === 독립 프로세스 병렬 아키텍처 시작 ===")
+
+    # ── Phase 1: 도면 분할 + 기하 추출 ──────────────────────────────
+    logging.info(f"[{basename}] Phase 1: 도면 분할 + 기하 추출 시작")
+    extractor = PidGeometricExtractor(filepath)
+    regions = extractor.split_drawings()
+    logging.info(f"[{basename}] 도면 분할: {len(regions)}개 영역")
+
+    geo_data_path = os.path.join(STORAGE_DIR, basename + "_geo.json")
+    extractor.extract_and_save(geo_data_path)
+    with open(geo_data_path, "r", encoding="utf-8") as f:
+        geo_data = json.load(f)
+    logging.info(f"[{basename}] Phase 1 완료 ({time.time()-t0:.1f}s) - {len(geo_data)}개 엔티티")
+
+    # ── Phase 2: 전체 텍스트 1회 추출 ───────────────────────────────
+    t2 = time.time()
+    logging.info(f"[{basename}] Phase 2: 전체 텍스트 1회 추출")
+    full_text = _extract_text_from_dxf(filepath)
+
+    # 임시 디렉토리 생성 (프로세스 간 통신용)
+    temp_dir = tempfile.mkdtemp(prefix=f"pid_{basename.replace('.dxf', '')}_")
+    text_path = os.path.join(temp_dir, "full_text.txt")
+    with open(text_path, "w", encoding="utf-8") as f:
+        f.write(full_text)
+    logging.info(f"[{basename}] Phase 2 완료 ({time.time()-t2:.1f}s) - {len(full_text)}자")
+
+    # ── Phase 3: 5개 독립 추출 프로세스 병렬 실행 ───────────────────
+    t3 = time.time()
+    logging.info(f"[{basename}] Phase 3: 5개 독립 추출 프로세스 병렬 실행")
+
+    extractors = [
+        ("sensor", "pid_extract_sensor.py"),
+        ("valve",  "pid_extract_valve.py"),
+        ("system", "pid_extract_system.py"),
+        ("gauge",  "pid_extract_gauge.py"),
+        ("pump",   "pid_extract_pump.py"),
+    ]
+
+    results_dir = os.path.join(temp_dir, "results")
+    os.makedirs(results_dir, exist_ok=True)
+
+    processes = []
+    for name, script in extractors:
+        output_path = os.path.join(results_dir, f"{name}.json")
+        script_path = os.path.join(worker_dir, script)
+        cmd = [
+            sys.executable, script_path,
+            "--input", text_path,
+            "--output", output_path,
+        ]
+        try:
+            proc = subprocess.Popen(
+                cmd,
+                stdout=subprocess.PIPE,
+                stderr=subprocess.PIPE,
+                text=True,
+            )
+            processes.append((name, proc, output_path))
+            logging.info(f"[{basename}]   시작: {name} (pid={proc.pid})")
+        except Exception as e:
+            logging.error(f"[{basename}]   실행 실패 {name}: {e}")
+
+    # 모든 프로세스 대기 (timeout=300초)
+    for name, proc, output_path in processes:
+        try:
+            stdout, stderr = proc.communicate(timeout=300)
+            if proc.returncode != 0:
+                logging.error(f"[{basename}]   {name} 실패 (rc={proc.returncode}): {stderr[:200]}")
+            else:
+                logging.info(f"[{basename}]   {name} 완료: {stdout.strip()[:100]}")
+        except subprocess.TimeoutExpired:
+            proc.kill()
+            logging.error(f"[{basename}]   {name} 타임아웃 (300초)")
+
+    logging.info(f"[{basename}] Phase 3 완료 ({time.time()-t3:.1f}s)")
+
+    # ── Phase 4: 결과 JSON 통합 + tagNo 기준 중복 제거 ──────────────
+    t4 = time.time()
+    logging.info(f"[{basename}] Phase 4: 결과 통합 + 중복 제거")
+
+    all_tags = []
+    seen_tagnos = set()
+
+    for name, _, output_path in processes:
+        if not os.path.exists(output_path):
+            logging.warning(f"[{basename}]   결과 없음: {name}")
+            continue
+        try:
+            with open(output_path, "r", encoding="utf-8") as f:
+                result = json.load(f)
+            tags = result.get("tags", [])
+            count_new = 0
+            for tag in tags:
+                tag_no = tag.get("tagNo", "")
+                if tag_no and tag_no not in seen_tagnos:
+                    seen_tagnos.add(tag_no)
+                    all_tags.append(tag)
+                    count_new += 1
+            logging.info(f"[{basename}]   {name}: {len(tags)}개 중 {count_new}개 신규")
+        except Exception as e:
+            logging.error(f"[{basename}]   결과 로드 실패 {name}: {e}")
+
+    logging.info(f"[{basename}] Phase 4 완료 ({time.time()-t4:.1f}s) - 총 {len(all_tags)}개 태그")
+
+    # ── Phase 5: 위상 그래프 빌드 + 저장 ────────────────────────────
+    t5 = time.time()
+    logging.info(f"[{basename}] Phase 5: 위상 그래프 빌드")
+
+    builder = PidTopologyBuilder(geo_data)
+    builder.build_graph()
+
+    # 추출된 태그를 그래프에 추가
+    from shapely.geometry import box as shapely_box
+    for tag in all_tags:
+        tag_no = tag.get("tagNo", "UNKNOWN")
+        eq_name = tag.get("equipmentName")
+        inst_type = tag.get("instrumentType")
+        confidence = tag.get("confidence", 0.5)
+
+        # 해당 태그의 bbox 찾기 (geo_data에서 clean_value 매칭)
+        matched_bbox = None
+        for entity in geo_data:
+            if entity.get("clean_value", "").upper() == tag_no.upper():
+                bbox = entity.get("bbox", {})
+                matched_bbox = (
+                    bbox.get("min_x"), bbox.get("min_y"),
+                    bbox.get("max_x"), bbox.get("max_y")
+                )
+                break
+
+        node_id = f"tag_{tag_no}"
+        if matched_bbox:
+            bbox_geom = shapely_box(matched_bbox[0], matched_bbox[1],
+                                     matched_bbox[2], matched_bbox[3])
+            builder.G.add_node(node_id,
+                               type="TEXT",
+                               bbox=bbox_geom,
+                               value=tag_no,
+                               equipment_name=eq_name,
+                               instrument_type=inst_type,
+                               confidence=confidence)
+        else:
+            builder.G.add_node(node_id,
+                               type="TEXT",
+                               bbox=shapely_box(0, 0, 1, 1),
+                               value=tag_no,
+                               equipment_name=eq_name,
+                               instrument_type=inst_type,
+                               confidence=confidence)
+
+    # 태그-설비 연결
+    equipments = [n for n, d in builder.G.nodes(data=True)
+                  if d.get("type") not in ("TEXT", "LINE", "LWPOLYLINE")]
+    if equipments:
+        eq_grid = builder._build_spatial_grid(equipments)
+        tag_ids = [f"tag_{t.get('tagNo', '')}" for t in all_tags]
+        for tag_id in tag_ids:
+            if tag_id in builder.G:
+                best_match = builder._find_nearest_equipment(tag_id, eq_grid)
+                if best_match:
+                    builder.G.add_edge(tag_id, best_match, relation="associated_with")
+
+    graph_id = basename.replace(".dxf", "_graph.json")
+    graph_path = os.path.join(STORAGE_DIR, graph_id)
+    builder.save_graph(graph_path)
+
+    # 임시 디렉토리 정리
+    shutil.rmtree(temp_dir, ignore_errors=True)
+
+    total_time = time.time() - t0
+    logging.info(f"[{basename}] 전체 완료 ({total_time:.1f}s) - graph_id={graph_id} "
+                 f"nodes={builder.G.number_of_nodes()} "
+                 f"edges={builder.G.number_of_edges()} "
+                 f"tags={len(all_tags)}")
+    return json.dumps({
+        "success": True,
+        "graph_id": graph_id,
+        "graph_path": graph_path,
+        "nodes": builder.G.number_of_nodes(),
+        "edges": builder.G.number_of_edges(),
+        "tags_extracted": len(all_tags),
+        "processing_time_sec": round(total_time, 1)
+    }, ensure_ascii=False)
+
+
+def _analyze_pid_impact(graph_id: str, start_node_id: str) -> str:
+    from pipeline.analyzer import PidAnalysisEngine
+
+    graph_path = os.path.join(STORAGE_DIR, graph_id)
+    mapping_path = graph_path.replace("_graph.json", "_mapping.json")
+    analyzer = PidAnalysisEngine(graph_path, mapping_path)
+    result = analyzer.analyze_impact(start_node_id)
+    return json.dumps(result, ensure_ascii=False, indent=2)
+
+# ── 요청 디스패처 ─────────────────────────────────────────────────────────────
+
+async def _dispatch(tool: str, params: dict) -> str:
+    try:
+        match tool:
+            # blocking 함수는 asyncio.to_thread로 스레드풀 오프로드
+            case "extract_pid_tags":
+                return await asyncio.to_thread(_extract_pid_tags, **params)
+            case "match_pid_tags":
+                return await asyncio.to_thread(_match_pid_tags, **params)
+            case "parse_pid_dxf":
+                return await asyncio.to_thread(_parse_pid_dxf, **params)
+            case "parse_pid_pdf":
+                return await asyncio.to_thread(_parse_pid_pdf, **params)
+            case "parse_pid_drawing":
+                return await asyncio.to_thread(_parse_pid_drawing, **params)
+            case "analyze_pid_impact":
+                return await asyncio.to_thread(_analyze_pid_impact, **params)
+            # 이미 async — 직접 await
+            case "build_pid_graph_parallel":
+                return await _build_pid_graph_parallel(**params)
+            case _:
+                return json.dumps({"success": False, "error": f"알 수 없는 도구: {tool}"},
+                                  ensure_ascii=False)
+    except Exception as e:
+        logging.error(f"dispatch error tool={tool}: {e}", exc_info=True)
+        return json.dumps({"success": False, "error": str(e)}, ensure_ascii=False)
+
+# ── 종료 예약 ─────────────────────────────────────────────────────────────────
+
+def _schedule_shutdown():
+    """
+    응답 전송 완료 후 프로세스 종료 예약.
+    FastAPI의 BackgroundTasks를 사용하여 응답이 완전히 전송된 후 종료되도록 유도함.
+    """
+    async def _do():
+        # 네트워크 전송 및 커넥션 정리를 위한 최소한의 대기 시간
+        await asyncio.sleep(1.0)
+        logging.info("One-shot worker shutting down...")
+        os.kill(os.getpid(), signal.SIGTERM)
+    asyncio.create_task(_do())
+
+# ── HTTP 엔드포인트 ───────────────────────────────────────────────────────────
+
+@app.get("/health")
+async def health():
+    return {"status": "ok"}
+
+
+@app.post("/execute")
+async def execute(request: Request):
+    body = await request.json()
+    return await _dispatch(body["tool"], body["params"])
+
+
+@app.post("/execute/one_shot")
+async def execute_one_shot(request: Request, background_tasks: BackgroundTasks):
+    """요청 처리 후 프로세스 자동 종료 (P&ID 워커 전용)."""
+    body = await request.json()
+    result = await _dispatch(body["tool"], body["params"])
+    
+    # BackgroundTasks에 등록하여 응답 전송이 완료된 후 _schedule_shutdown이 실행되도록 함
+    background_tasks.add_task(_schedule_shutdown)
+    
+    return result
+
+# ── 진입점 ───────────────────────────────────────────────────────────────────
+
+if __name__ == "__main__":
+    port = int(sys.argv[1]) if len(sys.argv) > 1 else 5005
+    os.makedirs(STORAGE_DIR, exist_ok=True)
+    uvicorn.run(app, host="0.0.0.0", port=port, log_level="warning")
--- a/mcp-server/worker/rag_worker.py
+++ b/mcp-server/worker/rag_worker.py
@@ -105,7 +105,7 @@ async def _ask_llm(question: str, context: str = "") -> str:
        prompt = question
    
    response = await client.chat.completions.create(
-        model=VLLM_MODEL,
+        model="Qwen3.6-27B-FP8",
        messages=[
            {"role": "system", "content": "You are a helpful assistant."},
            {"role": "user", "content": prompt},