Initial Commit

This commit is contained in:
kyy
2025-03-18 04:34:57 +00:00
commit a4981faeef
60 changed files with 2160 additions and 0 deletions

5
.dockerignore Normal file

@@ -0,0 +1,5 @@
__pycache__/
*.pyc
*.pyo
*.pyd
projects/

32
Dockerfile Normal file

@@ -0,0 +1,32 @@
# Base stage: Install common dependencies
FROM python:3.10-slim AS base
# Set working directory and environment variables
WORKDIR /usr/src/app
ENV PYTHONUNBUFFERED=1 \
PYTHONDONTWRITEBYTECODE=1 \
PIP_NO_CACHE_DIR=1
# Copy dependency manifests first to leverage the Docker build cache
COPY pyproject.toml requirements.txt ./
# Install system and Python dependencies in a single layer
RUN apt-get update && \
apt-get install -y --no-install-recommends \
build-essential \
gcc \
libssl-dev && \
pip install --no-cache-dir --upgrade pip setuptools setuptools-scm && \
rm -rf /var/lib/apt/lists/*
# Copy project files
COPY autorag /usr/src/app/autorag
COPY dashboard.sh /usr/src/app/dashboard.sh
# Install base project
RUN pip install -r requirements.txt
# Set permissions for dashboard script
RUN chmod +x /usr/src/app/dashboard.sh
CMD ["bash", "dashboard.sh"]

70
README.md Normal file

@@ -0,0 +1,70 @@
# 📊 AutoRAG Dashboard
The AutoRAG Dashboard is a web-based dashboard for visualizing and analyzing experiment results.
---
## **🚀 Key Features**
### ✅ **1. Experiment Result Summary**
- **Automatically analyzes the experiment folder (`trial_dir`)** and summarizes the experiment results.
- Automatically selects the best-performing module based on `summary.csv`.
- Renders the configuration file used in the experiment (`config.yaml`) as Markdown.
### ✅ **2. Performance Comparison Across Experiments**
- Provides strip plots and box plots so you can **visually compare the score distribution of each module**.
- These comparisons make the experiment results easier to interpret at a glance.
### ✅ **3. Individual Query Inspection**
- Click the `detail` button to see detailed information for each query.
---
## **📥 Installation and Usage**
### **1. Run in a Docker Container (Recommended)**
The AutoRAG Dashboard is easiest to run in a Docker environment.
```bash
# 1. Build the Docker image
docker compose build
# 2. Start the AutoRAG Dashboard
docker compose up
```
Open [http://localhost:7690](http://localhost:7690) in your browser to view the dashboard.
---
## **📂 Project Structure**
```bash
.
├── autorag
│   ├── cli.py           # CLI for launching the dashboard
│   ├── dashboard.py     # Main dashboard logic
│   ├── schema/
│   ├── utils/
│   ├── VERSION
├── dashboard.sh         # Startup script run inside the Docker container
├── docker-compose.yml   # Docker Compose configuration
├── Dockerfile           # Docker build file
├── pyproject.toml       # Python package configuration
├── requirements.txt     # Required package list
└── projects/            # Experiment result storage (volume mounted)
```
---
## **📌 Additional Configuration**
### **📍 Changing the Port**
The dashboard runs on **port 7690** by default.
To change it, edit the following entry in `docker-compose.yml`:
```yaml
ports:
  - "7690:7690" # change to the port you want
```
### **📍 Changing the Experiment Data Path**
The default location of the experiment result folder (`trial_dir`) is `./projects/benchmark_sample`.
To use a different folder, adjust the `--trial_dir` option at launch:
```bash
python3 -m autorag.cli dashboard --trial_dir ./projects/custom_experiment
```

1
autorag/VERSION Normal file

@@ -0,0 +1 @@
0.3.14

113
autorag/__init__.py Normal file

@@ -0,0 +1,113 @@
import logging
import logging.config
import os
import sys
from typing import List, Any
from llama_index.core.embeddings.mock_embed_model import MockEmbedding
from llama_index.core.base.llms.types import CompletionResponse
from llama_index.core.llms.mock import MockLLM
from llama_index.llms.bedrock import Bedrock
from llama_index.embeddings.openai import OpenAIEmbedding
from llama_index.embeddings.openai import OpenAIEmbeddingModelType
from llama_index.llms.openai import OpenAI
from llama_index.llms.openai_like import OpenAILike
from langchain_openai.embeddings import OpenAIEmbeddings
from rich.logging import RichHandler
from llama_index.llms.ollama import Ollama
version_path = os.path.join(os.path.dirname(os.path.realpath(__file__)), "VERSION")
with open(version_path, "r") as f:
__version__ = f.read().strip()
class LazyInit:
def __init__(self, factory, *args, **kwargs):
self._factory = factory
self._args = args
self._kwargs = kwargs
self._instance = None
def __call__(self):
if self._instance is None:
self._instance = self._factory(*self._args, **self._kwargs)
return self._instance
def __getattr__(self, name):
if self._instance is None:
self._instance = self._factory(*self._args, **self._kwargs)
return getattr(self._instance, name)
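# A minimal usage sketch for LazyInit (illustrative only; MockLLM and its
# max_tokens argument are just convenient stand-ins from the imports above):
#
#     lazy_llm = LazyInit(MockLLM, max_tokens=256)
#     llm = lazy_llm()           # the first call constructs the MockLLM instance
#     _ = lazy_llm.max_tokens    # attribute access also triggers construction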
rich_format = "[%(filename)s:%(lineno)s] >> %(message)s"
logging.basicConfig(
level="INFO", format=rich_format, handlers=[RichHandler(rich_tracebacks=True)]
)
logger = logging.getLogger("AutoRAG")
def handle_exception(exc_type, exc_value, exc_traceback):
logger = logging.getLogger("AutoRAG")
logger.error("Unexpected exception", exc_info=(exc_type, exc_value, exc_traceback))
sys.excepthook = handle_exception
class AutoRAGBedrock(Bedrock):
async def acomplete(
self, prompt: str, formatted: bool = False, **kwargs: Any
) -> CompletionResponse:
return self.complete(prompt, formatted=formatted, **kwargs)
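# Descriptive note: the wrapper above makes acomplete fall back to the
# synchronous complete() call, presumably because the underlying Bedrock
# client does not provide a usable async completion path.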
generator_models = {
"openai": OpenAI,
"openailike": OpenAILike,
"mock": MockLLM,
"bedrock": AutoRAGBedrock,
"ollama": Ollama,
}
# embedding_models = {
# }
try:
    from llama_index.llms.huggingface import HuggingFaceLLM
    generator_models["huggingfacellm"] = HuggingFaceLLM
except ImportError:
    logger.info(
        "You are using the API version of AutoRAG. "
        "To use the local version, run pip install 'AutoRAG[gpu]'"
    )
# try:
# from llama_index.embeddings.huggingface import HuggingFaceEmbedding
# embedding_models["hf_all_mpnet_base_v2"] = HuggingFaceEmbedding # 250312 변경 - 김용연
# embedding_models["hf_KURE-v1"] = HuggingFaceEmbedding # 250312 변경 - 김용연
# embedding_models["hf_snowflake-arctic-embed-l-v2.0-ko"] = HuggingFaceEmbedding # 250313 변경 - 김용연
# except ImportError:
# logger.info(
# "You are using API version of AutoRAG."
# "To use local version, run pip install 'AutoRAG[gpu]'"
# )
try:
import transformers
transformers.logging.set_verbosity_error()
except ImportError:
logger.info(
"You are using API version of AutoRAG."
"To use local version, run pip install 'AutoRAG[gpu]'"
)

40
autorag/cli.py Normal file

@@ -0,0 +1,40 @@
import logging
import os
import click
from autorag import dashboard
logger = logging.getLogger("AutoRAG")
autorag_dir = os.path.dirname(os.path.realpath(__file__))
version_file = os.path.join(autorag_dir, "VERSION")
with open(version_file, "r") as f:
__version__ = f.read().strip()
@click.group()
@click.version_option(__version__)
def cli():
pass
@click.command()
@click.option(
"--trial_dir",
type=click.Path(dir_okay=True, file_okay=False, exists=True),
required=True,
)
@click.option(
"--port", type=int, default=7690, help="Port number. The default is 7690."
)
def run_dashboard(trial_dir: str, port: int):
"""Runs the AutoRAG Dashboard."""
logger.info(f"Starting AutoRAG Dashboard on port {port}...")
dashboard.run(trial_dir, port=port)
cli.add_command(run_dashboard, "dashboard")
if __name__ == "__main__":
cli()

215
autorag/dashboard.py Normal file

@@ -0,0 +1,215 @@
import ast
import logging
import os
from typing import Dict, List
import matplotlib.pyplot as plt
import pandas as pd
import panel as pn
import seaborn as sns
import yaml
from bokeh.models import NumberFormatter, BooleanFormatter
from autorag.utils.util import dict_to_markdown, dict_to_markdown_table
pn.extension(
"terminal",
"tabulator",
"mathjax",
"ipywidgets",
console_output="disable",
sizing_mode="stretch_width",
css_files=[
"https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.2/css/all.min.css"
],
)
logger = logging.getLogger("AutoRAG")
def find_node_dir(trial_dir: str) -> List[str]:
trial_summary_df = pd.read_csv(os.path.join(trial_dir, "summary.csv"))
result_paths = []
for idx, row in trial_summary_df.iterrows():
node_line_name = row["node_line_name"]
node_type = row["node_type"]
result_paths.append(os.path.join(trial_dir, node_line_name, node_type))
return result_paths
def get_metric_values(node_summary_df: pd.DataFrame) -> Dict:
non_metric_column_names = [
"filename",
"module_name",
"module_params",
"execution_time",
"average_output_token",
"is_best",
]
best_row = node_summary_df.loc[node_summary_df["is_best"]].drop(
columns=non_metric_column_names, errors="ignore"
)
    assert len(best_row) == 1, "There must be exactly one best module."
return best_row.iloc[0].to_dict()
def make_trial_summary_md(trial_dir):
markdown_text = f"""# Trial Result Summary
- Trial Directory : {trial_dir}
"""
node_dirs = find_node_dir(trial_dir)
for node_dir in node_dirs:
node_summary_filepath = os.path.join(node_dir, "summary.csv")
node_type = os.path.basename(node_dir)
node_summary_df = pd.read_csv(node_summary_filepath)
best_row = node_summary_df.loc[node_summary_df["is_best"]].iloc[0]
metric_dict = get_metric_values(node_summary_df)
markdown_text += f"""---
## {node_type} best module
### Module Name
{best_row['module_name']}
### Module Params
{dict_to_markdown(ast.literal_eval(best_row['module_params']), level=3)}
### Metric Values
{dict_to_markdown_table(metric_dict, key_column_name='metric_name', value_column_name='metric_value')}
"""
return markdown_text
def node_view(node_dir: str):
non_metric_column_names = [
"filename",
"module_name",
"module_params",
"execution_time",
"average_output_token",
"is_best",
]
summary_df = pd.read_csv(os.path.join(node_dir, "summary.csv"))
bokeh_formatters = {
"float": NumberFormatter(format="0.000"),
"bool": BooleanFormatter(),
}
first_df = pd.read_parquet(os.path.join(node_dir, "0.parquet"), engine="pyarrow")
each_module_df_widget = pn.widgets.Tabulator(
pd.DataFrame(columns=first_df.columns),
name="Module DataFrame",
formatters=bokeh_formatters,
pagination="local",
page_size=20,
widths=150,
)
def change_module_widget(event):
if event.column == "detail":
filename = summary_df["filename"].iloc[event.row]
filepath = os.path.join(node_dir, filename)
each_module_df = pd.read_parquet(filepath, engine="pyarrow")
each_module_df_widget.value = each_module_df
df_widget = pn.widgets.Tabulator(
summary_df,
name="Summary DataFrame",
formatters=bokeh_formatters,
buttons={"detail": '<i class="fa fa-eye"></i>'},
widths=150,
)
df_widget.on_click(change_module_widget)
try:
fig, ax = plt.subplots(figsize=(10, 5))
metric_df = summary_df.drop(columns=non_metric_column_names, errors="ignore")
sns.stripplot(data=metric_df, ax=ax)
strip_plot_pane = pn.pane.Matplotlib(fig, tight=True)
fig2, ax2 = plt.subplots(figsize=(10, 5))
sns.boxplot(data=metric_df, ax=ax2)
box_plot_pane = pn.pane.Matplotlib(fig2, tight=True)
plot_pane = pn.Row(strip_plot_pane, box_plot_pane)
layout = pn.Column(
"## Summary distribution plot",
plot_pane,
"## Summary DataFrame",
df_widget,
"## Module Result DataFrame",
each_module_df_widget,
)
except Exception as e:
logger.error(f"Skipping make boxplot and stripplot with error {e}")
layout = pn.Column("## Summary DataFrame", df_widget)
layout.servable()
return layout
CSS = """
div.card-margin:nth-child(1) {
max-height: 300px;
}
div.card-margin:nth-child(2) {
max-height: 400px;
}
"""
def yaml_to_markdown(yaml_filepath):
markdown_content = ""
with open(yaml_filepath, "r", encoding="utf-8") as file:
try:
content = yaml.safe_load(file)
markdown_content += f"## {os.path.basename(yaml_filepath)}\n```yaml\n{yaml.safe_dump(content, allow_unicode=True)}\n```\n\n"
except yaml.YAMLError as exc:
            logger.error(f"Error in {yaml_filepath}: {exc}")
return markdown_content
def run(trial_dir: str, port: int = 7690):
trial_summary_md = make_trial_summary_md(trial_dir=trial_dir)
trial_summary_tab = pn.pane.Markdown(trial_summary_md, sizing_mode="stretch_width")
node_views = [
(str(os.path.basename(node_dir)), pn.bind(node_view, node_dir))
for node_dir in find_node_dir(trial_dir)
]
"""
수정 전
node_views = [
(str(os.path.basename(node_dir)), node_view(node_dir))
for node_dir in find_node_dir(trial_dir)
]
"""
yaml_file_markdown = yaml_to_markdown(os.path.join(trial_dir, "config.yaml"))
yaml_file = pn.pane.Markdown(yaml_file_markdown, sizing_mode="stretch_width")
tabs = pn.Tabs(
("Summary", trial_summary_tab),
*node_views,
("Used YAML file", yaml_file),
dynamic=True,
)
    '''
    Before the fix:
    template = pn.template.FastListTemplate(
        site="AutoRAG", title="Dashboard", main=[tabs], raw_css=[CSS]
    ).servable()
    template.show(port=port)
    '''
if CSS not in pn.config.raw_css:
pn.config.raw_css.append(CSS)
template = pn.template.FastListTemplate(
site="AutoRAG", title="Dashboard", main=[tabs]
).servable()
pn.serve(template, port=port, show=False)

3
autorag/schema/__init__.py Normal file

@@ -0,0 +1,3 @@
from .module import Module
from .node import Node
from .base import BaseModule

Binary file not shown.

Binary file not shown.

Binary file not shown.

Binary file not shown.

Binary file not shown.

35
autorag/schema/base.py Normal file

@@ -0,0 +1,35 @@
from abc import ABCMeta, abstractmethod
from pathlib import Path
from typing import Union
import pandas as pd
class BaseModule(metaclass=ABCMeta):
@abstractmethod
def pure(self, previous_result: pd.DataFrame, *args, **kwargs):
pass
@abstractmethod
def _pure(self, *args, **kwargs):
pass
@classmethod
def run_evaluator(
cls,
project_dir: Union[str, Path],
previous_result: pd.DataFrame,
*args,
**kwargs,
):
instance = cls(project_dir, *args, **kwargs)
result = instance.pure(previous_result, *args, **kwargs)
del instance
return result
@abstractmethod
def cast_to_run(self, previous_result: pd.DataFrame, *args, **kwargs):
"""
This function is for cast function (a.k.a decorator) only for pure function in the whole node.
"""
pass

99
autorag/schema/metricinput.py Normal file

@@ -0,0 +1,99 @@
from dataclasses import dataclass
from typing import Optional, List, Dict, Callable, Any, Union
import numpy as np
import pandas as pd
@dataclass
class MetricInput:
query: Optional[str] = None
queries: Optional[List[str]] = None
retrieval_gt_contents: Optional[List[List[str]]] = None
retrieved_contents: Optional[List[str]] = None
retrieval_gt: Optional[List[List[str]]] = None
retrieved_ids: Optional[List[str]] = None
prompt: Optional[str] = None
generated_texts: Optional[str] = None
generation_gt: Optional[List[str]] = None
generated_log_probs: Optional[List[float]] = None
def is_fields_notnone(self, fields_to_check: List[str]) -> bool:
for field in fields_to_check:
actual_value = getattr(self, field)
if actual_value is None:
return False
try:
if not type_checks.get(type(actual_value), lambda _: False)(
actual_value
):
return False
except Exception:
return False
return True
@classmethod
def from_dataframe(cls, qa_data: pd.DataFrame) -> List["MetricInput"]:
"""
Convert a pandas DataFrame into a list of MetricInput instances.
qa_data: pd.DataFrame: qa_data DataFrame containing metric data.
:returns: List[MetricInput]: List of MetricInput objects created from DataFrame rows.
"""
instances = []
for _, row in qa_data.iterrows():
instance = cls()
for attr_name in cls.__annotations__:
if attr_name in row:
value = row[attr_name]
if isinstance(value, str):
setattr(
instance,
attr_name,
value.strip() if value.strip() != "" else None,
)
elif isinstance(value, list):
setattr(instance, attr_name, value if len(value) > 0 else None)
else:
setattr(instance, attr_name, value)
instances.append(instance)
return instances
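    # Illustrative usage sketch (assumes the DataFrame columns match the
    # dataclass field names above):
    #
    #     df = pd.DataFrame({"query": ["q1"], "generation_gt": [["a1"]]})
    #     inputs = MetricInput.from_dataframe(df)
    #     inputs[0].is_fields_notnone(["query", "generation_gt"])  # -> True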
@staticmethod
def _check_list(lst_or_arr: Union[List[Any], np.ndarray]) -> bool:
if isinstance(lst_or_arr, np.ndarray):
lst_or_arr = lst_or_arr.flatten().tolist()
if len(lst_or_arr) == 0:
return False
for item in lst_or_arr:
if item is None:
return False
item_type = type(item)
if item_type in type_checks:
if not type_checks[item_type](item):
return False
else:
return False
return True
type_checks: Dict[type, Callable[[Any], bool]] = {
str: lambda x: len(x.strip()) > 0,
list: MetricInput._check_list,
np.ndarray: MetricInput._check_list,
int: lambda _: True,
float: lambda _: True,
}

24
autorag/schema/module.py Normal file

@@ -0,0 +1,24 @@
from copy import deepcopy
from dataclasses import dataclass, field
from typing import Callable, Dict
from autorag.support import get_support_modules
@dataclass
class Module:
module_type: str
module_param: Dict
module: Callable = field(init=False)
def __post_init__(self):
self.module = get_support_modules(self.module_type)
if self.module is None:
raise ValueError(f"Module type {self.module_type} is not supported.")
@classmethod
def from_dict(cls, module_dict: Dict) -> "Module":
_module_dict = deepcopy(module_dict)
module_type = _module_dict.pop("module_type")
module_params = _module_dict
return cls(module_type, module_params)
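# Illustrative sketch: every key except "module_type" becomes part of
# module_param, and the module type must be registered in autorag.support.
#
#     module = Module.from_dict({"module_type": "bm25", "bm25_tokenizer": "ko_kiwi"})
#     module.module_param  # -> {"bm25_tokenizer": "ko_kiwi"}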

143
autorag/schema/node.py Normal file

@@ -0,0 +1,143 @@
import itertools
import logging
from copy import deepcopy
from dataclasses import dataclass, field
from typing import Dict, List, Callable, Tuple, Any
import pandas as pd
from autorag.schema.module import Module
from autorag.support import get_support_nodes
from autorag.utils.util import make_combinations, explode, find_key_values
logger = logging.getLogger("AutoRAG")
@dataclass
class Node:
node_type: str
strategy: Dict
node_params: Dict
modules: List[Module]
run_node: Callable = field(init=False)
def __post_init__(self):
self.run_node = get_support_nodes(self.node_type)
if self.run_node is None:
raise ValueError(f"Node type {self.node_type} is not supported.")
def get_param_combinations(self) -> Tuple[List[Callable], List[Dict]]:
"""
This method returns a combination of module and node parameters, also corresponding modules.
:return: Each module and its module parameters.
:rtype: Tuple[List[Callable], List[Dict]]
"""
def make_single_combination(module: Module) -> List[Dict]:
input_dict = {**self.node_params, **module.module_param}
return make_combinations(input_dict)
combinations = list(map(make_single_combination, self.modules))
module_list, combination_list = explode(self.modules, combinations)
return list(map(lambda x: x.module, module_list)), combination_list
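    # Illustrative expansion sketch: with node_params {"top_k": [5, 10]} and a
    # module whose module_param is {"bm25_tokenizer": ["ko_kiwi", "ko_okt"]},
    # get_param_combinations yields the four cartesian-product dicts and repeats
    # the module callable once per generated dict.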
@classmethod
def from_dict(cls, node_dict: Dict) -> "Node":
_node_dict = deepcopy(node_dict)
node_type = _node_dict.pop("node_type")
strategy = _node_dict.pop("strategy")
modules = list(map(lambda x: Module.from_dict(x), _node_dict.pop("modules")))
node_params = _node_dict
return cls(node_type, strategy, node_params, modules)
def run(self, previous_result: pd.DataFrame, node_line_dir: str) -> pd.DataFrame:
logger.info(f"Running node {self.node_type}...")
input_modules, input_params = self.get_param_combinations()
return self.run_node(
modules=input_modules,
module_params=input_params,
previous_result=previous_result,
node_line_dir=node_line_dir,
strategies=self.strategy,
)
def extract_values(node: Node, key: str) -> List[str]:
"""
This function extract values from node's modules' module_param.
:param node: The node you want to extract values from.
:param key: The key of module_param that you want to extract.
:return: The list of extracted values.
It removes duplicated elements automatically.
"""
def extract_module_values(module: Module):
if key not in module.module_param:
return []
value = module.module_param[key]
if isinstance(value, str) or isinstance(value, int):
return [value]
elif isinstance(value, list):
return value
else:
raise ValueError(f"{key} must be str,list or int, but got {type(value)}")
values = list(map(extract_module_values, node.modules))
return list(set(list(itertools.chain.from_iterable(values))))
def extract_values_from_nodes(nodes: List[Node], key: str) -> List[str]:
"""
This function extract values from nodes' modules' module_param.
:param nodes: The nodes you want to extract values from.
:param key: The key of module_param that you want to extract.
:return: The list of extracted values.
It removes duplicated elements automatically.
"""
values = list(map(lambda node: extract_values(node, key), nodes))
return list(set(list(itertools.chain.from_iterable(values))))
def extract_values_from_nodes_strategy(nodes: List[Node], key: str) -> List[Any]:
"""
This function extract values from nodes' strategy.
:param nodes: The nodes you want to extract values from.
:param key: The key string that you want to extract.
:return: The list of extracted values.
It removes duplicated elements automatically.
"""
values = []
for node in nodes:
value_list = find_key_values(node.strategy, key)
if value_list:
values.extend(value_list)
return values
def module_type_exists(nodes: List[Node], module_type: str) -> bool:
"""
This function check if the module type exists in the nodes.
:param nodes: The nodes you want to check.
:param module_type: The module type you want to check.
:return: True if the module type exists in the nodes.
"""
    return any(
        any(module.module_type == module_type for module in node.modules)
        for node in nodes
    )

8
autorag/utils/__init__.py Normal file

@@ -0,0 +1,8 @@
from .preprocess import (
validate_qa_dataset,
validate_corpus_dataset,
cast_qa_dataset,
cast_corpus_dataset,
validate_qa_from_corpus_dataset,
)
from .util import fetch_contents, result_to_dataframe, sort_by_scores

Binary file not shown.

Binary file not shown.

Binary file not shown.

149
autorag/utils/preprocess.py Normal file

@@ -0,0 +1,149 @@
from datetime import datetime
import numpy as np
import pandas as pd
from autorag.utils.util import preprocess_text
def validate_qa_dataset(df: pd.DataFrame):
columns = ["qid", "query", "retrieval_gt", "generation_gt"]
assert set(columns).issubset(
df.columns
), f"df must have columns {columns}, but got {df.columns}"
def validate_corpus_dataset(df: pd.DataFrame):
columns = ["doc_id", "contents", "metadata"]
assert set(columns).issubset(
df.columns
), f"df must have columns {columns}, but got {df.columns}"
def cast_qa_dataset(df: pd.DataFrame):
def cast_retrieval_gt(gt):
if isinstance(gt, str):
return [[gt]]
elif isinstance(gt, list):
if isinstance(gt[0], str):
return [gt]
elif isinstance(gt[0], list):
return gt
elif isinstance(gt[0], np.ndarray):
return cast_retrieval_gt(list(map(lambda x: x.tolist(), gt)))
else:
raise ValueError(
f"retrieval_gt must be str or list, but got {type(gt[0])}"
)
elif isinstance(gt, np.ndarray):
return cast_retrieval_gt(gt.tolist())
else:
raise ValueError(f"retrieval_gt must be str or list, but got {type(gt)}")
def cast_generation_gt(gt):
if isinstance(gt, str):
return [gt]
elif isinstance(gt, list):
return gt
elif isinstance(gt, np.ndarray):
return cast_generation_gt(gt.tolist())
else:
raise ValueError(f"generation_gt must be str or list, but got {type(gt)}")
df = df.reset_index(drop=True)
validate_qa_dataset(df)
assert df["qid"].apply(lambda x: isinstance(x, str)).sum() == len(
df
), "qid must be string type."
assert df["query"].apply(lambda x: isinstance(x, str)).sum() == len(
df
), "query must be string type."
df["retrieval_gt"] = df["retrieval_gt"].apply(cast_retrieval_gt)
df["generation_gt"] = df["generation_gt"].apply(cast_generation_gt)
df["query"] = df["query"].apply(preprocess_text)
df["generation_gt"] = df["generation_gt"].apply(
lambda x: list(map(preprocess_text, x))
)
return df
def cast_corpus_dataset(df: pd.DataFrame):
df = df.reset_index(drop=True)
validate_corpus_dataset(df)
# drop rows that have empty contents
df = df[~df["contents"].apply(lambda x: x is None or x.isspace())]
def make_datetime_metadata(x):
if x is None or x == {}:
return {"last_modified_datetime": datetime.now()}
elif x.get("last_modified_datetime") is None:
return {**x, "last_modified_datetime": datetime.now()}
else:
return x
df["metadata"] = df["metadata"].apply(make_datetime_metadata)
    # check that every metadata dict has a datetime key
assert sum(
df["metadata"].apply(lambda x: x.get("last_modified_datetime") is not None)
) == len(df), "Every metadata must have a datetime key."
def make_prev_next_id_metadata(x, id_type: str):
if x is None or x == {}:
return {id_type: None}
elif x.get(id_type) is None:
return {**x, id_type: None}
else:
return x
df["metadata"] = df["metadata"].apply(
lambda x: make_prev_next_id_metadata(x, "prev_id")
)
df["metadata"] = df["metadata"].apply(
lambda x: make_prev_next_id_metadata(x, "next_id")
)
df["contents"] = df["contents"].apply(preprocess_text)
def normalize_unicode_metadata(metadata: dict):
result = {}
for key, value in metadata.items():
if isinstance(value, str):
result[key] = preprocess_text(value)
else:
result[key] = value
return result
df["metadata"] = df["metadata"].apply(normalize_unicode_metadata)
    # check that every metadata dict has prev_id and next_id keys
assert all(
"prev_id" in metadata for metadata in df["metadata"]
), "Every metadata must have a prev_id key."
assert all(
"next_id" in metadata for metadata in df["metadata"]
), "Every metadata must have a next_id key."
return df
def validate_qa_from_corpus_dataset(qa_df: pd.DataFrame, corpus_df: pd.DataFrame):
qa_ids = []
for retrieval_gt in qa_df["retrieval_gt"].tolist():
if isinstance(retrieval_gt, list) and (
retrieval_gt[0] != [] or any(bool(g) is True for g in retrieval_gt)
):
for gt in retrieval_gt:
qa_ids.extend(gt)
elif isinstance(retrieval_gt, np.ndarray) and retrieval_gt[0].size > 0:
for gt in retrieval_gt:
qa_ids.extend(gt)
no_exist_ids = list(
filter(lambda qa_id: corpus_df[corpus_df["doc_id"] == qa_id].empty, qa_ids)
)
assert (
len(no_exist_ids) == 0
), f"{len(no_exist_ids)} doc_ids in retrieval_gt do not exist in corpus_df."

751
autorag/utils/util.py Normal file

@@ -0,0 +1,751 @@
import ast
import asyncio
import datetime
import functools
import glob
import inspect
import itertools
import json
import logging
import os
import re
import string
from copy import deepcopy
from json import JSONDecoder
from typing import List, Callable, Dict, Optional, Any, Collection, Iterable
from asyncio import AbstractEventLoop
import emoji
import numpy as np
import pandas as pd
import tiktoken
import unicodedata
import yaml
from llama_index.embeddings.openai import OpenAIEmbedding
from pydantic import BaseModel as BM
from pydantic.v1 import BaseModel
logger = logging.getLogger("AutoRAG")
def fetch_contents(
corpus_data: pd.DataFrame, ids: List[List[str]], column_name: str = "contents"
) -> List[List[Any]]:
def fetch_contents_pure(
ids: List[str], corpus_data: pd.DataFrame, column_name: str
):
return list(map(lambda x: fetch_one_content(corpus_data, x, column_name), ids))
result = flatten_apply(
fetch_contents_pure, ids, corpus_data=corpus_data, column_name=column_name
)
return result
def fetch_one_content(
corpus_data: pd.DataFrame,
id_: str,
column_name: str = "contents",
id_column_name: str = "doc_id",
) -> Any:
if isinstance(id_, str):
if id_ in ["", ""]:
return None
fetch_result = corpus_data[corpus_data[id_column_name] == id_]
if fetch_result.empty:
raise ValueError(f"doc_id: {id_} not found in corpus_data.")
else:
return fetch_result[column_name].iloc[0]
else:
return None
def result_to_dataframe(column_names: List[str]):
"""
Decorator for converting results to pd.DataFrame.
"""
def decorator_result_to_dataframe(func: Callable):
@functools.wraps(func)
def wrapper(*args, **kwargs) -> pd.DataFrame:
results = func(*args, **kwargs)
if len(column_names) == 1:
df_input = {column_names[0]: results}
else:
df_input = {
column_name: result
for result, column_name in zip(results, column_names)
}
result_df = pd.DataFrame(df_input)
return result_df
return wrapper
return decorator_result_to_dataframe
def load_summary_file(
summary_path: str, dict_columns: Optional[List[str]] = None
) -> pd.DataFrame:
"""
Load a summary file from summary_path.
:param summary_path: The path of the summary file.
:param dict_columns: The columns that are dictionary type.
You must fill this parameter if you want to load summary file properly.
Default is ['module_params'].
:return: The summary dataframe.
"""
if not os.path.exists(summary_path):
raise ValueError(f"summary.csv does not exist in {summary_path}.")
summary_df = pd.read_csv(summary_path)
if dict_columns is None:
dict_columns = ["module_params"]
if any([col not in summary_df.columns for col in dict_columns]):
raise ValueError(f"{dict_columns} must be in summary_df.columns.")
def convert_dict(elem):
try:
return ast.literal_eval(elem)
        except Exception:
# convert datetime or date to its object (recency filter)
date_object = convert_datetime_string(elem)
if date_object is None:
raise ValueError(
f"Malformed dict received : {elem}\nCan't convert to dict properly"
)
return {"threshold": date_object}
summary_df[dict_columns] = summary_df[dict_columns].map(convert_dict)
return summary_df
def convert_datetime_string(s):
# Regex to extract datetime arguments from the string
m = re.search(r"(datetime|date)(\((\d+)(,\s*\d+)*\))", s)
if m:
args = ast.literal_eval(m.group(2))
if m.group(1) == "datetime":
return datetime.datetime(*args)
elif m.group(1) == "date":
return datetime.date(*args)
return None
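# Illustrative example: convert_datetime_string("datetime(2024, 3, 18)")
# returns datetime.datetime(2024, 3, 18); strings without a datetime/date
# pattern return None.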
def make_combinations(target_dict: Dict[str, Any]) -> List[Dict[str, Any]]:
"""
Make combinations from target_dict.
The target_dict key value must be a string,
and the value can be a list of values or single value.
If generates all combinations of values from target_dict,
which means generating dictionaries that contain only one value for each key,
and all dictionaries will be different from each other.
:param target_dict: The target dictionary.
:return: The list of generated dictionaries.
"""
dict_with_lists = dict(
map(
lambda x: (x[0], x[1] if isinstance(x[1], list) else [x[1]]),
target_dict.items(),
)
)
def delete_duplicate(x):
def is_hashable(obj):
try:
hash(obj)
return True
except TypeError:
return False
if any([not is_hashable(elem) for elem in x]):
# TODO: add duplication check for unhashable objects
return x
else:
return list(set(x))
dict_with_lists = dict(
map(lambda x: (x[0], delete_duplicate(x[1])), dict_with_lists.items())
)
combination = list(itertools.product(*dict_with_lists.values()))
combination_dicts = [
dict(zip(dict_with_lists.keys(), combo)) for combo in combination
]
return combination_dicts
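# Illustrative example (the order of generated dicts may vary, since duplicate
# values are removed via set()):
#
#     make_combinations({"top_k": [1, 2], "method": "bm25"})
#     # -> [{"top_k": 1, "method": "bm25"}, {"top_k": 2, "method": "bm25"}]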
def explode(index_values: Collection[Any], explode_values: Collection[Collection[Any]]):
"""
Explode index_values and explode_values.
The index_values and explode_values must have the same length.
It will flatten explode_values and keep index_values as a pair.
:param index_values: The index values.
:param explode_values: The exploded values.
:return: Tuple of exploded index_values and exploded explode_values.
"""
assert len(index_values) == len(
explode_values
), "Index values and explode values must have same length"
df = pd.DataFrame({"index_values": index_values, "explode_values": explode_values})
df = df.explode("explode_values")
return df["index_values"].tolist(), df["explode_values"].tolist()
def replace_value_in_dict(target_dict: Dict, key: str, replace_value: Any) -> Dict:
"""
Replace the value of a certain key in target_dict.
If there is no targeted key in target_dict, it will return target_dict.
:param target_dict: The target dictionary.
:param key: The key is to replace.
:param replace_value: The value to replace.
:return: The replaced dictionary.
"""
replaced_dict = deepcopy(target_dict)
if key not in replaced_dict:
return replaced_dict
replaced_dict[key] = replace_value
return replaced_dict
def normalize_string(s: str) -> str:
"""
Taken from the official evaluation script for v1.1 of the SQuAD dataset.
Lower text and remove punctuation, articles, and extra whitespace.
"""
def remove_articles(text):
return re.sub(r"\b(a|an|the)\b", " ", text)
def white_space_fix(text):
return " ".join(text.split())
def remove_punc(text):
exclude = set(string.punctuation)
return "".join(ch for ch in text if ch not in exclude)
def lower(text):
return text.lower()
return white_space_fix(remove_articles(remove_punc(lower(s))))
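# Illustrative example: normalize_string("The  Quick, Brown Fox!")
# returns "quick brown fox".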
def convert_string_to_tuple_in_dict(d):
"""Recursively converts strings that start with '(' and end with ')' to tuples in a dictionary."""
for key, value in d.items():
# If the value is a dictionary, recurse
if isinstance(value, dict):
convert_string_to_tuple_in_dict(value)
# If the value is a list, iterate through its elements
elif isinstance(value, list):
for i, item in enumerate(value):
# If an item in the list is a dictionary, recurse
if isinstance(item, dict):
convert_string_to_tuple_in_dict(item)
# If an item in the list is a string matching the criteria, convert it to a tuple
elif (
isinstance(item, str)
and item.startswith("(")
and item.endswith(")")
):
value[i] = ast.literal_eval(item)
# If the value is a string matching the criteria, convert it to a tuple
elif isinstance(value, str) and value.startswith("(") and value.endswith(")"):
d[key] = ast.literal_eval(value)
return d
def convert_env_in_dict(d: Dict):
"""
Recursively converts environment variable string in a dictionary to actual environment variable.
:param d: The dictionary to convert.
:return: The converted dictionary.
"""
env_pattern = re.compile(r".*?\${(.*?)}.*?")
def convert_env(val: str):
matches = env_pattern.findall(val)
for match in matches:
val = val.replace(f"${{{match}}}", os.environ.get(match, ""))
return val
for key, value in d.items():
if isinstance(value, dict):
convert_env_in_dict(value)
elif isinstance(value, list):
for i, item in enumerate(value):
if isinstance(item, dict):
convert_env_in_dict(item)
elif isinstance(item, str):
value[i] = convert_env(item)
elif isinstance(value, str):
d[key] = convert_env(value)
return d
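# Illustrative example (assumes MY_HOST is set in the environment):
#
#     os.environ["MY_HOST"] = "localhost"
#     convert_env_in_dict({"url": "http://${MY_HOST}:7690"})
#     # -> {"url": "http://localhost:7690"}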
async def process_batch(tasks, batch_size: int = 64) -> List[Any]:
"""
Processes tasks in batches asynchronously.
:param tasks: A list of no-argument functions or coroutines to be executed.
:param batch_size: The number of tasks to process in a single batch.
Default is 64.
:return: A list of results from the processed tasks.
"""
results = []
for i in range(0, len(tasks), batch_size):
batch = tasks[i : i + batch_size]
batch_results = await asyncio.gather(*batch)
results.extend(batch_results)
return results
def make_batch(elems: List[Any], batch_size: int) -> List[List[Any]]:
"""
Make a batch of elems with batch_size.
"""
return [elems[i : i + batch_size] for i in range(0, len(elems), batch_size)]
def save_parquet_safe(df: pd.DataFrame, filepath: str, upsert: bool = False):
output_file_dir = os.path.dirname(filepath)
if not os.path.isdir(output_file_dir):
raise NotADirectoryError(f"directory {output_file_dir} not found.")
if not filepath.endswith("parquet"):
raise NameError(
f'file path: {filepath} filename extension need to be ".parquet"'
)
if os.path.exists(filepath) and not upsert:
raise FileExistsError(
f"file {filepath} already exists."
"Set upsert True if you want to overwrite the file."
)
df.to_parquet(filepath, index=False)
def openai_truncate_by_token(
texts: List[str], token_limit: int, model_name: str
) -> List[str]:
try:
tokenizer = tiktoken.encoding_for_model(model_name)
except KeyError:
# This is not a real OpenAI model
return texts
def truncate_text(text: str, limit: int, tokenizer):
tokens = tokenizer.encode(text)
if len(tokens) <= limit:
return text
truncated_text = tokenizer.decode(tokens[:limit])
return truncated_text
return list(map(lambda x: truncate_text(x, token_limit, tokenizer), texts))
def reconstruct_list(flat_list: List[Any], lengths: List[int]) -> List[List[Any]]:
result = []
start = 0
for length in lengths:
result.append(flat_list[start : start + length])
start += length
return result
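# Illustrative example: reconstruct_list([1, 2, 3, 4], [3, 1])
# returns [[1, 2, 3], [4]].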
def flatten_apply(
func: Callable, nested_list: List[List[Any]], **kwargs
) -> List[List[Any]]:
"""
This function flattens the input list and applies the function to the elements.
After that, it reconstructs the list to the original shape.
Its speciality is that the first dimension length of the list can be different from each other.
:param func: The function that applies to the flattened list.
:param nested_list: The nested list to be flattened.
:return: The list that is reconstructed after applying the function.
"""
df = pd.DataFrame({"col1": nested_list})
df = df.explode("col1")
df["result"] = func(df["col1"].tolist(), **kwargs)
return df.groupby(level=0, sort=False)["result"].apply(list).tolist()
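# Illustrative example: the given function receives one flat list, and the
# results are regrouped into the original ragged shape.
#
#     flatten_apply(lambda xs: [x * 2 for x in xs], [[1, 2], [3]])
#     # -> [[2, 4], [6]]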
async def aflatten_apply(
func: Callable, nested_list: List[List[Any]], **kwargs
) -> List[List[Any]]:
"""
This function flattens the input list and applies the function to the elements.
After that, it reconstructs the list to the original shape.
Its speciality is that the first dimension length of the list can be different from each other.
:param func: The function that applies to the flattened list.
:param nested_list: The nested list to be flattened.
:return: The list that is reconstructed after applying the function.
"""
df = pd.DataFrame({"col1": nested_list})
df = df.explode("col1")
df["result"] = await func(df["col1"].tolist(), **kwargs)
return df.groupby(level=0, sort=False)["result"].apply(list).tolist()
def sort_by_scores(row, reverse=True):
"""
Sorts each row by 'scores' column.
The input column names must be 'contents', 'ids', and 'scores'.
And its elements must be list type.
"""
results = sorted(
zip(row["contents"], row["ids"], row["scores"]),
key=lambda x: x[2],
reverse=reverse,
)
reranked_contents, reranked_ids, reranked_scores = zip(*results)
return list(reranked_contents), list(reranked_ids), list(reranked_scores)
def select_top_k(df, column_names: List[str], top_k: int):
for column_name in column_names:
df[column_name] = df[column_name].apply(lambda x: x[:top_k])
return df
def filter_dict_keys(dict_, keys: List[str]):
result = {}
for key in keys:
if key in dict_:
result[key] = dict_[key]
else:
raise KeyError(f"Key '{key}' not found in dictionary.")
return result
def split_dataframe(df, chunk_size):
num_chunks = (
len(df) // chunk_size + 1
if len(df) % chunk_size != 0
else len(df) // chunk_size
)
result = list(
map(lambda x: df[x * chunk_size : (x + 1) * chunk_size], range(num_chunks))
)
result = list(map(lambda x: x.reset_index(drop=True), result))
return result
def find_trial_dir(project_dir: str) -> List[str]:
# Pattern to match directories named with numbers
pattern = os.path.join(project_dir, "[0-9]*")
all_entries = glob.glob(pattern)
# Filter out only directories
trial_dirs = [
entry
for entry in all_entries
if os.path.isdir(entry) and entry.split(os.sep)[-1].isdigit()
]
return trial_dirs
def find_node_summary_files(trial_dir: str) -> List[str]:
# Find all summary.csv files recursively
all_summary_files = glob.glob(
os.path.join(trial_dir, "**", "summary.csv"), recursive=True
)
    # Keep only node-level summary files, excluding trial- and node-line-level summaries
filtered_files = [
f for f in all_summary_files if f.count(os.sep) > trial_dir.count(os.sep) + 2
]
return filtered_files
def preprocess_text(text: str) -> str:
return normalize_unicode(demojize(text))
def demojize(text: str) -> str:
return emoji.demojize(text)
def normalize_unicode(text: str) -> str:
return unicodedata.normalize("NFC", text)
def dict_to_markdown(d, level=1):
"""
Convert a dictionary to a Markdown formatted string.
:param d: Dictionary to convert
:param level: Current level of heading (used for nested dictionaries)
:return: Markdown formatted string
"""
markdown = ""
for key, value in d.items():
if isinstance(value, dict):
markdown += f"{'#' * level} {key}\n"
markdown += dict_to_markdown(value, level + 1)
elif isinstance(value, list):
markdown += f"{'#' * level} {key}\n"
for item in value:
if isinstance(item, dict):
markdown += dict_to_markdown(item, level + 1)
else:
markdown += f"- {item}\n"
else:
markdown += f"{'#' * level} {key}\n{value}\n"
return markdown
def dict_to_markdown_table(data, key_column_name: str, value_column_name: str):
# Check if the input is a dictionary
if not isinstance(data, dict):
raise ValueError("Input must be a dictionary")
# Create the header of the table
header = f"| {key_column_name} | {value_column_name} |\n| :---: | :-----: |\n"
# Create the rows of the table
rows = ""
for key, value in data.items():
rows += f"| {key} | {value} |\n"
# Combine header and rows
markdown_table = header + rows
return markdown_table
def embedding_query_content(
    queries: List[str],
    contents_list: List[List[str]],
    embedding_model: Optional[Any] = None,  # a LlamaIndex embedding model instance
    batch: int = 128,
):
flatten_contents = list(itertools.chain.from_iterable(contents_list))
    openai_embedding_limit = 8000  # OpenAI embedding models accept at most ~8k input tokens
if isinstance(embedding_model, OpenAIEmbedding):
queries = openai_truncate_by_token(
queries, openai_embedding_limit, embedding_model.model_name
)
flatten_contents = openai_truncate_by_token(
flatten_contents, openai_embedding_limit, embedding_model.model_name
)
# Embedding using batch
embedding_model.embed_batch_size = batch
query_embeddings = embedding_model.get_text_embedding_batch(queries)
content_lengths = list(map(len, contents_list))
content_embeddings_flatten = embedding_model.get_text_embedding_batch(
flatten_contents
)
content_embeddings = reconstruct_list(content_embeddings_flatten, content_lengths)
return query_embeddings, content_embeddings
def to_list(item):
"""Recursively convert collections to Python lists."""
if isinstance(item, np.ndarray):
# Convert numpy array to list and recursively process each element
return [to_list(sub_item) for sub_item in item.tolist()]
elif isinstance(item, pd.Series):
# Convert pandas Series to list and recursively process each element
return [to_list(sub_item) for sub_item in item.tolist()]
elif isinstance(item, Iterable) and not isinstance(
item, (str, bytes, BaseModel, BM)
):
# Recursively process each element in other iterables
return [to_list(sub_item) for sub_item in item]
else:
return item
def convert_inputs_to_list(func):
"""Decorator to convert all function inputs to Python lists."""
@functools.wraps(func)
def wrapper(*args, **kwargs):
new_args = [to_list(arg) for arg in args]
new_kwargs = {k: to_list(v) for k, v in kwargs.items()}
return func(*new_args, **new_kwargs)
return wrapper
def get_best_row(
summary_df: pd.DataFrame, best_column_name: str = "is_best"
) -> pd.Series:
"""
From the summary dataframe, find the best result row by 'is_best' column and return it.
:param summary_df: Summary dataframe created by AutoRAG.
:param best_column_name: The column name that indicates the best result.
Default is 'is_best'.
You don't have to change this unless the column name is different.
:return: Best row pandas Series instance.
"""
bests = summary_df.loc[summary_df[best_column_name]]
assert len(bests) == 1, "There must be only one best result."
return bests.iloc[0]
def get_event_loop() -> AbstractEventLoop:
"""
Get asyncio event loop safely.
"""
try:
loop = asyncio.get_running_loop()
except RuntimeError:
loop = asyncio.new_event_loop()
asyncio.set_event_loop(loop)
return loop
def find_key_values(data, target_key: str) -> List[Any]:
"""
Recursively find all values for a specific key in a nested dictionary or list.
:param data: The dictionary or list to search.
:param target_key: The key to search for.
:return: A list of values associated with the target key.
"""
values = []
if isinstance(data, dict):
for key, value in data.items():
if key == target_key:
values.append(value)
if isinstance(value, (dict, list)):
values.extend(find_key_values(value, target_key))
elif isinstance(data, list):
for item in data:
if isinstance(item, (dict, list)):
values.extend(find_key_values(item, target_key))
return values
def pop_params(func: Callable, kwargs: Dict) -> Dict:
"""
Pop parameters from the given func and return them.
It automatically deletes the parameters like "self" or "cls".
:param func: The function to pop parameters.
:param kwargs: kwargs to pop parameters.
:return: The popped parameters.
"""
ignore_params = ["self", "cls"]
target_params = list(inspect.signature(func).parameters.keys())
target_params = list(filter(lambda x: x not in ignore_params, target_params))
init_params = {}
kwargs_keys = list(kwargs.keys())
for key in kwargs_keys:
if key in target_params:
init_params[key] = kwargs.pop(key)
return init_params
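# Illustrative example: keys that match func's signature are removed from
# kwargs and returned.
#
#     def f(a, b=1): ...
#     kwargs = {"a": 1, "c": 3}
#     pop_params(f, kwargs)  # -> {"a": 1}; kwargs is now {"c": 3}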
def apply_recursive(func, data):
"""
Recursively apply a function to all elements in a list, tuple, set, np.ndarray, or pd.Series and return as List.
:param func: Function to apply to each element.
:param data: List or nested list.
:return: List with the function applied to each element.
"""
if (
isinstance(data, list)
or isinstance(data, tuple)
or isinstance(data, set)
or isinstance(data, np.ndarray)
or isinstance(data, pd.Series)
):
return [apply_recursive(func, item) for item in data]
else:
return func(data)
def empty_cuda_cache():
try:
import torch
if torch.cuda.is_available():
torch.cuda.empty_cache()
except ImportError:
pass
def load_yaml_config(yaml_path: str) -> Dict:
"""
Load a YAML configuration file for AutoRAG.
It contains safe loading, converting string to tuple, and insert environment variables.
:param yaml_path: The path of the YAML configuration file.
:return: The loaded configuration dictionary.
"""
if not os.path.exists(yaml_path):
raise ValueError(f"YAML file {yaml_path} does not exist.")
with open(yaml_path, "r", encoding="utf-8") as stream:
try:
yaml_dict = yaml.safe_load(stream)
except yaml.YAMLError as exc:
raise ValueError(f"YAML file {yaml_path} could not be loaded.") from exc
yaml_dict = convert_string_to_tuple_in_dict(yaml_dict)
yaml_dict = convert_env_in_dict(yaml_dict)
return yaml_dict
def decode_multiple_json_from_bytes(byte_data: bytes) -> list:
"""
Decode multiple JSON objects from bytes received from SSE server.
Args:
byte_data: Bytes containing one or more JSON objects
Returns:
List of decoded JSON objects
"""
# Decode bytes to string
try:
text_data = byte_data.decode("utf-8").strip()
except UnicodeDecodeError:
raise ValueError("Invalid byte data: Unable to decode as UTF-8")
# Initialize decoder and result list
decoder = JSONDecoder()
result = []
# Keep track of position in string
pos = 0
text_data = text_data.strip()
while pos < len(text_data):
try:
# Try to decode next JSON object
json_obj, json_end = decoder.raw_decode(text_data[pos:])
result.append(json_obj)
# Move position to end of current JSON object
pos += json_end
# Skip any whitespace
while pos < len(text_data) and text_data[pos].isspace():
pos += 1
except json.JSONDecodeError:
# If we can't decode at current position, move forward one character
pos += 1
return result
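# Illustrative example: two JSON objects concatenated in one SSE chunk.
#
#     decode_multiple_json_from_bytes(b'{"a": 1}\n{"b": 2}')
#     # -> [{"a": 1}, {"b": 2}]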

7
dashboard.sh Normal file

@@ -0,0 +1,7 @@
#!/bin/bash
echo "📊 Starting AutoRAG Dashboard..."
python3 -m autorag.cli dashboard \
	--trial_dir /usr/src/app/projects/benchmark_sample/1 \
	--port 7690

22
docker-compose.yml Normal file

@@ -0,0 +1,22 @@
services:
autorag-dashboard:
build:
context: .
container_name: autorag-dashboard
environment:
- CUDA_VISIBLE_DEVICES=0
      - OPENAI_API_KEY=${OPENAI_API_KEY} # supply the key via the host environment; never commit real keys
- BOKEH_ALLOW_WS_ORIGIN=172.16.10.175:7690
volumes:
- ~/.cache/huggingface:/root/.cache/huggingface
- ./:/usr/src/app/
tty: true
working_dir: /usr/src/app
networks:
- autorag-dashboard_network
ports:
- "7690:7690"
networks:
autorag-dashboard_network:
driver: bridge


@@ -0,0 +1,92 @@
vectordb:
- name: chroma_dragonkue2
db_type: chroma
client_type: persistent
embedding_model: huggingface_drangonku-v2-ko
collection_name: huggingface_drangonku-v2-ko
path: ${PROJECT_DIR}/resources/chroma
node_lines:
- node_line_name: retrieve_node_line # Arbitrary node line name
nodes:
- node_type: retrieval
strategy:
metrics: [ retrieval_f1, retrieval_recall, retrieval_precision,
retrieval_ndcg, retrieval_map, retrieval_mrr ]
speed_threshold: 10
top_k: 10
modules:
- module_type: bm25
bm25_tokenizer: [ ko_kiwi, ko_okt ]
- module_type: vectordb
vectordb: chroma_dragonkue2 # chromadb
- module_type: hybrid_cc
normalize_method: [ mm, tmm, z, dbsf ]
target_modules: ('bm25', 'vectordb')
weight_range: (0.6, 0.4)
test_weight_size: 101
- node_type: passage_reranker # re-ranker
strategy:
metrics:
- retrieval_recall
- retrieval_precision
- retrieval_map
modules:
- module_type: dragonkue2
top_k: 5
  - node_line_name: post_retrieve_node_line # generation node line
nodes:
- node_type: prompt_maker
strategy:
metrics:
- metric_name: bleu
- metric_name: meteor
- metric_name: rouge
- metric_name: sem_score
embedding_model: huggingface_drangonku-v2-ko # raise ValueError("Only one embedding model is supported")
lang: ko
generator_modules:
- module_type: llama_index_llm
llm: ollama
model: [ gemma3:12b, phi4, deepseek-r1:14b, aya-expanse:8b ]
request_timeout: 3000.0
modules:
- module_type: fstring
prompt:
- |
### Task:
Respond to the user query using the provided context.
### Guidelines:
- If you don't know the answer, clearly state that.
- If uncertain, ask the user for clarification.
- Respond in the same language as the user's query.
- If the context is unreadable or of poor quality, inform the user and provide the best possible answer.
- If the answer isn't present in the context but you possess the knowledge, explain this to the user and provide the answer using your own understanding.
- Do not use XML tags in your response.
### Output:
Provide a clear and direct response to the user's query.
<context>
{retrieved_contents}
</context>
<user_query>
{query}
</user_query>
- node_type: generator # Gen-LLM
strategy:
metrics:
- metric_name: bleu
- metric_name: meteor
- metric_name: rouge
- metric_name: sem_score
modules:
- module_type: llama_index_llm
llm: ollama
model: gemma3:12b # phi4, deepseek-r1:14b, aya-expanse:8b
temperature: 0.0
request_timeout: 30000.0
batch: 4


@@ -0,0 +1,92 @@
vectordb:
- name: chroma_dragonkue2
db_type: chroma
client_type: persistent
embedding_model: huggingface_drangonku-v2-ko
collection_name: huggingface_drangonku-v2-ko
path: ${PROJECT_DIR}/resources/chroma
node_lines:
- node_line_name: retrieve_node_line # Arbitrary node line name
nodes:
- node_type: retrieval
strategy:
metrics: [ retrieval_f1, retrieval_recall, retrieval_precision,
retrieval_ndcg, retrieval_map, retrieval_mrr ]
speed_threshold: 10
top_k: 10
modules:
- module_type: bm25
bm25_tokenizer: [ ko_kiwi ] # ko_kiwi, ko_okt
- module_type: vectordb
vectordb: chroma_dragonkue2 # chromadb
- module_type: hybrid_cc
normalize_method: [ mm, tmm, z, dbsf ]
target_modules: ('bm25', 'vectordb')
weight_range: (0.6, 0.4)
test_weight_size: 101
- node_type: passage_reranker # re-ranker
strategy:
metrics:
- retrieval_recall
- retrieval_precision
- retrieval_map
modules:
- module_type: dragonkue2
top_k: 5
  - node_line_name: post_retrieve_node_line # generation node line
nodes:
- node_type: prompt_maker
strategy:
metrics:
- metric_name: bleu
- metric_name: meteor
- metric_name: rouge
- metric_name: sem_score
embedding_model: huggingface_drangonku-v2-ko # raise ValueError("Only one embedding model is supported")
lang: ko
generator_modules:
- module_type: llama_index_llm
llm: ollama
model: gemma3:12b
request_timeout: 3000.0
modules:
- module_type: fstring
prompt:
- |
### 작업:
지침에 따라 제공된 컨텍스트를 활용하여 사용자 질문에 답변하세요.
### 지침:
- 답을 모를 경우, 모른다고 명확히 말하세요.
- 확신이 없다면, 사용자에게 추가 설명을 요청하세요.
- 사용자의 질문과 동일한 언어로 답변하세요.
- 컨텍스트가 읽기 어렵거나 품질이 낮을 경우, 이를 사용자에게 알리고 최선의 답변을 제공하세요.
- 컨텍스트에 답이 없지만 알고 있는 내용이라면, 이를 사용자에게 설명하고 자신의 지식을 바탕으로 답변하세요.
- XML 태그를 사용하지 마세요.
### 출력:
사용자의 질문에 대해 명확하고 직접적인 답변을 제공하세요.
<context>
{retrieved_contents}
</context>
<user_query>
{query}
</user_query>
- node_type: generator # Gen-LLM
strategy:
metrics:
- metric_name: bleu
- metric_name: meteor
- metric_name: rouge
- metric_name: sem_score
modules:
- module_type: llama_index_llm
llm: ollama
model: gemma3:12b # phi4, deepseek-r1:14b, aya-expanse:8b
temperature: 0.0
request_timeout: 300.0
batch: 8


@@ -0,0 +1,2 @@
filename,module_name,module_params,execution_time,average_output_token,bleu,meteor,rouge,sem_score,is_best
0.parquet,LlamaIndexLLM,"{'llm': 'ollama', 'model': 'gemma3:12b', 'temperature': 0.0, 'request_timeout': 300.0, 'batch': 8}",0.8519447922706604,259.05,14.57290077698799,0.47984407229799053,0.4400396825396825,0.8177114641079747,True


@@ -0,0 +1,2 @@
filename,module_name,module_params,execution_time,average_prompt_token,is_best
0.parquet,Fstring,"{'prompt': '### 작업: \n지침에 따라 제공된 컨텍스트를 활용하여 사용자 질문에 답변하세요. \n\n### 지침: \n- 답을 모를 경우, 모른다고 명확히 말하세요. \n- 확신이 없다면, 사용자에게 추가 설명을 요청하세요. \n- 사용자의 질문과 동일한 언어로 답변하세요. \n- 컨텍스트가 읽기 어렵거나 품질이 낮을 경우, 이를 사용자에게 알리고 최선의 답변을 제공하세요. \n- 컨텍스트에 답이 없지만 알고 있는 내용이라면, 이를 사용자에게 설명하고 자신의 지식을 바탕으로 답변하세요. \n- XML 태그를 사용하지 마세요. \n\n### 출력: \n사용자의 질문에 대해 명확하고 직접적인 답변을 제공하세요.\n\n<context>\n{retrieved_contents}\n</context>\n\n<user_query>\n{query}\n</user_query>\n'}",0.0003142237663269043,2751.85,True


@@ -0,0 +1,3 @@
node_type,best_module_filename,best_module_name,best_module_params,best_execution_time
prompt_maker,0.parquet,Fstring,"{'prompt': '### 작업: \n지침에 따라 제공된 컨텍스트를 활용하여 사용자 질문에 답변하세요. \n\n### 지침: \n- 답을 모를 경우, 모른다고 명확히 말하세요. \n- 확신이 없다면, 사용자에게 추가 설명을 요청하세요. \n- 사용자의 질문과 동일한 언어로 답변하세요. \n- 컨텍스트가 읽기 어렵거나 품질이 낮을 경우, 이를 사용자에게 알리고 최선의 답변을 제공하세요. \n- 컨텍스트에 답이 없지만 알고 있는 내용이라면, 이를 사용자에게 설명하고 자신의 지식을 바탕으로 답변하세요. \n- XML 태그를 사용하지 마세요. \n\n### 출력: \n사용자의 질문에 대해 명확하고 직접적인 답변을 제공하세요.\n\n<context>\n{retrieved_contents}\n</context>\n\n<user_query>\n{query}\n</user_query>\n'}",0.0003142237663269
generator,0.parquet,LlamaIndexLLM,"{'llm': 'ollama', 'model': 'gemma3:12b', 'temperature': 0.0, 'request_timeout': 300.0, 'batch': 8}",0.8519447922706604


@@ -0,0 +1,2 @@
filename,module_name,module_params,execution_time,passage_reranker_retrieval_recall,passage_reranker_retrieval_precision,passage_reranker_retrieval_map,is_best
0.parquet,DragonKue2,{'top_k': 5},0.12188564538955689,0.3,0.06,0.18916666666666665,True


@@ -0,0 +1,7 @@
filename,module_name,module_params,execution_time,retrieval_f1,retrieval_recall,retrieval_precision,retrieval_ndcg,retrieval_map,retrieval_mrr,is_best
0.parquet,VectorDB,"{'top_k': 10, 'vectordb': 'chroma_dragonkue2'}",0.10161013603210449,0.045454545454545456,0.25,0.025,0.14013009087326042,0.10625,0.10625,False
1.parquet,BM25,"{'top_k': 10, 'bm25_tokenizer': 'ko_kiwi'}",1.9859044432640076,0.03636363636363636,0.2,0.02,0.07248116240107563,0.034999999999999996,0.034999999999999996,False
2.parquet,HybridCC,"{'top_k': 10, 'normalize_method': 'dbsf', 'target_modules': ('VectorDB', 'BM25'), 'weight': 0.516, 'target_module_params': ({'top_k': 10, 'vectordb': 'chroma_dragonkue2'}, {'top_k': 10, 'bm25_tokenizer': 'ko_kiwi'})}",2.087514579296112,0.06363636363636363,0.35,0.035,0.20447427813233116,0.16041666666666665,0.16041666666666665,True
3.parquet,HybridCC,"{'top_k': 10, 'normalize_method': 'mm', 'target_modules': ('VectorDB', 'BM25'), 'weight': 0.51, 'target_module_params': ({'top_k': 10, 'vectordb': 'chroma_dragonkue2'}, {'top_k': 10, 'bm25_tokenizer': 'ko_kiwi'})}",2.087514579296112,0.06363636363636363,0.35,0.035,0.20447427813233116,0.16041666666666665,0.16041666666666665,False
4.parquet,HybridCC,"{'top_k': 10, 'normalize_method': 'tmm', 'target_modules': ('VectorDB', 'BM25'), 'weight': 0.454, 'target_module_params': ({'top_k': 10, 'vectordb': 'chroma_dragonkue2'}, {'top_k': 10, 'bm25_tokenizer': 'ko_kiwi'})}",2.087514579296112,0.05454545454545454,0.3,0.03,0.15007396002669662,0.10499999999999998,0.10499999999999998,False
5.parquet,HybridCC,"{'top_k': 10, 'normalize_method': 'z', 'target_modules': ('VectorDB', 'BM25'), 'weight': 0.516, 'target_module_params': ({'top_k': 10, 'vectordb': 'chroma_dragonkue2'}, {'top_k': 10, 'bm25_tokenizer': 'ko_kiwi'})}",2.087514579296112,0.06363636363636363,0.35,0.035,0.20447427813233116,0.16041666666666665,0.16041666666666665,False
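The HybridCC rows fuse the VectorDB and BM25 rankings by convex combination: each module's scores are normalized (mm: min-max, tmm: theoretical min-max, z: z-score, dbsf: distribution-based score fusion) and mixed with the given weight, so weight = 0.516 leans slightly toward the semantic scores. A minimal sketch of the min-max ("mm") variant, assuming score dictionaries keyed by passage id and hypothetical helper names, not AutoRAG's implementation:

```python
def minmax(scores):
    """Min-max normalize a {passage_id: score} dict into [0, 1]."""
    lo, hi = min(scores.values()), max(scores.values())
    if hi == lo:
        return {pid: 0.0 for pid in scores}
    return {pid: (s - lo) / (hi - lo) for pid, s in scores.items()}

def hybrid_cc(semantic, lexical, weight, top_k):
    """Convex combination: weight * semantic + (1 - weight) * lexical."""
    sem, lex = minmax(semantic), minmax(lexical)
    fused = {
        pid: weight * sem.get(pid, 0.0) + (1 - weight) * lex.get(pid, 0.0)
        for pid in set(sem) | set(lex)
    }
    return sorted(fused.items(), key=lambda kv: kv[1], reverse=True)[:top_k]

# weight=0.516 slightly favors the VectorDB (semantic) side of the fusion.
print(hybrid_cc({"a": 0.9, "b": 0.2}, {"b": 12.0, "c": 8.0}, 0.516, 10))
```

Three of the four normalization methods land on identical metrics here, which is common on small evaluation sets where the fused rankings coincide.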

View File

@@ -0,0 +1,3 @@
node_type,best_module_filename,best_module_name,best_module_params,best_execution_time
retrieval,2.parquet,HybridCC,"{'top_k': 10, 'normalize_method': 'dbsf', 'target_modules': ('VectorDB', 'BM25'), 'weight': 0.516, 'target_module_params': ({'top_k': 10, 'vectordb': 'chroma_dragonkue2'}, {'top_k': 10, 'bm25_tokenizer': 'ko_kiwi'})}",2.087514579296112
passage_reranker,0.parquet,DragonKue2,{'top_k': 5},0.1218856453895568

View File

@@ -0,0 +1,5 @@
node_line_name,node_type,best_module_filename,best_module_name,best_module_params,best_execution_time
retrieve_node_line,retrieval,2.parquet,HybridCC,"{'top_k': 10, 'normalize_method': 'dbsf', 'target_modules': ('VectorDB', 'BM25'), 'weight': 0.516, 'target_module_params': ({'top_k': 10, 'vectordb': 'chroma_dragonkue2'}, {'top_k': 10, 'bm25_tokenizer': 'ko_kiwi'})}",2.087514579296112
retrieve_node_line,passage_reranker,0.parquet,DragonKue2,{'top_k': 5},0.1218856453895568
post_retrieve_node_line,prompt_maker,0.parquet,Fstring,"{'prompt': '### 작업: \n지침에 따라 제공된 컨텍스트를 활용하여 사용자 질문에 답변하세요. \n\n### 지침: \n- 답을 모를 경우, 모른다고 명확히 말하세요. \n- 확신이 없다면, 사용자에게 추가 설명을 요청하세요. \n- 사용자의 질문과 동일한 언어로 답변하세요. \n- 컨텍스트가 읽기 어렵거나 품질이 낮을 경우, 이를 사용자에게 알리고 최선의 답변을 제공하세요. \n- 컨텍스트에 답이 없지만 알고 있는 내용이라면, 이를 사용자에게 설명하고 자신의 지식을 바탕으로 답변하세요. \n- XML 태그를 사용하지 마세요. \n\n### 출력: \n사용자의 질문에 대해 명확하고 직접적인 답변을 제공하세요.\n\n<context>\n{retrieved_contents}\n</context>\n\n<user_query>\n{query}\n</user_query>\n'}",0.0003142237663269
post_retrieve_node_line,generator,0.parquet,LlamaIndexLLM,"{'llm': 'ollama', 'model': 'gemma3:12b', 'temperature': 0.0, 'request_timeout': 300.0, 'batch': 8}",0.8519447922706604
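Read together, the summary files describe the selected pipeline end to end: HybridCC retrieval, DragonKue2 reranking, an Fstring prompt, and generation with gemma3:12b via Ollama. A quick way to pull the winning modules out of such a summary with pandas (the path below is illustrative; point it at your own trial_dir):

```python
import pandas as pd

# Trial-level summary written by AutoRAG; adjust the path to your trial_dir.
summary = pd.read_csv("projects/benchmark_sample/0/summary.csv")

# Each row records the winning module for one node of the pipeline.
for _, row in summary.iterrows():
    print(f"{row['node_line_name']}/{row['node_type']}: "
          f"{row['best_module_name']} {row['best_module_params']}")
```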

Binary file not shown.

Binary file not shown.

Binary file not shown.

Binary file not shown.

View File

@@ -0,0 +1,7 @@
vectordb:
  - client_type: persistent
    collection_name: huggingface_drangonku-v2-ko
    db_type: chroma
    embedding_model: huggingface_drangonku-v2-ko
    name: chroma_dragonkue2
    path: ../projects/daesan-dangjin_01/benchmark/resources/chroma
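This file declares the persistent Chroma collection that the retrieval rows above reference as vectordb: 'chroma_dragonkue2'. A minimal sketch for inspecting that collection directly with the standard chromadb client (the path is relative to wherever the benchmark ran):

```python
import chromadb

# Open the on-disk Chroma store declared in the YAML above.
client = chromadb.PersistentClient(
    path="../projects/daesan-dangjin_01/benchmark/resources/chroma"
)
collection = client.get_collection("huggingface_drangonku-v2-ko")

print(collection.count())   # number of embedded passages
print(collection.peek(1))   # one stored document with its metadata
```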

View File

@@ -0,0 +1,10 @@
[
    {
        "trial_name": "0",
        "start_time": "2025-03-13 07:47:00"
    },
    {
        "trial_name": "1",
        "start_time": "2025-03-13 08:03:47"
    }
]

149
pyproject.toml Normal file
View File

@@ -0,0 +1,149 @@
[build-system]
requires = ["setuptools", "setuptools-scm"]
build-backend = "setuptools.build_meta"

[project]
name = "AutoRAG"
authors = [
    { name = "Marker-Inc", email = "vkehfdl1@gmail.com" }
]
description = 'Automatically Evaluate RAG pipelines with your own data. Find optimal structure for new RAG product.'
readme = "README.md"
requires-python = ">=3.10"
keywords = ['RAG', 'AutoRAG', 'autorag', 'rag-evaluation', 'evaluation', 'rag-auto', 'AutoML', 'AutoML-RAG']
license = { file = "LICENSE" }
classifiers = [
    "Intended Audience :: Developers",
    "Intended Audience :: Information Technology",
    "Intended Audience :: Science/Research",
    'Programming Language :: Python :: 3.10',
    'Programming Language :: Python :: 3.11',
    'Programming Language :: Python :: 3.12',
    "Topic :: Scientific/Engineering :: Artificial Intelligence",
    "Topic :: Software Development :: Libraries",
    "Topic :: Software Development :: Libraries :: Python Modules",
]
urls = { Homepage = "https://github.com/Marker-Inc-Korea/AutoRAG" }
dynamic = ["version", "dependencies"]

[tool.poetry]
name = "AutoRAG"
version = "0.0.2" # initial version
description = "Automatically Evaluate RAG pipelines with your own data. Find optimal structure for new RAG product."
authors = ["Marker-Inc <vkehfdl1@gmail.com>"]

[tool.setuptools.dynamic]
version = { file = ["autorag/VERSION"] }
dependencies = { file = ["requirements.txt"] }

[tool.setuptools]
include-package-data = true

[tool.setuptools.packages.find]
where = ["."]
include = ["autorag*"]
exclude = ["tests"]

[tool.pytest.ini_options]
pythonpath = ["."]
testpaths = ["tests"]
addopts = ["--import-mode=importlib"] # default is prepend

[project.optional-dependencies]
ko = ["kiwipiepy >= 0.18.0", "konlpy"]
dev = ["ruff", "pre-commit"]
parse = ["PyMuPDF", "pdfminer.six", "pdfplumber", "unstructured", "jq", "unstructured[pdf]", "PyPDF2<3.0", "pdf2image"]
ja = ["sudachipy>=0.6.8", "sudachidict_core"]
gpu = ["torch", "sentencepiece", "bert_score", "optimum[openvino,nncf]", "peft", "llmlingua", "FlagEmbedding",
    "sentence-transformers", "transformers", "llama-index-llms-ollama", "llama-index-embeddings-huggingface",
    "llama-index-llms-huggingface", "onnxruntime"]
all = ["AutoRAG[gpu]", "AutoRAG[ko]", "AutoRAG[dev]", "AutoRAG[parse]", "AutoRAG[ja]"]

[project.entry-points.console_scripts]
autorag = "autorag.cli:cli"

[tool.ruff]
# Exclude a variety of commonly ignored directories.
exclude = [
    ".bzr",
    ".direnv",
    ".eggs",
    ".git",
    ".git-rewrite",
    ".hg",
    ".ipynb_checkpoints",
    ".mypy_cache",
    ".nox",
    ".pants.d",
    ".pyenv",
    ".pytest_cache",
    ".pytype",
    ".ruff_cache",
    ".svn",
    ".tox",
    ".venv",
    ".vscode",
    "__pypackages__",
    "_build",
    "buck-out",
    "build",
    "dist",
    "node_modules",
    "site-packages",
    "venv",
]

# Same as Black.
line-length = 88
indent-width = 4

# Match requires-python above (>=3.10).
target-version = "py310"

[tool.ruff.lint]
# Enable Pyflakes (`F`) and a subset of the pycodestyle (`E`) codes by default.
# Unlike Flake8, Ruff doesn't enable pycodestyle warnings (`W`) or
# McCabe complexity (`C901`) by default.
select = ["E4", "E7", "E9", "F"]
ignore = ["E722", "F821"]

# Allow fix for all enabled rules (when `--fix` is provided).
fixable = ["ALL"]
unfixable = ["B"]

# Allow unused variables when underscore-prefixed.
dummy-variable-rgx = "^(_+|(_+[a-zA-Z0-9_]*[a-zA-Z0-9]+?))$"

[tool.ruff.lint.per-file-ignores]
"__init__.py" = ["E402", "F401"]
"**/{docs}/*" = ["E402", "F401"]
"test_*.py" = ["F401", "F811"]
"*_test.py" = ["F401", "F811"]
"resources/parse_data/*" = ["W292"]

[tool.ruff.format]
# Like Black, use double quotes for strings.
quote-style = "double"

# Unlike Black, indent with tabs rather than spaces.
indent-style = "tab"

# Like Black, respect magic trailing commas.
skip-magic-trailing-comma = false

# Like Black, automatically detect the appropriate line ending.
line-ending = "auto"

# Enable auto-formatting of code examples in docstrings. Markdown,
# reStructuredText code/literal blocks and doctests are all supported.
#
# This is currently disabled by default, but it is planned for this
# to be opt-out in the future.
docstring-code-format = true

# Set the line length limit used when formatting code snippets in
# docstrings.
#
# This only has an effect when the `docstring-code-format` setting is
# enabled.
docstring-code-line-length = "dynamic"
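
Since version and dependencies are declared dynamic, setuptools resolves them at build time from autorag/VERSION and requirements.txt. Roughly, it does the equivalent of the following (illustrative sketch only, not setuptools internals):

```python
from pathlib import Path

# Approximately what [tool.setuptools.dynamic] resolves at build time.
version = Path("autorag/VERSION").read_text().strip()
dependencies = [
    line.split("#", 1)[0].strip()   # drop inline comments
    for line in Path("requirements.txt").read_text().splitlines()
    if line.split("#", 1)[0].strip()  # skip blank / comment-only lines
]
print(version, len(dependencies))
```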

69
requirements.txt Normal file
View File

@@ -0,0 +1,69 @@
pydantic<2.10.0 # incompatible with llama index
numpy<2.0.0 # temporarily avoid numpy 2.0.0
pandas>=2.1.0
tqdm
tiktoken>=0.7.0 # for counting token
openai>=1.0.0
rank_bm25 # for bm25 retrieval
pyyaml # for yaml file
pyarrow # for pandas with parquet
fastparquet # for pandas with parquet
sacrebleu # for bleu score
evaluate # for meteor and other scores
rouge_score # for rouge score
rich # for pretty logging
click # for cli
cohere>=5.8.0 # for cohere services
tokenlog>=0.0.2 # for token logging
aiohttp # for async http requests
voyageai # for voyageai reranker
mixedbread-ai # for mixedbread-ai reranker
llama-index-llms-bedrock
scikit-learn
emoji
### Vector DB ###
pymilvus>=2.3.0 # for using milvus vectordb
chromadb>=0.5.0 # for chroma vectordb
weaviate-client # for weaviate vectordb
pinecone[grpc] # for pinecone vectordb
couchbase # for couchbase vectordb
qdrant-client # for qdrant vectordb
### API server ###
quart
pyngrok
### LlamaIndex ###
llama-index>=0.11.0
llama-index-core==0.12.24
# readers
llama-index-readers-file
# Embeddings
llama-index-embeddings-openai
llama-index-embeddings-ollama
# LLMs
llama-index-llms-openai>=0.2.7
llama-index-llms-openai-like
# Retriever
llama-index-retrievers-bm25
# WebUI
streamlit
gradio
### Langchain ###
langchain-core>=0.3.0
langchain-unstructured>=0.1.5
langchain-upstage
langchain-community>=0.3.0
# autorag dashboard
panel
seaborn
ipykernel
ipywidgets
ipywidgets_bokeh
# added libraries - 김용연
llama-index-llms-ollama
llama-index-embeddings-huggingface