diff --git a/ontoaligner/pipeline.py b/ontoaligner/pipeline.py
index 8a399c5..8e4c3f0 100644
--- a/ontoaligner/pipeline.py
+++ b/ontoaligner/pipeline.py
@@ -1,28 +1,43 @@
+"""
+Ontology Alignment Pipeline. Supports various methods such as lightweight matching, retriever-based matching,
+LLM-based matching, and RAG (Retrieval-Augmented Generation) techniques.
+"""
 import json
 from pathlib import Path
+from tqdm import tqdm
 from torch.utils.data import DataLoader
 from torch.utils.data import Dataset
-from typing import Any
+from typing import Any, Dict
+from sklearn.linear_model import LogisticRegression
 
-# Import necessary modules from the ontoaligner library
 from ontoaligner.base import BaseEncoder, BaseOMModel, OMDataset
-from ontoaligner.encoder import ConceptLightweightEncoder, ConceptLLMEncoder
+from ontoaligner.encoder import ConceptLightweightEncoder, ConceptLLMEncoder, ConceptRAGEncoder, ConceptParentFewShotEncoder
 from ontoaligner.utils import metrics, xmlify
 from ontoaligner.ontology_matchers import SimpleFuzzySMLightweight, SBERTRetrieval, AutoModelDecoderLLM, ConceptLLMDataset
-from ontoaligner.postprocess import retriever_postprocessor, llm_postprocessor
-
+from ontoaligner.postprocess import retriever_postprocessor, llm_postprocessor, rag_hybrid_postprocessor, TFIDFLabelMapper, LabelMapper
 
 class OntoAlignerPipeline:
     """
-    A pipeline for performing ontology alignment tasks using various methods and models.
+    A pipeline for performing ontology alignment tasks using various methods and models.
     """
 
     def __init__(self, task_class: OMDataset, source_ontology_path: str, target_ontology_path: str,
-                 reference_matching_path: str, output_path: str ="results", output_format: str ="xml"):
+                 reference_matching_path: str, output_dir: str = "results", output_format: str = "xml"):
+        """
+        Initializes the OntoAlignerPipeline.
+
+        Parameters:
+            task_class (OMDataset): Class responsible for handling ontology matching tasks.
+            source_ontology_path (str): Path to the source ontology file.
+            target_ontology_path (str): Path to the target ontology file.
+            reference_matching_path (str): Path to the reference alignments.
+            output_dir (str, optional): Directory to save results. Defaults to "results".
+            output_format (str, optional): Format of output files. Defaults to "xml".
+ """ self.task_class = task_class self.source_ontology_path = source_ontology_path self.target_ontology_path = target_ontology_path self.reference_matching_path = reference_matching_path - self.output_path = Path(output_path) + self.output_dir = Path(output_dir) self.output_format = output_format.lower() self.task = self._initialize_task() self.dataset = self._collect_dataset() @@ -49,9 +64,12 @@ def _collect_dataset(self): reference_matching_path=self.reference_matching_path ) - def __call__(self, method: str, encoder_model: BaseEncoder =None, model_class: BaseOMModel=None, dataset_class:Dataset =None, postprocessor: Any=None, - llm_path: str=None, retriever_path: str=None, device: str="cuda", batch_size: int=2048, max_length: int=300, max_new_tokens: int=10, - top_k: int=10, fuzzy_sm_threshold: float=0.2, evaluate: bool=True, return_matching: bool=False): + def __call__(self, method: str, encoder_model: BaseEncoder = None, model_class: BaseOMModel = None, dataset_class: Dataset = None, postprocessor: Any = None, + llm_path: str = None, retriever_path: str = None, device: str = "cuda", batch_size: int = 2048, max_length: int = 300, max_new_tokens: int = 10, + top_k: int = 10, fuzzy_sm_threshold: float = 0.2, evaluate: bool = False, return_matching: bool = True, output_file_name: str = "matchings", + save_matchings: bool = False, ir_threshold: float = 0.5, llm_threshold: float = 0.5, llm_mapper: LabelMapper = None, llm_mapper_interested_class: str = 'yes', + answer_set: Dict = {"yes": ["yes", "true"], "no": ["no", "false"]}, huggingface_access_token: str = "", openai_key: str = "", device_map: str = "auto", + positive_ratio: float = 0.7, n_shots: int = 5) -> [Any, Any]: """ Executes the ontology alignment process using the specified method. @@ -69,116 +87,178 @@ def __call__(self, method: str, encoder_model: BaseEncoder =None, model_class: max_new_tokens (int, optional): Maximum tokens to generate for LLM-based methods. Defaults to 10. top_k (int, optional): Number of top matches to retrieve in the retriever method. Defaults to 10. fuzzy_sm_threshold (float, optional): Threshold for fuzzy matching in lightweight methods. Defaults to 0.2. - evaluate (bool, optional): Whether to evaluate the matching results. Defaults to True. - return_matching (bool, optional): Whether to return the matching results. Defaults to False. + evaluate (bool, optional): Whether to evaluate the matching results. Defaults to False. + return_matching (bool, optional): Whether to return the matching results. Defaults to True. + output_file_name (str, optional): Output file name without file type. Defaults to "matchings". + save_matchings (bool, optional): Whether to save the matching results. Defaults to False. + ir_threshold (float, optional): Retrieval postprocessor threshold. + llm_threshold (float, optional): LLM postprocessor threshold. + llm_mapper (LabelMapper, optional): Mapper for LLM outputs. + llm_mapper_interested_class (str, optional): Class to filter output pairs in LLM postprocessing. + answer_set (dict, optional): Mapping of yes/no answers. Defaults to {"yes": ["yes", "true"], "no": ["no", "false"]}. + huggingface_access_token (str, optional): Access token for Hugging Face models. Defaults to "". + openai_key (str, optional): API key for OpenAI models. Defaults to "". + device_map (str, optional): Device map for model allocation. Defaults to "auto". + positive_ratio (float, optional): Ratio of positive examples in few-shot methods. Defaults to 0.7. 
+            n_shots (int, optional): Number of shots for few-shot learning. Defaults to 5.
 
         Returns:
             dict or None: Evaluation report if `evaluate` is True. Matching results if `return_matching` is True.
         """
         if method == "lightweight":
-            return self._run_lightweight(encoder_model or ConceptLightweightEncoder(), model_class or SimpleFuzzySMLightweight,
-                                         postprocessor, fuzzy_sm_threshold, evaluate, return_matching)
-        elif method == "retriever":
-            return self._run_retriever(encoder_model or ConceptLightweightEncoder(), model_class or SBERTRetrieval,
-                                       postprocessor or retriever_postprocessor, retriever_path, top_k, evaluate, return_matching)
+            matchings = self._run_lightweight(encoder_model or ConceptLightweightEncoder(), model_class or SimpleFuzzySMLightweight,
+                                              postprocessor, fuzzy_sm_threshold)
+        elif method == "retrieval":
+            matchings = self._run_retriever(encoder_model or ConceptLightweightEncoder(), model_class or SBERTRetrieval, postprocessor or retriever_postprocessor,
+                                            retriever_path, device, top_k, ir_threshold)
         elif method == "llm":
-            return self._run_llm(encoder_model or ConceptLLMEncoder(), model_class or AutoModelDecoderLLM, dataset_class or ConceptLLMDataset,
-                                 postprocessor or llm_postprocessor, llm_path, device, batch_size, max_length, max_new_tokens, evaluate, return_matching)
-        elif method == 'rag':
-            return self._run_rag()
-        elif method == 'fewshot':
-            return self._run_fewshot_rag()
-        elif method == 'icv':
-            return self._run_icv_rag()
+            matchings = self._run_llm(encoder_model or ConceptLLMEncoder(), model_class or AutoModelDecoderLLM, dataset_class or ConceptLLMDataset,
+                                      postprocessor or llm_postprocessor, llm_mapper or TFIDFLabelMapper(classifier=LogisticRegression(), ngram_range=(1, 1)),
+                                      llm_mapper_interested_class, llm_path, device, batch_size, max_length, max_new_tokens, llm_threshold)
+        elif 'rag' in method:
+            retriever_config = {"device": device, "top_k": top_k, "threshold": ir_threshold, "openai_key": openai_key}
+            llm_config = {"device": device, "batch_size": batch_size, "answer_set": answer_set, "huggingface_access_token": huggingface_access_token,
+                          "max_length": max_length, "max_new_tokens": max_new_tokens, "openai_key": openai_key, "device_map": device_map}
+            rag_config = {"retriever_config": retriever_config, "llm_config": llm_config}
+            if method == 'fewshot-rag':
+                rag_config['n_shots'] = n_shots
+                rag_config['positive_ratio'] = positive_ratio
+                encoder_model = encoder_model or ConceptParentFewShotEncoder()
+            else:
+                encoder_model = encoder_model or ConceptRAGEncoder()
+            matchings = self._run_rag(method, encoder_model, model_class, postprocessor or rag_hybrid_postprocessor,
+                                      llm_threshold, ir_threshold, retriever_path, llm_path, rag_config)
        else:
             raise ValueError(f"Unknown method: {method}")
+        return self._process_results(matchings, method, evaluate, return_matching, output_file_name, save_matchings)
 
-    def _run_lightweight(self, encoder_model, model_class, postprocessor, fuzzy_sm_threshold, evaluate, return_matching):
+    def _run_lightweight(self, encoder_model, model_class, postprocessor, fuzzy_sm_threshold):
         """
-        Runs the lightweight ontology alignment method.
+        Executes the lightweight ontology alignment method.
+
+        This method uses a lightweight matching model to generate ontology matchings
+        based on encoded source and target ontologies. Optionally, a postprocessor
+        is applied to refine the matching results.
 
         Parameters:
-            encoder_model (BaseEncoder): Encoder model for encoding ontologies.
-            model_class (BaseOMModel): Model class for lightweight matching.
-            postprocessor (Any): Post-processing function.
-            fuzzy_sm_threshold (float): Threshold for fuzzy matching.
-            evaluate (bool): Whether to evaluate the results.
-            return_matching (bool): Whether to return the matching results.
+            encoder_model (BaseEncoder): Encoder model to encode the source and target ontologies.
+            model_class (BaseOMModel): A class implementing the lightweight matching logic.
+            postprocessor (callable or None): A function to refine the matching results. Optional.
+            fuzzy_sm_threshold (float): Threshold value for fuzzy similarity matching in the model.
 
         Returns:
-            dict or None: Evaluation report if `evaluate` is True. Matching results if `return_matching` is True.
+            dict: The resulting matchings after encoding and processing.
         """
         encoder_output = encoder_model(source=self.dataset['source'], target=self.dataset['target'])
         model = model_class(fuzzy_sm_threshold=fuzzy_sm_threshold)
         matchings = model.generate(input_data=encoder_output)
         if postprocessor:
             matchings = postprocessor(matchings)
-        return self._process_results(matchings, "lightweight", evaluate, return_matching)
+        return matchings
 
-    def _run_retriever(self, encoder_model, model_class, postprocessor, retriever_path, top_k, evaluate, return_matching):
+    def _run_retriever(self, encoder_model, model_class, postprocessor, retriever_path, device, top_k, ir_threshold):
         """
-        Runs the retriever-based ontology alignment method.
+        Executes the retriever-based ontology alignment method.
+
+        This method leverages a retriever model to identify top-k potential matches
+        between ontologies based on their encoded representations. The results are
+        refined using a postprocessor.
 
         Parameters:
-            encoder_model (BaseEncoder): Encoder model for encoding ontologies.
-            model_class (BaseOMModel): Model class for retriever-based matching.
-            postprocessor (Any): Post-processing function.
-            retriever_path (str): Path to the retriever model.
-            top_k (int): Number of top matches to retrieve.
-            evaluate (bool): Whether to evaluate the results.
-            return_matching (bool): Whether to return the matching results.
+            encoder_model (BaseEncoder): Encoder model to encode the source and target ontologies.
+            model_class (BaseOMModel): A class implementing the retriever-based matching logic.
+            postprocessor (callable): A function to refine the matching results.
+            retriever_path (str): File path to the pretrained retriever model.
+            device (str): The computational device (e.g., 'cpu' or 'cuda').
+            top_k (int): Number of top candidate matches to retrieve.
+            ir_threshold (float): Threshold for the postprocessor to filter results.
 
         Returns:
-            dict or None: Evaluation report if `evaluate` is True. Matching results if `return_matching` is True.
+            dict: The resulting matchings after encoding, retrieval, and processing.
""" encoder_output = encoder_model(source=self.dataset['source'], target=self.dataset['target']) - model = model_class(device='cpu', top_k=top_k) + model = model_class(device=device, top_k=top_k) model.load(path=retriever_path) matchings = model.generate(input_data=encoder_output) - matchings = postprocessor(matchings) - return self._process_results(matchings, "retriever", evaluate, return_matching) - + matchings = postprocessor(matchings, threshold=ir_threshold) + return matchings - def _run_llm(self, encoder_model, model_class, dataset_class, postprocessor, llm_path, - device, batch_size, max_length, max_new_tokens, evaluate, return_matching): + def _run_llm(self, encoder_model, model_class, dataset_class, postprocessor, llm_mapper, + llm_mapper_interested_class, + llm_path, device, batch_size, max_length, max_new_tokens, llm_threshold): """ - Runs the LLM-based ontology alignment method. + Executes the LLM-based ontology alignment method. + + This method uses a large language model (LLM) to generate matching predictions + based on a dataset constructed from the encoded ontologies. The results are + postprocessed to align with the desired format and filtering criteria. Parameters: - encoder_model (BaseEncoder): Encoder model for encoding ontologies. - model_class (BaseOMModel): Model class for LLM-based matching. - dataset_class (Dataset): Dataset class for LLM-based methods. - postprocessor (Any): Post-processing function. - llm_path (str): Path to the LLM model. - device (str): Device to use for computation. - batch_size (int): Batch size for LLM-based methods. - max_length (int): Maximum input length for LLM-based methods. - max_new_tokens (int): Maximum tokens to generate. - evaluate (bool): Whether to evaluate the results. - return_matching (bool): Whether to return the matching results. + encoder_model (BaseEncoder): Encoder model to encode the source and target ontologies. + model_class (BaseOMModel): A class implementing LLM-based matching logic. + dataset_class (Dataset): A class to construct datasets for LLM-based methods. + postprocessor (callable): A function to refine the matching results. + llm_mapper (LabelMapper): A mapper to process LLM outputs into matchings. + llm_mapper_interested_class (str): Specific class of matchings to filter in the results. + llm_path (str): File path to the pretrained LLM model. + device (str): The computational device (e.g., 'cpu' or 'cuda'). + batch_size (int): Number of samples to process in each batch. + max_length (int): Maximum input sequence length for the LLM. + max_new_tokens (int): Maximum tokens to generate for each sequence. + llm_threshold (float): Threshold for the postprocessor to filter results. Returns: - dict or None: Evaluation report if `evaluate` is True. Matching results if `return_matching` is True. + dict: The resulting matchings after encoding, LLM generation, and processing. 
""" encoder_output = encoder_model(source=self.dataset['source'], target=self.dataset['target']) llm_dataset = dataset_class(source_onto=encoder_output[0], target_onto=encoder_output[1]) dataloader = DataLoader(llm_dataset, batch_size=batch_size, shuffle=False, collate_fn=llm_dataset.collate_fn) model = model_class(device=device, max_length=max_length, max_new_tokens=max_new_tokens) model.load(path=llm_path) - matchings = model.generate(input_data=dataloader) - matchings = postprocessor(matchings) - return self._process_results(matchings, "llm", evaluate, return_matching) - def _run_rag(self): - return + matchings = [] + for batch in tqdm(dataloader): + sequences = model.generate(batch["prompts"]) + matchings.extend(sequences) + + matchings = postprocessor(predicts=matchings, mapper=llm_mapper, dataset=llm_dataset, + interested_class=llm_mapper_interested_class) + return matchings - def _run_fewshot_rag(self): - return + def _run_rag(self, method, encoder_model, model_class, postprocessor, llm_threshold, ir_threshold, retriever_path, + llm_path, rag_config): + """ + Executes the RAG (Retriever-Augmented Generation) ontology alignment method. + + This method combines retriever-based and LLM-based techniques to generate + ontology matchings. A retriever identifies candidate matches, and an LLM + refines the results. The final matchings are postprocessed to meet thresholds. - def _run_icv_rag(self): - return + Parameters: + method (str): Specific RAG method to use (e.g., 'icv-rag', 'fewshot-rag'). + encoder_model (BaseEncoder): Encoder model to encode the ontologies. + model_class (BaseOMModel): A class implementing RAG-based matching logic. + postprocessor (callable): A function to refine the matching results. + llm_threshold (float): Confidence threshold for the LLM-based predictions. + ir_threshold (float): Score threshold for the retriever results. + retriever_path (str): File path to the retriever model. + llm_path (str): File path to the LLM model. + rag_config (dict): Configuration parameters for the RAG model. - def _process_results(self, matchings, method, evaluate, return_matching): + Returns: + dict: The resulting matchings after encoding, RAG generation, and processing. + """ + encoder_output = encoder_model(source=self.dataset['source'], + target=self.dataset['target'], + reference=self.dataset[ + 'reference'] if method == 'icv-rag' or method == 'fewshot-rag' else None) + model = model_class(**rag_config) + model.load(llm_path=llm_path, ir_path=retriever_path) + matchings = model.generate(input_data=encoder_output) + matchings, _ = postprocessor(matchings, ir_score_threshold=ir_threshold, llm_confidence_th=llm_threshold) + return matchings + + def _process_results(self, matchings, method, evaluate, return_matching, output_file_name, save_matchings): """ Processes and evaluates the matching results. @@ -187,29 +267,38 @@ def _process_results(self, matchings, method, evaluate, return_matching): method (str): The method used for alignment. evaluate (bool): Whether to evaluate the results. return_matching (bool): Whether to return the matching results. + output_file_name (str): Output file name. + save_matchings (bool, optional): Whether to save the matching in results or not. Returns: dict or None: Evaluation report if `evaluate` is True. Matching results if `return_matching` is True. 
""" - output_dir = self.output_path / method - output_dir.mkdir(parents=True, exist_ok=True) - + output_matches = None if self.output_format == "xml": xml_str = xmlify.xml_alignment_generator(matchings=matchings) - with open(output_dir / "matchings.xml", "w", encoding="utf-8") as xml_file: - xml_file.write(xml_str) + output_matches = xml_str elif self.output_format == "json": - with open(output_dir / "matchings.json", "w", encoding="utf-8") as json_file: - json.dump(matchings, json_file, indent=4, ensure_ascii=False) + output_matches = matchings else: raise ValueError("Unsupported output format") + if save_matchings: + output_dir = self.output_dir / method + output_dir.mkdir(parents=True, exist_ok=True) + if self.output_format == "xml": + with open(output_dir / f"{output_file_name}.xml", "w", encoding="utf-8") as xml_file: + xml_file.write(output_matches) + elif self.output_format == "json": + with open(output_dir / f"{output_file_name}.json", "w", encoding="utf-8") as json_file: + json.dump(output_matches, json_file, indent=4, ensure_ascii=False) + evaluation = None if evaluate: evaluation = metrics.evaluation_report(predicts=matchings, references=self.dataset['reference']) - print(f"{method.capitalize()} Evaluation Report:", json.dumps(evaluation, indent=4)) if return_matching: - return matchings - - return evaluation + if evaluate: + return matchings, evaluation + return output_matches + if evaluate: + return evaluation