From dbbd4f5f08e3c823b3d549f5b166918e15d120b7 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 15 Nov 2024 02:31:20 -0800
Subject: [PATCH 01/42] Initial commit for RAG pipeline scripts

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/.gitignore    |  12 +
 .../ml_commons/rag_pipeline/rag/ingest.py     | 194 +++++++
 .../rag_pipeline/rag/opensearch_class.py      | 127 +++++
 .../ml_commons/rag_pipeline/rag/query.py      | 187 +++++++
 .../ml_commons/rag_pipeline/rag/rag.py        |  69 +++
 .../ml_commons/rag_pipeline/rag/rag_setup.py  | 486 ++++++++++++++++++
 .../rag_pipeline/rag/requirements.txt         |   9 +
 .../ml_commons/rag_pipeline/rag/setup.py      |  15 +
 8 files changed, 1099 insertions(+)
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_class.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
 create mode 100755 opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/requirements.txt
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore b/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
new file mode 100644
index 00000000..801d43ba
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
@@ -0,0 +1,12 @@
+# Ignore data and ingestion directories
+ml_commons/rag_pipeline/data/
+ml_commons/rag_pipeline/ingestion/
+ml_commons/rag_pipeline/rag/config.ini
+# Ignore virtual environment
+.venv/
+# Or, specify the full path
+/Users/hmumtazz/.cursor-tutor/opensearch-py-ml/.venv/
+
+# Ignore Python cache files
+__pycache__/
+*.pyc
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
new file mode 100644
index 00000000..9bcfb316
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -0,0 +1,194 @@
+# ingest_class.py
+
+import os
+import glob
+import json
+import tiktoken
+from tqdm import tqdm
+from colorama import Fore, Style, init
+from typing import List, Dict
+import csv
+import PyPDF2
+import boto3
+import botocore
+import time
+import random
+
+
+from opensearch_class import OpenSearchClass
+
+init(autoreset=True)  # Initialize colorama
+
+class IngestClass:
+    EMBEDDING_MODEL_ID = 'amazon.titan-embed-text-v1'
+
+    def __init__(self, config):
+        self.config = config
+        self.aws_region = config.get('region')
+        self.index_name = config.get('index_name')
+        self.bedrock_client = None
+        self.opensearch = OpenSearchClass(config)
+
+    def initialize_clients(self):
+        try:
+            self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
+            if self.opensearch.initialize_opensearch_client():
+                print("Clients initialized successfully.")
+                return True
+            else:
+                print("Failed to initialize OpenSearch client.")
+                return False
+        except Exception as e:
+            print(f"Failed to initialize clients: {e}")
+            return False
+
+    def process_file(self, file_path: str) -> List[Dict[str, str]]:
+        _, file_extension = os.path.splitext(file_path)
+        
+        if file_extension.lower() == '.csv':
+            return self.process_csv(file_path)
+        elif file_extension.lower() == '.txt':
+            return self.process_txt(file_path)
+        elif file_extension.lower() == '.pdf':
+            return self.process_pdf(file_path)
+        else:
+            print(f"Unsupported file type: {file_extension}")
+            return []
+
+    def process_csv(self, file_path: str) -> List[Dict[str, str]]:
+        documents = []
+        with open(file_path, 'r') as csvfile:
+            reader = csv.DictReader(csvfile)
+            for row in reader:
+                text = f"{row['name']} got nominated under the category, {row['category']}, for the film {row['film']}"
+                if row.get('winner', '').lower() != 'true':
+                    text += " but did not win"
+                documents.append({"text": text})
+        return documents
+
+    def process_txt(self, file_path: str) -> List[Dict[str, str]]:
+        with open(file_path, 'r') as txtfile:
+            content = txtfile.read()
+        return [{"text": content}]
+
+    def process_pdf(self, file_path: str) -> List[Dict[str, str]]:
+        documents = []
+        with open(file_path, 'rb') as pdffile:
+            pdf_reader = PyPDF2.PdfReader(pdffile)
+            for page in pdf_reader.pages:
+                extracted_text = page.extract_text()
+                if extracted_text:  # Ensure that text was extracted
+                    documents.append({"text": extracted_text})
+        return documents
+
+    def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
+        if self.bedrock_client is None:
+            print("Bedrock client is not initialized. Please run setup first.")
+            return None
+        
+        delay = initial_delay
+        for attempt in range(max_retries):
+            try:
+                payload = {"inputText": text}
+                response = self.bedrock_client.invoke_model(modelId=self.EMBEDDING_MODEL_ID, body=json.dumps(payload))
+                response_body = json.loads(response['body'].read())
+                embedding = response_body.get('embedding')
+                if embedding is None:
+                    print(f"No embedding returned for text: {text}")
+                    print(f"Response body: {response_body}")
+                    return None
+                return embedding
+            except botocore.exceptions.ClientError as e:
+                error_code = e.response['Error']['Code']
+                error_message = e.response['Error']['Message']
+                print(f"ClientError on attempt {attempt + 1}: {error_code} - {error_message}")
+                if error_code == 'ThrottlingException':
+                    if attempt == max_retries - 1:
+                        raise
+                    time.sleep(delay + random.uniform(0, 1))
+                    delay *= backoff_factor
+                else:
+                    raise
+            except Exception as ex:
+                print(f"Unexpected error on attempt {attempt + 1}: {ex}")
+                if attempt == max_retries - 1:
+                    raise
+        return None
+
+    def process_and_ingest_data(self, file_paths: List[str]):
+        if not self.initialize_clients():
+            print("Failed to initialize clients. Aborting ingestion.")
+            return
+
+        all_documents = []
+        for file_path in file_paths:
+            print(f"Processing file: {file_path}")
+            documents = self.process_file(file_path)
+            all_documents.extend(documents)
+        
+        total_documents = len(all_documents)
+        print(f"Total documents to process: {total_documents}")
+        
+        print("Generating embeddings for the documents...")
+        success_count = 0
+        error_count = 0
+        with tqdm(total=total_documents, bar_format='{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}]') as pbar:
+            for doc in all_documents:
+                try:
+                    embedding = self.text_embedding(doc['text'])
+                    if embedding is not None:
+                        doc['embedding'] = embedding
+                        success_count += 1
+                    else:
+                        error_count += 1
+                        print(f"{Fore.RED}Error generating embedding for document: {doc['text'][:50]}...{Style.RESET_ALL}")
+                except Exception as e:
+                    error_count += 1
+                    print(f"{Fore.RED}Error processing document: {str(e)}{Style.RESET_ALL}")
+                pbar.update(1)
+                pbar.set_postfix({'Success': success_count, 'Errors': error_count})
+        
+        print(f"\n{Fore.GREEN}Documents with successful embeddings: {success_count}{Style.RESET_ALL}")
+        print(f"{Fore.RED}Documents with failed embeddings: {error_count}{Style.RESET_ALL}")
+        
+        if success_count == 0:
+            print(f"{Fore.RED}No documents to ingest. Aborting ingestion.{Style.RESET_ALL}")
+            return
+        
+        print(f"{Fore.YELLOW}Ingesting data into OpenSearch...{Style.RESET_ALL}")
+        actions = []
+        for doc in all_documents:
+            if 'embedding' in doc and doc['embedding'] is not None:
+                action = {
+                    "_index": self.index_name,
+                    "_source": {
+                        "nominee_text": doc['text'],
+                        "nominee_vector": doc['embedding']
+                    }
+                }
+                actions.append(action)
+        
+        success, failed = self.opensearch.bulk_index(actions)
+        print(f"{Fore.GREEN}Successfully ingested {success} documents.{Style.RESET_ALL}")
+        print(f"{Fore.RED}Failed to ingest {failed} documents.{Style.RESET_ALL}")
+
+    def ingest_command(self, paths: List[str]):
+        all_files = []
+        for path in paths:
+            if os.path.isfile(path):
+                all_files.append(path)
+            elif os.path.isdir(path):
+                all_files.extend(glob.glob(os.path.join(path, '*')))
+            else:
+                print(f"{Fore.YELLOW}Invalid path: {path}{Style.RESET_ALL}")
+        
+        supported_extensions = ['.csv', '.txt', '.pdf']
+        valid_files = [f for f in all_files if any(f.lower().endswith(ext) for ext in supported_extensions)]
+        
+        if not valid_files:
+            print(f"{Fore.RED}No valid files found for ingestion.{Style.RESET_ALL}")
+            return
+        
+        print(f"{Fore.GREEN}Found {len(valid_files)} valid files for ingestion.{Style.RESET_ALL}")
+        
+        self.process_and_ingest_data(valid_files)
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_class.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_class.py
new file mode 100644
index 00000000..eca4619c
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_class.py
@@ -0,0 +1,127 @@
+# opensearch_class.py
+
+from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth, exceptions as opensearch_exceptions
+import boto3
+from urllib.parse import urlparse
+from opensearchpy import helpers as opensearch_helpers
+
+class OpenSearchClass:
+    def __init__(self, config):
+        self.config = config
+        self.opensearch_client = None
+        self.aws_region = config.get('region')
+        self.index_name = config.get('index_name')
+        self.is_serverless = config.get('is_serverless', 'False') == 'True'
+        self.opensearch_endpoint = config.get('opensearch_endpoint')
+        self.opensearch_username = config.get('opensearch_username')
+        self.opensearch_password = config.get('opensearch_password')
+
+    def initialize_opensearch_client(self):
+        if not self.opensearch_endpoint:
+            print("OpenSearch endpoint not set. Please run setup first.")
+            return False
+        
+        parsed_url = urlparse(self.opensearch_endpoint)
+        host = parsed_url.hostname
+        port = parsed_url.port or 443
+
+        if self.is_serverless:
+            credentials = boto3.Session().get_credentials()
+            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
+        else:
+            if not self.opensearch_username or not self.opensearch_password:
+                print("OpenSearch username or password not set. Please run setup first.")
+                return False
+            auth = (self.opensearch_username, self.opensearch_password)
+
+        try:
+            self.opensearch_client = OpenSearch(
+                hosts=[{'host': host, 'port': port}],
+                http_auth=auth,
+                use_ssl=True,
+                verify_certs=True,
+                connection_class=RequestsHttpConnection,
+                pool_maxsize=20
+            )
+            print(f"Initialized OpenSearch client with host: {host} and port: {port}")
+            return True
+        except Exception as ex:
+            print(f"Error initializing OpenSearch client: {ex}")
+            return False
+
+    def create_index(self, embedding_dimension, space_type):
+        index_body = {
+            "mappings": {
+                "properties": {
+                    "nominee_text": {"type": "text"},
+                    "nominee_vector": {
+                        "type": "knn_vector",
+                        "dimension": embedding_dimension,
+                        "method": {
+                            "name": "hnsw",
+                            "space_type": space_type,
+                            "engine": "nmslib",
+                            "parameters": {"ef_construction": 512, "m": 16},
+                        },
+                    },
+                }
+            },
+            "settings": {
+                "index": {
+                    "number_of_shards": 2,
+                    "knn.algo_param": {"ef_search": 512},
+                    "knn": True,
+                }
+            },
+        }
+        try:
+            self.opensearch_client.indices.create(index=self.index_name, body=index_body)
+            print(f"KNN index '{self.index_name}' created successfully with dimension {embedding_dimension} and space type {space_type}.")
+        except opensearch_exceptions.RequestError as e:
+            if 'resource_already_exists_exception' in str(e).lower():
+                print(f"Index '{self.index_name}' already exists.")
+            else:
+                print(f"Error creating index '{self.index_name}': {e}")
+
+    def verify_and_create_index(self, embedding_dimension, space_type):
+        try:
+            index_exists = self.opensearch_client.indices.exists(index=self.index_name)
+            if index_exists:
+                print(f"KNN index '{self.index_name}' already exists.")
+            else:
+                self.create_index(embedding_dimension, space_type)
+            return True
+        except Exception as ex:
+            print(f"Error verifying or creating index: {ex}")
+            return False
+
+    def bulk_index(self, actions):
+        try:
+            success, failed = opensearch_helpers.bulk(self.opensearch_client, actions)
+            print(f"Indexed {success} documents successfully. Failed to index {failed} documents.")
+            return success, failed
+        except Exception as e:
+            print(f"Error during bulk indexing: {e}")
+            return 0, len(actions)
+
+    def search(self, vector, k=5):
+        try:
+            response = self.opensearch_client.search(
+                index=self.index_name,
+                body={
+                    "size": k,
+                    "_source": ["nominee_text"],
+                    "query": {
+                        "knn": {
+                            "nominee_vector": {
+                                "vector": vector,
+                                "k": k
+                            }
+                        }
+                    }
+                }
+            )
+            return response['hits']['hits']
+        except Exception as e:
+            print(f"Error during search: {e}")
+            return []
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
new file mode 100644
index 00000000..d4305c90
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
@@ -0,0 +1,187 @@
+# query_class.py
+
+import json
+import tiktoken
+from colorama import Fore, Style, init
+from typing import List
+import boto3
+import botocore
+import time
+import random
+from opensearch_class import OpenSearchClass
+
+init(autoreset=True)  # Initialize colorama
+
+class QueryClass:
+    EMBEDDING_MODEL_ID = 'amazon.titan-embed-text-v1'
+    LLM_MODEL_ID = 'amazon.titan-text-express-v1'
+
+    def __init__(self, config):
+        self.config = config
+        self.aws_region = config.get('region')
+        self.index_name = config.get('index_name')
+        self.bedrock_client = None
+        self.opensearch = OpenSearchClass(config)
+
+    def initialize_clients(self):
+        try:
+            self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
+            if self.opensearch.initialize_opensearch_client():
+                print("Clients initialized successfully.")
+                return True
+            else:
+                print("Failed to initialize OpenSearch client.")
+                return False
+        except Exception as e:
+            print(f"Failed to initialize clients: {e}")
+            return False
+
+    def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
+        if self.bedrock_client is None:
+            print("Bedrock client is not initialized. Please run setup first.")
+            return None
+        
+        delay = initial_delay
+        for attempt in range(max_retries):
+            try:
+                payload = {"inputText": text}
+                response = self.bedrock_client.invoke_model(modelId=self.EMBEDDING_MODEL_ID, body=json.dumps(payload))
+                response_body = json.loads(response['body'].read())
+                embedding = response_body.get('embedding')
+                if embedding is None:
+                    print(f"No embedding returned for text: {text}")
+                    print(f"Response body: {response_body}")
+                    return None
+                return embedding
+            except botocore.exceptions.ClientError as e:
+                error_code = e.response['Error']['Code']
+                error_message = e.response['Error']['Message']
+                print(f"ClientError on attempt {attempt + 1}: {error_code} - {error_message}")
+                if error_code == 'ThrottlingException':
+                    if attempt == max_retries - 1:
+                        raise
+                    time.sleep(delay + random.uniform(0, 1))
+                    delay *= backoff_factor
+                else:
+                    raise
+            except Exception as ex:
+                print(f"Unexpected error on attempt {attempt + 1}: {ex}")
+                if attempt == max_retries - 1:
+                    raise
+        return None
+
+    def bulk_query(self, queries, k=5):
+        print("Generating embeddings for queries...")
+        query_vectors = []
+        for query in queries:
+            embedding = self.text_embedding(query)
+            if embedding:
+                query_vectors.append(embedding)
+            else:
+                print(f"{Fore.RED}Failed to generate embedding for query: {query}{Style.RESET_ALL}")
+                query_vectors.append(None)
+        
+        print("Performing bulk semantic search...")
+        results = []
+        for i, vector in enumerate(query_vectors):
+            if vector is None:
+                results.append({
+                    'query': queries[i],
+                    'context': "",
+                    'num_results': 0
+                })
+                continue
+            try:
+                hits = self.opensearch.search(vector, k)
+                context = '\n'.join([hit['_source']['nominee_text'] for hit in hits])
+                results.append({
+                    'query': queries[i],
+                    'context': context,
+                    'num_results': len(hits)
+                })
+            except Exception as ex:
+                print(f"{Fore.RED}Error performing search for query '{queries[i]}': {ex}{Style.RESET_ALL}")
+                results.append({
+                    'query': queries[i],
+                    'context': "",
+                    'num_results': 0
+                })
+        
+        return results
+
+    def generate_answer(self, prompt, config):
+        try:
+            max_input_tokens = 8192  # Max tokens for the model
+            expected_output_tokens = config.get('maxTokenCount', 1000)
+            encoding = tiktoken.get_encoding("cl100k_base")  # Use appropriate encoding
+
+            prompt_tokens = encoding.encode(prompt)
+            allowable_input_tokens = max_input_tokens - expected_output_tokens
+
+            if len(prompt_tokens) > allowable_input_tokens:
+                # Truncate the prompt to fit within the model's token limit
+                prompt_tokens = prompt_tokens[:allowable_input_tokens]
+                prompt = encoding.decode(prompt_tokens)
+                print(f"Prompt truncated to {allowable_input_tokens} tokens.")
+
+            # Simplified LLM config with only supported parameters
+            llm_config = {
+                'maxTokenCount': expected_output_tokens,
+                'temperature': config.get('temperature', 0.7),
+                'topP': config.get('topP', 1.0),
+                'stopSequences': config.get('stopSequences', [])
+            }
+
+            body = json.dumps({
+                'inputText': prompt,
+                'textGenerationConfig': llm_config
+            })
+            response = self.bedrock_client.invoke_model(modelId=self.LLM_MODEL_ID, body=body)
+            response_body = json.loads(response['body'].read())
+            results = response_body.get('results', [])
+            if not results:
+                print("No results returned from LLM.")
+                return None
+            answer = results[0].get('outputText', '').strip()
+            return answer
+        except Exception as ex:
+            print(f"Error generating answer from LLM: {ex}")
+            return None
+
+    def query_command(self, queries: List[str], num_results=5):
+        if not self.initialize_clients():
+            print("Failed to initialize clients. Aborting query.")
+            return
+        
+        results = self.bulk_query(queries, k=num_results)
+        
+        llm_config = {
+            "maxTokenCount": 1000,
+            "temperature": 0.7,
+            "topP": 0.9,
+            "stopSequences": []
+        }
+        
+        for result in results:
+            print(f"\nQuery: {result['query']}")
+            print(f"Found {result['num_results']} results.")
+            
+            if not result['context']:
+                print(f"{Fore.RED}No context available for this query.{Style.RESET_ALL}")
+                continue
+            
+            augmented_prompt = f"""Context: {result['context']}
+Based on the above context, please provide a detailed and insightful answer to the following question. Feel free to make reasonable inferences or connections if the context doesn't provide all the information:
+
+Question: {result['query']}
+
+Answer:"""
+        
+            print("Generating answer using LLM...")
+            answer = self.generate_answer(augmented_prompt, llm_config)
+        
+            if answer:
+                print("Generated Answer:")
+                print(answer)
+            else:
+                print("Failed to generate an answer.")
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
new file mode 100755
index 00000000..80f57875
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
@@ -0,0 +1,69 @@
+#!/usr/bin/env python3
+
+"""
+Main CLI script for OpenSearch with Bedrock Integration
+"""
+
+import argparse
+import configparser
+from rag_setup import SetupClass
+from ingest import IngestClass
+from query import QueryClass
+
+CONFIG_FILE = 'config.ini'
+
+def load_config():
+    config = configparser.ConfigParser()
+    config.read(CONFIG_FILE)
+    return config['DEFAULT']
+
+def save_config(config):
+    parser = configparser.ConfigParser()
+    parser['DEFAULT'] = config
+    with open(CONFIG_FILE, 'w') as f:
+        parser.write(f)
+    
+def main():
+    parser = argparse.ArgumentParser(description="RAG Pipeline CLI")
+    parser.add_argument('command', choices=['setup', 'ingest', 'query'], help='Command to run')
+    parser.add_argument('--paths', nargs='+', help='Paths to files or directories for ingestion')
+    parser.add_argument('--queries', nargs='+', help='Query texts for search and answer generation')
+    parser.add_argument('--num_results', type=int, default=5, help='Number of top results to retrieve for each query')
+
+    args = parser.parse_args()
+
+    config = load_config()
+
+    if args.command == 'setup':
+        setup = SetupClass()
+        setup.setup_command()
+        save_config(setup.config)
+    elif args.command == 'ingest':
+        if not args.paths:
+            paths = []
+            while True:
+                path = input("Enter a file or directory path (or press Enter to finish): ")
+                if not path:
+                    break
+                paths.append(path)
+        else:
+            paths = args.paths
+        ingest = IngestClass(config)
+        ingest.ingest_command(paths)
+    elif args.command == 'query':
+        if not args.queries:
+            queries = []
+            while True:
+                query = input("Enter a query (or press Enter to finish): ")
+                if not query:
+                    break
+                queries.append(query)
+        else:
+            queries = args.queries
+        query = QueryClass(config)
+        query.query_command(queries, num_results=args.num_results)
+    else:
+        parser.print_help()
+
+if __name__ == "__main__":
+    main()
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
new file mode 100644
index 00000000..47c03b9e
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -0,0 +1,486 @@
+# setup_class.py
+import boto3
+import botocore
+from botocore.config import Config
+import configparser
+import subprocess
+import os
+import json
+import time
+import termios
+import tty
+import sys
+from urllib.parse import urlparse
+from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth
+
+class SetupClass:
+    CONFIG_FILE = 'config.ini'
+    SERVICE_AOSS = 'opensearchserverless'
+    SERVICE_BEDROCK = 'bedrock-runtime'
+
+    def __init__(self):
+        self.aws_region = None
+        self.iam_principal = None
+        self.index_name = None
+        self.collection_name = None
+        self.opensearch_endpoint = None
+        self.is_serverless = None
+        self.opensearch_username = None
+        self.opensearch_password = None
+        self.aoss_client = None
+        self.bedrock_client = None
+        self.opensearch_client = None
+
+    def check_and_configure_aws(self):
+        try:
+            session = boto3.Session()
+            credentials = session.get_credentials()
+
+            if credentials is None:
+                print("AWS credentials are not configured.")
+                self.configure_aws()
+            else:
+                print("AWS credentials are already configured.")
+                reconfigure = input("Do you want to reconfigure? (yes/no): ").lower()
+                if reconfigure == 'yes':
+                    self.configure_aws()
+        except Exception as e:
+            print(f"An error occurred while checking AWS credentials: {e}")
+            self.configure_aws()
+
+    def configure_aws(self):
+        print("Let's configure your AWS credentials.")
+
+        aws_access_key_id = input("Enter your AWS Access Key ID: ")
+        aws_secret_access_key = input("Enter your AWS Secret Access Key: ")
+        aws_region_input = input("Enter your preferred AWS region (e.g., us-west-2): ")
+
+        try:
+            subprocess.run([
+                'aws', 'configure', 'set', 
+                'aws_access_key_id', aws_access_key_id
+            ], check=True)
+            
+            subprocess.run([
+                'aws', 'configure', 'set', 
+                'aws_secret_access_key', aws_secret_access_key
+            ], check=True)
+            
+            subprocess.run([
+                'aws', 'configure', 'set', 
+                'region', aws_region_input
+            ], check=True)
+            
+            print("AWS credentials have been successfully configured.")
+        except subprocess.CalledProcessError as e:
+            print(f"An error occurred while configuring AWS credentials: {e}")
+        except Exception as e:
+            print(f"An unexpected error occurred: {e}")
+
+    def load_config(self):
+        config = configparser.ConfigParser()
+        if os.path.exists(self.CONFIG_FILE):
+            config.read(self.CONFIG_FILE)
+            return dict(config['DEFAULT'])
+        return {}
+
+
+    def save_config(self, config):
+        parser = configparser.ConfigParser()
+        parser['DEFAULT'] = config
+        with open(self.CONFIG_FILE, 'w') as f:
+            parser.write(f)
+
+    def get_password_with_asterisks(self, prompt="Enter password: "):  # Accept 'prompt'
+        import sys
+        if sys.platform == 'win32':
+            import msvcrt
+            print(prompt, end='', flush=True)
+            password = ""
+            while True:
+                key = msvcrt.getch()
+                if key == b'\r':  # Enter key
+                    sys.stdout.write('\n')
+                    return password
+                elif key == b'\x08':  # Backspace key
+                    if len(password) > 0:
+                        password = password[:-1]
+                        sys.stdout.write('\b \b')  # Erase the last asterisk
+                        sys.stdout.flush()
+                else:
+                    password += key.decode('utf-8')
+                    sys.stdout.write('*')  # Mask input with '*'
+                    sys.stdout.flush()
+        else:
+            import termios, tty
+            fd = sys.stdin.fileno()
+            old_settings = termios.tcgetattr(fd)
+            try:
+                tty.setraw(fd)
+                sys.stdout.write(prompt)
+                sys.stdout.flush()
+                password = ""
+                while True:
+                    ch = sys.stdin.read(1)
+                    if ch in ('\r', '\n'):  # Enter key
+                        sys.stdout.write('\n')
+                        return password
+                    elif ch == '\x7f':  # Backspace key
+                        if len(password) > 0:
+                            password = password[:-1]
+                            sys.stdout.write('\b \b')  # Erase the last asterisk
+                            sys.stdout.flush()
+                    else:
+                        password += ch
+                        sys.stdout.write('*')  # Mask input with '*'
+                        sys.stdout.flush()
+            finally:
+                termios.tcsetattr(fd, termios.TCSADRAIN, old_settings)
+
+    def setup_configuration(self):
+        config = self.load_config()
+
+        self.aws_region = input(f"Enter your AWS Region [{config.get('region', 'us-west-2')}]: ") or config.get('region', 'us-west-2')
+        self.iam_principal = input(f"Enter your IAM Principal ARN [{config.get('iam_principal', '')}]: ") or config.get('iam_principal', '')
+
+        service_type = input("Choose OpenSearch service type (1 for Serverless, 2 for Managed): ")
+        self.is_serverless = service_type == '1'
+
+        if self.is_serverless:
+            self.index_name = input("Enter a name for your KNN index in OpenSearch: ")
+            self.collection_name = input("Enter the name for your OpenSearch collection: ")
+            self.opensearch_endpoint = None
+            self.opensearch_username = None
+            self.opensearch_password = None
+        else:
+            self.index_name = input("Enter a name for your KNN index in OpenSearch: ")
+            self.opensearch_endpoint = input("Enter your OpenSearch domain endpoint: ")
+            self.opensearch_username = input("Enter your OpenSearch username: ")
+            self.opensearch_password = self.get_password_with_asterisks("Enter your OpenSearch password: ")
+            self.collection_name = ''
+
+        self.config = {
+            'region': self.aws_region,
+            'iam_principal': self.iam_principal,
+            'index_name': self.index_name,
+            'collection_name': self.collection_name if self.collection_name else '',
+            'is_serverless': str(self.is_serverless),
+            'opensearch_endpoint': self.opensearch_endpoint if self.opensearch_endpoint else '',
+            'opensearch_username': self.opensearch_username if self.opensearch_username else '',
+            'opensearch_password': self.opensearch_password if self.opensearch_password else ''
+        }
+        self.save_config(self.config)
+        print("Configuration saved successfully.")
+
+    def initialize_clients(self):
+        try:
+            boto_config = Config(
+                region_name=self.aws_region,
+                signature_version='v4',
+                retries={'max_attempts': 10, 'mode': 'standard'}
+            )
+            if self.is_serverless:
+                self.aoss_client = boto3.client(self.SERVICE_AOSS, config=boto_config)
+            self.bedrock_client = boto3.client(self.SERVICE_BEDROCK, region_name=self.aws_region)
+            
+            time.sleep(7)
+            print("AWS clients initialized successfully.")
+            return True
+        except Exception as e:
+            print(f"Failed to initialize AWS clients: {e}")
+            return False
+
+    def create_security_policies(self):
+        if not self.is_serverless:
+            print("Security policies are not applicable for managed OpenSearch domains.")
+            return
+        
+        encryption_policy = json.dumps({
+            "Rules": [{"Resource": [f"collection/{self.collection_name}"], "ResourceType": "collection"}],
+            "AWSOwnedKey": True
+        })
+        
+        network_policy = json.dumps([{
+            "Rules": [{"Resource": [f"collection/{self.collection_name}"], "ResourceType": "collection"}],
+            "AllowFromPublic": True
+        }])
+        
+        data_access_policy = json.dumps([{
+            "Rules": [
+                {"Resource": ["collection/*"], "Permission": ["aoss:*"], "ResourceType": "collection"},
+                {"Resource": ["index/*/*"], "Permission": ["aoss:*"], "ResourceType": "index"}
+            ],
+            "Principal": [self.iam_principal],
+            "Description": f"Data access policy for {self.collection_name}"
+        }])
+        
+        encryption_policy_name = self.get_truncated_name(f"{self.collection_name}-enc-policy")
+        self.create_security_policy("encryption", encryption_policy_name, f"{self.collection_name} encryption security policy", encryption_policy)
+        self.create_security_policy("network", f"{self.collection_name}-net-policy", f"{self.collection_name} network security policy", network_policy)
+        self.create_access_policy(self.get_truncated_name(f"{self.collection_name}-access-policy"), f"{self.collection_name} data access policy", data_access_policy)
+
+    def create_security_policy(self, policy_type, name, description, policy_body):
+        try:
+            if policy_type.lower() == "encryption":
+                self.aoss_client.create_security_policy(description=description, name=name, policy=policy_body, type="encryption")
+            elif policy_type.lower() == "network":
+                self.aoss_client.create_security_policy(description=description, name=name, policy=policy_body, type="network")
+            else:
+                raise ValueError("Invalid policy type specified.")
+            print(f"{policy_type.capitalize()} Policy '{name}' created successfully.")
+        except self.aoss_client.exceptions.ConflictException:
+            print(f"{policy_type.capitalize()} Policy '{name}' already exists.")
+        except Exception as ex:
+            print(f"Error creating {policy_type} policy '{name}': {ex}")
+
+    def create_access_policy(self, name, description, policy_body):
+        try:
+            self.aoss_client.create_access_policy(description=description, name=name, policy=policy_body, type="data")
+            print(f"Data Access Policy '{name}' created successfully.")
+        except self.aoss_client.exceptions.ConflictException:
+            print(f"Data Access Policy '{name}' already exists.")
+        except Exception as ex:
+            print(f"Error creating data access policy '{name}': {ex}")
+
+    def create_collection(self, collection_name, max_retries=3):
+        for attempt in range(max_retries):
+            try:
+                response = self.aoss_client.create_collection(
+                    description=f"{collection_name} collection",
+                    name=collection_name,
+                    type="VECTORSEARCH"
+                )
+                print(f"Collection '{collection_name}' creation initiated.")
+                return response['createCollectionDetail']['id']
+            except self.aoss_client.exceptions.ConflictException:
+                print(f"Collection '{collection_name}' already exists.")
+                return self.get_collection_id(collection_name)
+            except Exception as ex:
+                print(f"Error creating collection '{collection_name}' (Attempt {attempt+1}/{max_retries}): {ex}")
+                if attempt == max_retries - 1:
+                    return None
+                time.sleep(5)
+        return None
+
+    def get_collection_id(self, collection_name):
+        try:
+            response = self.aoss_client.list_collections()
+            for collection in response['collectionSummaries']:
+                if collection['name'] == collection_name:
+                    return collection['id']
+        except Exception as ex:
+            print(f"Error getting collection ID: {ex}")
+        return None
+
+    def wait_for_collection_active(self, collection_id, max_wait_minutes=30):
+        print(f"Waiting for collection '{self.collection_name}' to become active...")
+        start_time = time.time()
+        while time.time() - start_time < max_wait_minutes * 60:
+            try:
+                response = self.aoss_client.batch_get_collection(ids=[collection_id])
+                status = response['collectionDetails'][0]['status']
+                if status == 'ACTIVE':
+                    print(f"Collection '{self.collection_name}' is now active.")
+                    return True
+                elif status in ['FAILED', 'DELETED']:
+                    print(f"Collection creation failed or was deleted. Status: {status}")
+                    return False
+                else:
+                    print(f"Collection status: {status}. Waiting...")
+                    time.sleep(30)
+            except Exception as ex:
+                print(f"Error checking collection status: {ex}")
+                time.sleep(30)
+        print(f"Timed out waiting for collection to become active after {max_wait_minutes} minutes.")
+        return False
+
+    def get_collection_endpoint(self):
+        if not self.is_serverless:
+            return self.opensearch_endpoint
+        
+        try:
+            collection_id = self.get_collection_id(self.collection_name)
+            if not collection_id:
+                print(f"Collection '{self.collection_name}' not found.")
+                return None
+            
+            batch_get_response = self.aoss_client.batch_get_collection(ids=[collection_id])
+            collection_details = batch_get_response.get('collectionDetails', [])
+            
+            if not collection_details:
+                print(f"No details found for collection ID '{collection_id}'.")
+                return None
+            
+            self.opensearch_endpoint = collection_details[0].get('collectionEndpoint')
+            if self.opensearch_endpoint:
+                print(f"Collection '{self.collection_name}' has endpoint URL: {self.opensearch_endpoint}")
+                return self.opensearch_endpoint
+            else:
+                print(f"No endpoint URL found in collection '{self.collection_name}'.")
+                return None
+        except Exception as ex:
+            print(f"Error retrieving collection endpoint: {ex}")
+            return None
+
+    def initialize_opensearch_client(self):
+        if not self.opensearch_endpoint:
+            print("OpenSearch endpoint not set. Please run setup first.")
+            return False
+        
+        parsed_url = urlparse(self.opensearch_endpoint)
+        host = parsed_url.hostname
+        port = parsed_url.port or 443
+
+        if self.is_serverless:
+            credentials = boto3.Session().get_credentials()
+            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
+        else:
+            if not self.opensearch_username or not self.opensearch_password:
+                print("OpenSearch username or password not set. Please run setup first.")
+                return False
+            auth = (self.opensearch_username, self.opensearch_password)
+
+        try:
+            self.opensearch_client = OpenSearch(
+                hosts=[{'host': host, 'port': port}],
+                http_auth=auth,
+                use_ssl=True,
+                verify_certs=True,
+                connection_class=RequestsHttpConnection,
+                pool_maxsize=20
+            )
+            print(f"Initialized OpenSearch client with host: {host} and port: {port}")
+            return True
+        except Exception as ex:
+            print(f"Error initializing OpenSearch client: {ex}")
+            return False
+
+    def get_knn_index_details(self):
+        # Simplified dimension input
+        dimension_input = input("Press Enter to use the default embedding size (768), or type a custom size: ")
+        
+        if dimension_input.strip() == "":
+            embedding_dimension = 768
+        else:
+            try:
+                embedding_dimension = int(dimension_input)
+            except ValueError:
+                print("Invalid input. Using default dimension of 768.")
+                embedding_dimension = 768
+
+        print(f"\nEmbedding dimension set to: {embedding_dimension}")
+
+        # Space type selection
+        print("\nChoose the space type for KNN:")
+        print("1. L2 (Euclidean distance)")
+        print("2. Cosine similarity")
+        print("3. Inner product")
+        space_choice = input("Enter your choice (1-3), or press Enter for default (L2): ")
+
+        if space_choice == "" or space_choice == "1":
+            space_type = "l2"
+        elif space_choice == "2":
+            space_type = "cosinesimil"
+        elif space_choice == "3":
+            space_type = "innerproduct"
+        else:
+            print("Invalid choice. Using default space type of L2 (Euclidean distance).")
+            space_type = "l2"
+
+        print(f"Space type set to: {space_type}")
+
+        return embedding_dimension, space_type
+
+
+    def create_index(self, embedding_dimension, space_type):
+        index_body = {
+            "mappings": {
+                "properties": {
+                    "nominee_text": {"type": "text"},
+                    "nominee_vector": {
+                        "type": "knn_vector",
+                        "dimension": embedding_dimension,
+                        "method": {
+                            "name": "hnsw",
+                            "space_type": space_type,
+                            "engine": "nmslib",
+                            "parameters": {"ef_construction": 512, "m": 16},
+                        },
+                    },
+                }
+            },
+            "settings": {
+                "index": {
+                    "number_of_shards": 2,
+                    "knn.algo_param": {"ef_search": 512},
+                    "knn": True,
+                }
+            },
+        }
+        try:
+            self.opensearch_client.indices.create(index=self.index_name, body=index_body)
+            print(f"KNN index '{self.index_name}' created successfully with dimension {embedding_dimension} and space type {space_type}.")
+        except Exception as e:
+            if 'resource_already_exists_exception' in str(e).lower():
+                print(f"Index '{self.index_name}' already exists.")
+            else:
+                print(f"Error creating index '{self.index_name}': {e}")
+
+    def verify_and_create_index(self, embedding_dimension, space_type):
+        try:
+            index_exists = self.opensearch_client.indices.exists(index=self.index_name)
+            if index_exists:
+                print(f"KNN index '{self.index_name}' already exists.")
+            else:
+                self.create_index(embedding_dimension, space_type)
+            return True
+        except Exception as ex:
+            print(f"Error verifying or creating index: {ex}")
+            return False
+
+    def get_truncated_name(self, base_name, max_length=32):
+        if len(base_name) <= max_length:
+            return base_name
+        return base_name[:max_length-3] + "..."
+
+    def setup_command(self):
+        self.check_and_configure_aws()
+        self.setup_configuration()
+        
+        if not self.initialize_clients():
+            print("Failed to initialize AWS clients. Setup incomplete.")
+            return
+        
+        if self.is_serverless:
+            self.create_security_policies()
+            collection_id = self.get_collection_id(self.collection_name)
+            if not collection_id:
+                print(f"Collection '{self.collection_name}' not found. Attempting to create it...")
+                collection_id = self.create_collection(self.collection_name)
+            
+            if collection_id:
+                if self.wait_for_collection_active(collection_id):
+                    self.opensearch_endpoint = self.get_collection_endpoint()
+                    if not self.opensearch_endpoint:
+                        print("Failed to retrieve OpenSearch endpoint. Setup incomplete.")
+                        return
+                    else:
+                        self.config['opensearch_endpoint'] = self.opensearch_endpoint
+                else:
+                    print("Collection is not active. Setup incomplete.")
+                    return
+        else:
+            if not self.opensearch_endpoint:
+                print("OpenSearch endpoint not set. Setup incomplete.")
+                return
+        
+        if self.initialize_opensearch_client():
+            embedding_dimension, space_type = self.get_knn_index_details()
+            if self.verify_and_create_index(embedding_dimension, space_type):
+                print("Setup completed successfully.")
+                self.config['embedding_dimension'] = str(embedding_dimension)
+                self.config['space_type'] = space_type
+            else:
+                print("Index verification failed. Please check your index name and permissions.")
+        else:
+            print("Failed to initialize OpenSearch client. Setup incomplete.")
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/requirements.txt b/opensearch_py_ml/ml_commons/rag_pipeline/rag/requirements.txt
new file mode 100644
index 00000000..dc41b248
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/requirements.txt
@@ -0,0 +1,9 @@
+boto3
+opensearch-py
+pandas
+configparser
+PyPDF2
+tiktoken
+tqdm
+colorama
+requests_aws4auth
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py
new file mode 100644
index 00000000..b73dbcf5
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py
@@ -0,0 +1,15 @@
+from setuptools import setup, find_packages, find_namespace_packages
+
+
+
+
+setup(
+    name="rag_pipeline",
+    version="0.1.0",
+    packages=find_namespace_packages(include=['opensearch_py_ml', 'opensearch_py_ml.*']),
+    entry_points={
+        'console_scripts': [
+        'rag=opensearch_py_ml.ml_commons.rag_pipeline.rag:main',
+        ],
+    },
+)
\ No newline at end of file

From dc94feb1d66c343522a22056c6242c547cc77bf2 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Sun, 17 Nov 2024 17:50:30 -0800
Subject: [PATCH 02/42] Added Licence Header and fixed .gitingore file

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/.gitignore    |   3 +-
 .../ml_commons/rag_pipeline/rag/ingest.py     |  34 +++-
 .../rag_pipeline/rag/opensearch_connector.py  | 151 ++++++++++++++++++
 .../ml_commons/rag_pipeline/rag/query.py      |  33 +++-
 .../ml_commons/rag_pipeline/rag/rag.py        |  37 ++++-
 .../ml_commons/rag_pipeline/rag/rag_setup.py  |  28 +++-
 .../ml_commons/rag_pipeline/rag/setup.py      |  26 ++-
 7 files changed, 291 insertions(+), 21 deletions(-)
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore b/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
index 801d43ba..f5d53cbc 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
@@ -4,8 +4,7 @@ ml_commons/rag_pipeline/ingestion/
 ml_commons/rag_pipeline/rag/config.ini
 # Ignore virtual environment
 .venv/
-# Or, specify the full path
-/Users/hmumtazz/.cursor-tutor/opensearch-py-ml/.venv/
+
 
 # Ignore Python cache files
 __pycache__/
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
index 9bcfb316..e3c32a98 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -1,4 +1,27 @@
-# ingest_class.py
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
 
 import os
 import glob
@@ -15,19 +38,19 @@
 import random
 
 
-from opensearch_class import OpenSearchClass
+from opensearch_connector import OpenSearchConnector
 
 init(autoreset=True)  # Initialize colorama
 
-class IngestClass:
-    EMBEDDING_MODEL_ID = 'amazon.titan-embed-text-v1'
+class Ingest:
+    EMBEDDING_MODEL_ID = 'amazon.titan-embed-text-v2:0'
 
     def __init__(self, config):
         self.config = config
         self.aws_region = config.get('region')
         self.index_name = config.get('index_name')
         self.bedrock_client = None
-        self.opensearch = OpenSearchClass(config)
+        self.opensearch = OpenSearchConnector(config)
 
     def initialize_clients(self):
         try:
@@ -160,6 +183,7 @@ def process_and_ingest_data(self, file_paths: List[str]):
         for doc in all_documents:
             if 'embedding' in doc and doc['embedding'] is not None:
                 action = {
+                    "_op_type": "index",
                     "_index": self.index_name,
                     "_source": {
                         "nominee_text": doc['text'],
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
new file mode 100644
index 00000000..4be08779
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
@@ -0,0 +1,151 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth, exceptions as opensearch_exceptions
+import boto3
+from urllib.parse import urlparse
+from opensearchpy import helpers as opensearch_helpers
+
+class OpenSearchConnector:
+    def __init__(self, config):
+        self.config = config
+        self.opensearch_client = None
+        self.aws_region = config.get('region')
+        self.index_name = config.get('index_name')
+        self.is_serverless = config.get('is_serverless', 'False') == 'True'
+        self.opensearch_endpoint = config.get('opensearch_endpoint')
+        self.opensearch_username = config.get('opensearch_username')
+        self.opensearch_password = config.get('opensearch_password')
+
+    def initialize_opensearch_client(self):
+        if not self.opensearch_endpoint:
+            print("OpenSearch endpoint not set. Please run setup first.")
+            return False
+        
+        parsed_url = urlparse(self.opensearch_endpoint)
+        host = parsed_url.hostname
+        port = parsed_url.port or 443
+
+        if self.is_serverless:
+            credentials = boto3.Session().get_credentials()
+            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
+        else:
+            if not self.opensearch_username or not self.opensearch_password:
+                print("OpenSearch username or password not set. Please run setup first.")
+                return False
+            auth = (self.opensearch_username, self.opensearch_password)
+
+        try:
+            self.opensearch_client = OpenSearch(
+                hosts=[{'host': host, 'port': port}],
+                http_auth=auth,
+                use_ssl=True,
+                verify_certs=True,
+                connection_class=RequestsHttpConnection,
+                pool_maxsize=20
+            )
+            print(f"Initialized OpenSearch client with host: {host} and port: {port}")
+            return True
+        except Exception as ex:
+            print(f"Error initializing OpenSearch client: {ex}")
+            return False
+
+    def create_index(self, embedding_dimension, space_type):
+        index_body = {
+            "mappings": {
+                "properties": {
+                    "nominee_text": {"type": "text"},
+                    "nominee_vector": {
+                        "type": "knn_vector",
+                        "dimension": embedding_dimension,
+                        "method": {
+                            "name": "hnsw",
+                            "space_type": space_type,
+                            "engine": "nmslib",
+                            "parameters": {"ef_construction": 512, "m": 16},
+                        },
+                    },
+                }
+            },
+            "settings": {
+                "index": {
+                    "number_of_shards": 2,
+                    "knn.algo_param": {"ef_search": 512},
+                    "knn": True,
+                }
+            },
+        }
+        try:
+            self.opensearch_client.indices.create(index=self.index_name, body=index_body)
+            print(f"KNN index '{self.index_name}' created successfully with dimension {embedding_dimension} and space type {space_type}.")
+        except opensearch_exceptions.RequestError as e:
+            if 'resource_already_exists_exception' in str(e).lower():
+                print(f"Index '{self.index_name}' already exists.")
+            else:
+                print(f"Error creating index '{self.index_name}': {e}")
+
+    def verify_and_create_index(self, embedding_dimension, space_type):
+        try:
+            index_exists = self.opensearch_client.indices.exists(index=self.index_name)
+            if index_exists:
+                print(f"KNN index '{self.index_name}' already exists.")
+            else:
+                self.create_index(embedding_dimension, space_type)
+            return True
+        except Exception as ex:
+            print(f"Error verifying or creating index: {ex}")
+            return False
+
+    def bulk_index(self, actions):
+        try:
+            success_count, error_info = opensearch_helpers.bulk(self.opensearch_client, actions)
+            error_count = len(error_info)
+            print(f"Indexed {success_count} documents successfully. Failed to index {error_count} documents.")
+            return success_count, error_count
+        except Exception as e:
+            print(f"Error during bulk indexing: {e}")
+            return 0, len(actions)
+
+    def search(self, vector, k=5):
+        try:
+            response = self.opensearch_client.search(
+                index=self.index_name,
+                body={
+                    "size": k,
+                    "_source": ["nominee_text"],
+                    "query": {
+                        "knn": {
+                            "nominee_vector": {
+                                "vector": vector,
+                                "k": k
+                            }
+                        }
+                    }
+                }
+            )
+            return response['hits']['hits']
+        except Exception as e:
+            print(f"Error during search: {e}")
+            return []
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
index d4305c90..9e64a9a1 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
@@ -1,4 +1,27 @@
-# query_class.py
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
 
 import json
 import tiktoken
@@ -8,12 +31,12 @@
 import botocore
 import time
 import random
-from opensearch_class import OpenSearchClass
+from opensearch_connector import OpenSearchConnector
 
 init(autoreset=True)  # Initialize colorama
 
-class QueryClass:
-    EMBEDDING_MODEL_ID = 'amazon.titan-embed-text-v1'
+class Query:
+    EMBEDDING_MODEL_ID = 'amazon.titan-embed-text-v2:0'
     LLM_MODEL_ID = 'amazon.titan-text-express-v1'
 
     def __init__(self, config):
@@ -21,7 +44,7 @@ def __init__(self, config):
         self.aws_region = config.get('region')
         self.index_name = config.get('index_name')
         self.bedrock_client = None
-        self.opensearch = OpenSearchClass(config)
+        self.opensearch = OpenSearchConnector(config)
 
     def initialize_clients(self):
         try:
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
index 80f57875..3fdf8c90 100755
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
@@ -1,3 +1,28 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
 #!/usr/bin/env python3
 
 """
@@ -6,9 +31,9 @@
 
 import argparse
 import configparser
-from rag_setup import SetupClass
-from ingest import IngestClass
-from query import QueryClass
+from rag_setup import Setup
+from ingest import Ingest
+from query import Query
 
 CONFIG_FILE = 'config.ini'
 
@@ -35,7 +60,7 @@ def main():
     config = load_config()
 
     if args.command == 'setup':
-        setup = SetupClass()
+        setup = Setup()
         setup.setup_command()
         save_config(setup.config)
     elif args.command == 'ingest':
@@ -48,7 +73,7 @@ def main():
                 paths.append(path)
         else:
             paths = args.paths
-        ingest = IngestClass(config)
+        ingest = Ingest(config)
         ingest.ingest_command(paths)
     elif args.command == 'query':
         if not args.queries:
@@ -60,7 +85,7 @@ def main():
                 queries.append(query)
         else:
             queries = args.queries
-        query = QueryClass(config)
+        query = Query(config)
         query.query_command(queries, num_results=args.num_results)
     else:
         parser.print_help()
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index 47c03b9e..3795e7b8 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -1,4 +1,28 @@
-# setup_class.py
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
 import boto3
 import botocore
 from botocore.config import Config
@@ -13,7 +37,7 @@
 from urllib.parse import urlparse
 from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth
 
-class SetupClass:
+class Setup:
     CONFIG_FILE = 'config.ini'
     SERVICE_AOSS = 'opensearchserverless'
     SERVICE_BEDROCK = 'bedrock-runtime'
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py
index b73dbcf5..7f625056 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py
@@ -1,5 +1,29 @@
-from setuptools import setup, find_packages, find_namespace_packages
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
 
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+from setuptools import setup, find_packages, find_namespace_packages
 
 
 

From cba567c7b310f6fc0106621c7d394cd7b241ab1f Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Sun, 17 Nov 2024 18:27:09 -0800
Subject: [PATCH 03/42] Added comments to understand code

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/config.ini    | 11 ++++++
 .../ml_commons/rag_pipeline/rag/ingest.py     | 25 ++++++++++++-
 .../rag_pipeline/rag/opensearch_connector.py  | 12 +++++++
 .../ml_commons/rag_pipeline/rag/query.py      | 15 ++++++++
 .../ml_commons/rag_pipeline/rag/rag.py        | 12 ++++++-
 .../ml_commons/rag_pipeline/rag/rag_setup.py  | 35 ++++++++++++++-----
 .../ml_commons/rag_pipeline/rag/setup.py      | 16 ++++++---
 7 files changed, 112 insertions(+), 14 deletions(-)
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/config.ini

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/config.ini b/opensearch_py_ml/ml_commons/rag_pipeline/rag/config.ini
new file mode 100644
index 00000000..0f79486a
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/config.ini
@@ -0,0 +1,11 @@
+[DEFAULT]
+region = us-west-2
+iam_principal = arn:aws:iam::615299771255:user/hmumtazz
+index_name = drpepper
+collection_name = 
+is_serverless = False
+opensearch_endpoint = https://search-hashim-test5-eivrlyacr3n653fnkkrg2yab7u.aos.us-west-2.on.aws
+opensearch_username = admin
+opensearch_password = MyPassword123!
+embedding_dimension = 768
+space_type = l2
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
index e3c32a98..6942e4ee 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -46,6 +46,7 @@ class Ingest:
     EMBEDDING_MODEL_ID = 'amazon.titan-embed-text-v2:0'
 
     def __init__(self, config):
+        # Initialize the Ingest class with configuration
         self.config = config
         self.aws_region = config.get('region')
         self.index_name = config.get('index_name')
@@ -53,6 +54,8 @@ def __init__(self, config):
         self.opensearch = OpenSearchConnector(config)
 
     def initialize_clients(self):
+        # Initialize AWS Bedrock and OpenSearch clients
+        # Returns True if successful, False otherwise
         try:
             self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
             if self.opensearch.initialize_opensearch_client():
@@ -66,6 +69,9 @@ def initialize_clients(self):
             return False
 
     def process_file(self, file_path: str) -> List[Dict[str, str]]:
+        # Process a file based on its extension
+        # Supports CSV, TXT, and PDF files
+        # Returns a list of dictionaries containing extracted text
         _, file_extension = os.path.splitext(file_path)
         
         if file_extension.lower() == '.csv':
@@ -79,6 +85,9 @@ def process_file(self, file_path: str) -> List[Dict[str, str]]:
             return []
 
     def process_csv(self, file_path: str) -> List[Dict[str, str]]:
+        # Process a CSV file
+        # Extracts information and formats it into a sentence
+        # Returns a list of dictionaries with the formatted text
         documents = []
         with open(file_path, 'r') as csvfile:
             reader = csv.DictReader(csvfile)
@@ -90,11 +99,17 @@ def process_csv(self, file_path: str) -> List[Dict[str, str]]:
         return documents
 
     def process_txt(self, file_path: str) -> List[Dict[str, str]]:
+        # Process a TXT file
+        # Reads the entire content of the file
+        # Returns a list with a single dictionary containing the file content
         with open(file_path, 'r') as txtfile:
             content = txtfile.read()
         return [{"text": content}]
 
     def process_pdf(self, file_path: str) -> List[Dict[str, str]]:
+        # Process a PDF file
+        # Extracts text from each page of the PDF
+        # Returns a list of dictionaries, each containing text from a page
         documents = []
         with open(file_path, 'rb') as pdffile:
             pdf_reader = PyPDF2.PdfReader(pdffile)
@@ -105,6 +120,9 @@ def process_pdf(self, file_path: str) -> List[Dict[str, str]]:
         return documents
 
     def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
+        # Generate text embedding using AWS Bedrock
+        # Implements exponential backoff for retries in case of failures
+        # Returns the embedding if successful, None otherwise
         if self.bedrock_client is None:
             print("Bedrock client is not initialized. Please run setup first.")
             return None
@@ -139,6 +157,9 @@ def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2)
         return None
 
     def process_and_ingest_data(self, file_paths: List[str]):
+        # Process and ingest data from multiple files
+        # Generates embeddings for each document and ingests into OpenSearch
+        # Displays progress and results of the ingestion process
         if not self.initialize_clients():
             print("Failed to initialize clients. Aborting ingestion.")
             return
@@ -197,6 +218,8 @@ def process_and_ingest_data(self, file_paths: List[str]):
         print(f"{Fore.RED}Failed to ingest {failed} documents.{Style.RESET_ALL}")
 
     def ingest_command(self, paths: List[str]):
+        # Main ingestion command
+        # Processes all valid files in the given paths and initiates ingestion
         all_files = []
         for path in paths:
             if os.path.isfile(path):
@@ -215,4 +238,4 @@ def ingest_command(self, paths: List[str]):
         
         print(f"{Fore.GREEN}Found {len(valid_files)} valid files for ingestion.{Style.RESET_ALL}")
         
-        self.process_and_ingest_data(valid_files)
+        self.process_and_ingest_data(valid_files)
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
index 4be08779..73b23a7b 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
@@ -30,6 +30,7 @@
 
 class OpenSearchConnector:
     def __init__(self, config):
+        # Initialize the OpenSearchConnector with configuration
         self.config = config
         self.opensearch_client = None
         self.aws_region = config.get('region')
@@ -40,6 +41,9 @@ def __init__(self, config):
         self.opensearch_password = config.get('opensearch_password')
 
     def initialize_opensearch_client(self):
+        # Initialize the OpenSearch client
+        # Handles both serverless and non-serverless configurations
+        # Returns True if successful, False otherwise
         if not self.opensearch_endpoint:
             print("OpenSearch endpoint not set. Please run setup first.")
             return False
@@ -73,6 +77,8 @@ def initialize_opensearch_client(self):
             return False
 
     def create_index(self, embedding_dimension, space_type):
+        # Create a new KNN index in OpenSearch
+        # Sets up the mapping for nominee_text and nominee_vector fields
         index_body = {
             "mappings": {
                 "properties": {
@@ -107,6 +113,8 @@ def create_index(self, embedding_dimension, space_type):
                 print(f"Error creating index '{self.index_name}': {e}")
 
     def verify_and_create_index(self, embedding_dimension, space_type):
+        # Check if the index exists, create it if it doesn't
+        # Returns True if the index exists or was successfully created, False otherwise
         try:
             index_exists = self.opensearch_client.indices.exists(index=self.index_name)
             if index_exists:
@@ -119,6 +127,8 @@ def verify_and_create_index(self, embedding_dimension, space_type):
             return False
 
     def bulk_index(self, actions):
+        # Perform bulk indexing of documents
+        # Returns the number of successfully indexed documents and the number of failures
         try:
             success_count, error_info = opensearch_helpers.bulk(self.opensearch_client, actions)
             error_count = len(error_info)
@@ -129,6 +139,8 @@ def bulk_index(self, actions):
             return 0, len(actions)
 
     def search(self, vector, k=5):
+        # Perform a KNN search using the provided vector
+        # Returns the top k matching documents
         try:
             response = self.opensearch_client.search(
                 index=self.index_name,
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
index 9e64a9a1..6fb0a5d5 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
@@ -40,6 +40,7 @@ class Query:
     LLM_MODEL_ID = 'amazon.titan-text-express-v1'
 
     def __init__(self, config):
+        # Initialize the Query class with configuration
         self.config = config
         self.aws_region = config.get('region')
         self.index_name = config.get('index_name')
@@ -47,6 +48,8 @@ def __init__(self, config):
         self.opensearch = OpenSearchConnector(config)
 
     def initialize_clients(self):
+        # Initialize AWS Bedrock and OpenSearch clients
+        # Returns True if successful, False otherwise
         try:
             self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
             if self.opensearch.initialize_opensearch_client():
@@ -60,6 +63,9 @@ def initialize_clients(self):
             return False
 
     def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
+        # Generate text embedding using AWS Bedrock
+        # Implements exponential backoff for retries in case of failures
+        # Returns the embedding if successful, None otherwise
         if self.bedrock_client is None:
             print("Bedrock client is not initialized. Please run setup first.")
             return None
@@ -94,6 +100,9 @@ def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2)
         return None
 
     def bulk_query(self, queries, k=5):
+        # Perform bulk semantic search for multiple queries
+        # Generates embeddings for queries and searches OpenSearch index
+        # Returns a list of results containing query, context, and number of results
         print("Generating embeddings for queries...")
         query_vectors = []
         for query in queries:
@@ -133,6 +142,9 @@ def bulk_query(self, queries, k=5):
         return results
 
     def generate_answer(self, prompt, config):
+        # Generate an answer using the LLM model
+        # Handles token limit and configures LLM parameters
+        # Returns the generated answer or None if an error occurs
         try:
             max_input_tokens = 8192  # Max tokens for the model
             expected_output_tokens = config.get('maxTokenCount', 1000)
@@ -172,6 +184,9 @@ def generate_answer(self, prompt, config):
             return None
 
     def query_command(self, queries: List[str], num_results=5):
+        # Main query command to process multiple queries
+        # Performs semantic search and generates answers using LLM
+        # Prints results for each query
         if not self.initialize_clients():
             print("Failed to initialize clients. Aborting query.")
             return
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
index 3fdf8c90..30043cf9 100755
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
@@ -38,17 +38,20 @@
 CONFIG_FILE = 'config.ini'
 
 def load_config():
+    # Load configuration from the config file
     config = configparser.ConfigParser()
     config.read(CONFIG_FILE)
     return config['DEFAULT']
 
 def save_config(config):
+    # Save configuration to the config file
     parser = configparser.ConfigParser()
     parser['DEFAULT'] = config
     with open(CONFIG_FILE, 'w') as f:
         parser.write(f)
     
 def main():
+    # Set up argument parser for CLI
     parser = argparse.ArgumentParser(description="RAG Pipeline CLI")
     parser.add_argument('command', choices=['setup', 'ingest', 'query'], help='Command to run')
     parser.add_argument('--paths', nargs='+', help='Paths to files or directories for ingestion')
@@ -57,14 +60,18 @@ def main():
 
     args = parser.parse_args()
 
+    # Load existing configuration
     config = load_config()
 
     if args.command == 'setup':
+        # Run setup process
         setup = Setup()
         setup.setup_command()
         save_config(setup.config)
     elif args.command == 'ingest':
+        # Handle ingestion command
         if not args.paths:
+            # If no paths provided as arguments, prompt user for input
             paths = []
             while True:
                 path = input("Enter a file or directory path (or press Enter to finish): ")
@@ -76,7 +83,9 @@ def main():
         ingest = Ingest(config)
         ingest.ingest_command(paths)
     elif args.command == 'query':
+        # Handle query command
         if not args.queries:
+            # If no queries provided as arguments, prompt user for input
             queries = []
             while True:
                 query = input("Enter a query (or press Enter to finish): ")
@@ -88,7 +97,8 @@ def main():
         query = Query(config)
         query.query_command(queries, num_results=args.num_results)
     else:
+        # If an invalid command is provided, print help
         parser.print_help()
 
 if __name__ == "__main__":
-    main()
\ No newline at end of file
+    main()
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index 3795e7b8..14a334b8 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -37,12 +37,15 @@
 from urllib.parse import urlparse
 from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth
 
+# [Existing license and import statements remain unchanged]
+
 class Setup:
     CONFIG_FILE = 'config.ini'
     SERVICE_AOSS = 'opensearchserverless'
     SERVICE_BEDROCK = 'bedrock-runtime'
 
     def __init__(self):
+        # Initialize setup variables
         self.aws_region = None
         self.iam_principal = None
         self.index_name = None
@@ -56,6 +59,7 @@ def __init__(self):
         self.opensearch_client = None
 
     def check_and_configure_aws(self):
+        # Check if AWS credentials are configured and offer to reconfigure if needed
         try:
             session = boto3.Session()
             credentials = session.get_credentials()
@@ -73,6 +77,7 @@ def check_and_configure_aws(self):
             self.configure_aws()
 
     def configure_aws(self):
+        # Configure AWS credentials using user input
         print("Let's configure your AWS credentials.")
 
         aws_access_key_id = input("Enter your AWS Access Key ID: ")
@@ -102,20 +107,22 @@ def configure_aws(self):
             print(f"An unexpected error occurred: {e}")
 
     def load_config(self):
+        # Load configuration from the config file
         config = configparser.ConfigParser()
         if os.path.exists(self.CONFIG_FILE):
             config.read(self.CONFIG_FILE)
             return dict(config['DEFAULT'])
         return {}
 
-
     def save_config(self, config):
+        # Save configuration to the config file
         parser = configparser.ConfigParser()
         parser['DEFAULT'] = config
         with open(self.CONFIG_FILE, 'w') as f:
             parser.write(f)
 
-    def get_password_with_asterisks(self, prompt="Enter password: "):  # Accept 'prompt'
+    def get_password_with_asterisks(self, prompt="Enter password: "):
+        # Get password input from user, masking it with asterisks
         import sys
         if sys.platform == 'win32':
             import msvcrt
@@ -162,6 +169,7 @@ def get_password_with_asterisks(self, prompt="Enter password: "):  # Accept 'pro
                 termios.tcsetattr(fd, termios.TCSADRAIN, old_settings)
 
     def setup_configuration(self):
+        # Set up the configuration by prompting the user for various settings
         config = self.load_config()
 
         self.aws_region = input(f"Enter your AWS Region [{config.get('region', 'us-west-2')}]: ") or config.get('region', 'us-west-2')
@@ -197,6 +205,7 @@ def setup_configuration(self):
         print("Configuration saved successfully.")
 
     def initialize_clients(self):
+        # Initialize AWS clients (AOSS and Bedrock)
         try:
             boto_config = Config(
                 region_name=self.aws_region,
@@ -215,6 +224,7 @@ def initialize_clients(self):
             return False
 
     def create_security_policies(self):
+        # Create security policies for serverless OpenSearch
         if not self.is_serverless:
             print("Security policies are not applicable for managed OpenSearch domains.")
             return
@@ -244,6 +254,7 @@ def create_security_policies(self):
         self.create_access_policy(self.get_truncated_name(f"{self.collection_name}-access-policy"), f"{self.collection_name} data access policy", data_access_policy)
 
     def create_security_policy(self, policy_type, name, description, policy_body):
+        # Create a specific security policy (encryption or network)
         try:
             if policy_type.lower() == "encryption":
                 self.aoss_client.create_security_policy(description=description, name=name, policy=policy_body, type="encryption")
@@ -258,6 +269,7 @@ def create_security_policy(self, policy_type, name, description, policy_body):
             print(f"Error creating {policy_type} policy '{name}': {ex}")
 
     def create_access_policy(self, name, description, policy_body):
+        # Create a data access policy
         try:
             self.aoss_client.create_access_policy(description=description, name=name, policy=policy_body, type="data")
             print(f"Data Access Policy '{name}' created successfully.")
@@ -267,6 +279,7 @@ def create_access_policy(self, name, description, policy_body):
             print(f"Error creating data access policy '{name}': {ex}")
 
     def create_collection(self, collection_name, max_retries=3):
+        # Create an OpenSearch serverless collection
         for attempt in range(max_retries):
             try:
                 response = self.aoss_client.create_collection(
@@ -287,6 +300,7 @@ def create_collection(self, collection_name, max_retries=3):
         return None
 
     def get_collection_id(self, collection_name):
+        # Retrieve the ID of an existing collection
         try:
             response = self.aoss_client.list_collections()
             for collection in response['collectionSummaries']:
@@ -297,6 +311,7 @@ def get_collection_id(self, collection_name):
         return None
 
     def wait_for_collection_active(self, collection_id, max_wait_minutes=30):
+        # Wait for the collection to become active
         print(f"Waiting for collection '{self.collection_name}' to become active...")
         start_time = time.time()
         while time.time() - start_time < max_wait_minutes * 60:
@@ -319,6 +334,7 @@ def wait_for_collection_active(self, collection_id, max_wait_minutes=30):
         return False
 
     def get_collection_endpoint(self):
+        # Retrieve the endpoint URL for the OpenSearch collection
         if not self.is_serverless:
             return self.opensearch_endpoint
         
@@ -347,6 +363,7 @@ def get_collection_endpoint(self):
             return None
 
     def initialize_opensearch_client(self):
+        # Initialize the OpenSearch client
         if not self.opensearch_endpoint:
             print("OpenSearch endpoint not set. Please run setup first.")
             return False
@@ -366,7 +383,7 @@ def initialize_opensearch_client(self):
 
         try:
             self.opensearch_client = OpenSearch(
-                hosts=[{'host': host, 'port': port}],
+                hosts=[{'host': host, 'portort': port}],
                 http_auth=auth,
                 use_ssl=True,
                 verify_certs=True,
@@ -380,7 +397,7 @@ def initialize_opensearch_client(self):
             return False
 
     def get_knn_index_details(self):
-        # Simplified dimension input
+        # Prompt user for KNN index details (embedding dimension and space type)
         dimension_input = input("Press Enter to use the default embedding size (768), or type a custom size: ")
         
         if dimension_input.strip() == "":
@@ -394,7 +411,6 @@ def get_knn_index_details(self):
 
         print(f"\nEmbedding dimension set to: {embedding_dimension}")
 
-        # Space type selection
         print("\nChoose the space type for KNN:")
         print("1. L2 (Euclidean distance)")
         print("2. Cosine similarity")
@@ -415,8 +431,8 @@ def get_knn_index_details(self):
 
         return embedding_dimension, space_type
 
-
     def create_index(self, embedding_dimension, space_type):
+        # Create the KNN index in OpenSearch
         index_body = {
             "mappings": {
                 "properties": {
@@ -451,6 +467,7 @@ def create_index(self, embedding_dimension, space_type):
                 print(f"Error creating index '{self.index_name}': {e}")
 
     def verify_and_create_index(self, embedding_dimension, space_type):
+        # Verify if the index exists, create it if it doesn't
         try:
             index_exists = self.opensearch_client.indices.exists(index=self.index_name)
             if index_exists:
@@ -463,11 +480,13 @@ def verify_and_create_index(self, embedding_dimension, space_type):
             return False
 
     def get_truncated_name(self, base_name, max_length=32):
+        # Truncate a name to fit within a specified length
         if len(base_name) <= max_length:
             return base_name
         return base_name[:max_length-3] + "..."
 
     def setup_command(self):
+        # Main setup command that orchestrates the entire setup process
         self.check_and_configure_aws()
         self.setup_configuration()
         
@@ -502,9 +521,9 @@ def setup_command(self):
             embedding_dimension, space_type = self.get_knn_index_details()
             if self.verify_and_create_index(embedding_dimension, space_type):
                 print("Setup completed successfully.")
-                self.config['embedding_dimension'] = str(embedding_dimension)
+                self.config['embedding_dimension'] = s= str(embedding_dimension)
                 self.config['space_type'] = space_type
             else:
                 print("Index verification failed. Please check your index name and permissions.")
         else:
-            print("Failed to initialize OpenSearch client. Setup incomplete.")
\ No newline at end of file
+            print("Failed to initialize OpenSearch client. Setup incomplete.")
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py
index 7f625056..1c806760 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py
@@ -25,15 +25,23 @@
 
 from setuptools import setup, find_packages, find_namespace_packages
 
-
-
 setup(
+    # Name of the package
     name="rag_pipeline",
+    
+    # Version of the package
     version="0.1.0",
+    
+    # Automatically find and include all packages in the project
+    # This specifically looks for packages within 'opensearch_py_ml' and its subpackages
     packages=find_namespace_packages(include=['opensearch_py_ml', 'opensearch_py_ml.*']),
+    
+    # Define console script entry points
+    # This creates a command-line executable named 'rag' that runs the main() function
+    # from the opensearch_py_ml.ml_commons.rag_pipeline.rag module
     entry_points={
         'console_scripts': [
-        'rag=opensearch_py_ml.ml_commons.rag_pipeline.rag:main',
+            'rag=opensearch_py_ml.ml_commons.rag_pipeline.rag:main',
         ],
     },
-)
\ No newline at end of file
+)

From 3481c3e0826bf0f2d0ad727dc777ab9e7f4b089d Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Sun, 17 Nov 2024 18:31:00 -0800
Subject: [PATCH 04/42] Remove sensitive config file

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/config.ini            | 11 -----------
 1 file changed, 11 deletions(-)
 delete mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/config.ini

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/config.ini b/opensearch_py_ml/ml_commons/rag_pipeline/rag/config.ini
deleted file mode 100644
index 0f79486a..00000000
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/config.ini
+++ /dev/null
@@ -1,11 +0,0 @@
-[DEFAULT]
-region = us-west-2
-iam_principal = arn:aws:iam::615299771255:user/hmumtazz
-index_name = drpepper
-collection_name = 
-is_serverless = False
-opensearch_endpoint = https://search-hashim-test5-eivrlyacr3n653fnkkrg2yab7u.aos.us-west-2.on.aws
-opensearch_username = admin
-opensearch_password = MyPassword123!
-embedding_dimension = 768
-space_type = l2

From e6eee3028b2c73fbeffa0c84deff18aecea5a87e Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Sun, 17 Nov 2024 21:41:04 -0800
Subject: [PATCH 05/42] Simplify the selection process for the ef_construction
 parameter by offering a suggested default value with the flexibility for
 users to enter a custom value if needed.

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/rag.py        |  4 +-
 .../ml_commons/rag_pipeline/rag/rag_setup.py  | 50 +++++++++++++------
 2 files changed, 39 insertions(+), 15 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
index 30043cf9..b9b09ef1 100755
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
@@ -1,3 +1,5 @@
+#!/usr/bin/env python3
+
 # SPDX-License-Identifier: Apache-2.0
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
@@ -23,7 +25,7 @@
 #  specific language governing permissions and limitations
 #  under the License.
 
-#!/usr/bin/env python3
+
 
 """
 Main CLI script for OpenSearch with Bedrock Integration
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index 14a334b8..d75d8eb7 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -370,7 +370,7 @@ def initialize_opensearch_client(self):
         
         parsed_url = urlparse(self.opensearch_endpoint)
         host = parsed_url.hostname
-        port = parsed_url.port or 443
+        port = 443
 
         if self.is_serverless:
             credentials = boto3.Session().get_credentials()
@@ -383,7 +383,7 @@ def initialize_opensearch_client(self):
 
         try:
             self.opensearch_client = OpenSearch(
-                hosts=[{'host': host, 'portort': port}],
+                hosts=[{'host': host, 'port': port}],
                 http_auth=auth,
                 use_ssl=True,
                 verify_certs=True,
@@ -397,7 +397,7 @@ def initialize_opensearch_client(self):
             return False
 
     def get_knn_index_details(self):
-        # Prompt user for KNN index details (embedding dimension and space type)
+        # Prompt user for KNN index details (embedding dimension, space type, and ef_construction)
         dimension_input = input("Press Enter to use the default embedding size (768), or type a custom size: ")
         
         if dimension_input.strip() == "":
@@ -429,9 +429,24 @@ def get_knn_index_details(self):
 
         print(f"Space type set to: {space_type}")
 
-        return embedding_dimension, space_type
+        # New prompt for ef_construction
+        ef_construction_input = input("\nPress Enter to use the default ef_construction value (512), or type a custom value: ")
+        
+        if ef_construction_input.strip() == "":
+            ef_construction = 512
+        else:
+            try:
+                ef_construction = int(ef_construction_input)
+            except ValueError:
+                print("Invalid input. Using default ef_construction of 512.")
+                ef_construction = 512
+
+        print(f"ef_construction set to: {ef_construction}")
 
-    def create_index(self, embedding_dimension, space_type):
+        return embedding_dimension, space_type, ef_construction
+
+
+    def create_index(self, embedding_dimension, space_type, ef_construction):
         # Create the KNN index in OpenSearch
         index_body = {
             "mappings": {
@@ -444,7 +459,7 @@ def create_index(self, embedding_dimension, space_type):
                             "name": "hnsw",
                             "space_type": space_type,
                             "engine": "nmslib",
-                            "parameters": {"ef_construction": 512, "m": 16},
+                            "parameters": {"ef_construction": ef_construction, "m": 16},
                         },
                     },
                 }
@@ -459,26 +474,31 @@ def create_index(self, embedding_dimension, space_type):
         }
         try:
             self.opensearch_client.indices.create(index=self.index_name, body=index_body)
-            print(f"KNN index '{self.index_name}' created successfully with dimension {embedding_dimension} and space type {space_type}.")
+            print(f"KNN index '{self.index_name}' created successfully with dimension {embedding_dimension}, space type {space_type}, and ef_construction {ef_construction}.")
         except Exception as e:
             if 'resource_already_exists_exception' in str(e).lower():
                 print(f"Index '{self.index_name}' already exists.")
             else:
                 print(f"Error creating index '{self.index_name}': {e}")
 
-    def verify_and_create_index(self, embedding_dimension, space_type):
-        # Verify if the index exists, create it if it doesn't
+
+
+    def verify_and_create_index(self, embedding_dimension, space_type, ef_construction):
         try:
+            print(f"Attempting to verify index '{self.index_name}'...")
             index_exists = self.opensearch_client.indices.exists(index=self.index_name)
             if index_exists:
                 print(f"KNN index '{self.index_name}' already exists.")
             else:
-                self.create_index(embedding_dimension, space_type)
+                print(f"Index '{self.index_name}' does not exist. Attempting to create...")
+                self.create_index(embedding_dimension, space_type, ef_construction)
             return True
         except Exception as ex:
             print(f"Error verifying or creating index: {ex}")
+            print(f"OpenSearch client config: {self.opensearch_client.transport.hosts}")
             return False
 
+
     def get_truncated_name(self, base_name, max_length=32):
         # Truncate a name to fit within a specified length
         if len(base_name) <= max_length:
@@ -518,12 +538,14 @@ def setup_command(self):
                 return
         
         if self.initialize_opensearch_client():
-            embedding_dimension, space_type = self.get_knn_index_details()
-            if self.verify_and_create_index(embedding_dimension, space_type):
+            print("OpenSearch client initialized successfully. Proceeding with index creation...")
+            embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
+            if self.verify_and_create_index(embedding_dimension, space_type, ef_construction):
                 print("Setup completed successfully.")
-                self.config['embedding_dimension'] = s= str(embedding_dimension)
+                self.config['embedding_dimension'] = str(embedding_dimension)
                 self.config['space_type'] = space_type
+                self.config['ef_construction'] = str(ef_construction)
             else:
                 print("Index verification failed. Please check your index name and permissions.")
         else:
-            print("Failed to initialize OpenSearch client. Setup incomplete.")
+            print("Failed to initialize OpenSearch client. Setup incomplete.")
\ No newline at end of file

From 8b7aa0ea27a46d1f13aa2adc2a328c716b292257 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Wed, 20 Nov 2024 20:05:01 -0800
Subject: [PATCH 06/42] Allows Customer to register model via CLI, fixed
 embedding generation, addressed comments, fixed upload csv method

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/.gitignore    |  71 +-
 .../rag_pipeline/rag/AIConnectorHelper.py     | 698 ++++++++++++++++++
 .../ml_commons/rag_pipeline/rag/ingest.py     | 103 +--
 .../rag_pipeline/rag/opensearch_class.py      | 127 ----
 .../ml_commons/rag_pipeline/rag/query.py      |  68 +-
 .../ml_commons/rag_pipeline/rag/rag.py        |  10 +-
 .../ml_commons/rag_pipeline/rag/rag_setup.py  | 427 ++++++++++-
 7 files changed, 1282 insertions(+), 222 deletions(-)
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
 delete mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_class.py

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore b/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
index f5d53cbc..f6c330e7 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
@@ -2,10 +2,71 @@
 ml_commons/rag_pipeline/data/
 ml_commons/rag_pipeline/ingestion/
 ml_commons/rag_pipeline/rag/config.ini
-# Ignore virtual environment
-.venv/
+# Compiled python modules.
+*.pyc
+__pycache__/
 
+# Setuptools distribution folder.
+dist/
 
-# Ignore Python cache files
-__pycache__/
-*.pyc
+# Build folder
+build/
+
+# docs build folder
+docs/build/
+
+# pytest results
+tests/dataframe/results/*csv
+result_images/
+
+
+# Python egg metadata, regenerated from source files by setuptools.
+/*.egg-info
+opensearch_py_ml.egg-info/
+
+# PyCharm files
+.idea/
+
+# vscode files
+.vscode/
+
+# pytest files
+.pytest_cache/
+
+# Ignore MacOSX files
+.DS_Store
+
+# Jupyter Notebook
+.ipynb_checkpoints
+
+# IPython
+profile_default/
+ipython_config.py
+
+# pyenv
+.python-version
+
+# Environments
+.env
+.venv
+.nox
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+.mypy_cache
+
+# Coverage
+.coverage
+.coverage.*
+*-junit.xml
+*-codecov.xml
+
+#model file
+all-MiniLM-L6-v2_torchscript_sentence-transformer.zip
+# torch generated files
+tests/test_SentenceTransformerModel
+tests/ml_commons/test_model_files
+tests/ml_models/tests
+docs/source/examples/synthetic_queries
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
new file mode 100644
index 00000000..efe62896
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
@@ -0,0 +1,698 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+
+import boto3
+from botocore.exceptions import BotoCoreError
+import json
+import requests
+from requests.auth import HTTPBasicAuth
+from requests_aws4auth import AWS4Auth
+import time
+from opensearchpy import OpenSearch, RequestsHttpConnection
+
+# This Python code is compatible with AWS OpenSearch versions 2.9 and higher.
+class AIConnectorHelper:
+    def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
+                 opensearch_domain_password, aws_user_name, aws_role_name):
+        """
+        Initialize the AIConnectorHelper with necessary AWS and OpenSearch configurations.
+        """
+        self.region = region
+        self.opensearch_domain_name = opensearch_domain_name
+        self.opensearch_domain_username = opensearch_domain_username
+        self.opensearch_domain_password = opensearch_domain_password
+        self.aws_user_name = aws_user_name
+        self.aws_role_name = aws_role_name
+
+        # Retrieve the OpenSearch domain endpoint and ARN
+        domain_endpoint, domain_arn = self.get_opensearch_domain_info(self.region, self.opensearch_domain_name)
+        if domain_arn:
+            self.opensearch_domain_arn = domain_arn
+        else:
+            print("Warning: Could not retrieve OpenSearch domain ARN.")
+            self.opensearch_domain_arn = None
+
+        if domain_endpoint:
+            # Construct the full domain URL
+            self.opensearch_domain_url = f'https://{domain_endpoint}'
+        else:
+            print("Warning: Could not retrieve OpenSearch domain endpoint.")
+            self.opensearch_domain_url = None
+
+        # Initialize the OpenSearch client
+        self.opensearch_client = OpenSearch(
+            hosts=[{'host': domain_endpoint, 'port': 443}],
+            http_auth=(self.opensearch_domain_username, self.opensearch_domain_password),
+            use_ssl=True,
+            verify_certs=True,
+            connection_class=RequestsHttpConnection
+        )
+    @staticmethod
+    def get_opensearch_domain_info(region, domain_name):
+        """
+        Retrieve the OpenSearch domain endpoint and ARN based on the domain name and region.
+        """
+        try:
+            opensearch_client = boto3.client('opensearch', region_name=region)
+            response = opensearch_client.describe_domain(DomainName=domain_name)
+            domain_status = response['DomainStatus']
+            domain_endpoint = domain_status.get('Endpoint')
+            domain_arn = domain_status['ARN']
+            return domain_endpoint, domain_arn
+        except Exception as e:
+            print(f"Error retrieving OpenSearch domain info: {e}")
+            return None, None
+        
+    def get_user_arn(self, username):
+        if not username:
+            return None
+        # Create a boto3 client for IAM
+        iam_client = boto3.client('iam')
+
+        try:
+            # Get information about the IAM user
+            response = iam_client.get_user(UserName=username)
+            user_arn = response['User']['Arn']
+            return user_arn
+        except iam_client.exceptions.NoSuchEntityException:
+            print(f"IAM user '{username}' not found.")
+            return None
+
+    def secret_exists(self, secret_name):
+        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+        try:
+            # Try to get the secret
+            secretsmanager.get_secret_value(SecretId=secret_name)
+            # If no exception was raised by get_secret_value, the secret exists
+            return True
+        except secretsmanager.exceptions.ResourceNotFoundException:
+            # If a ResourceNotFoundException was raised, the secret does not exist
+            return False
+
+    def get_secret_arn(self, secret_name):
+        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+        try:
+            response = secretsmanager.describe_secret(SecretId=secret_name)
+            # Return ARN of the secret 
+            return response['ARN']
+        except secretsmanager.exceptions.ResourceNotFoundException:
+            print(f"The requested secret {secret_name} was not found")
+            return None
+        except Exception as e:
+            print(f"An error occurred: {e}")
+            return None
+        
+    def get_secret(self, secret_name):
+        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+        try:
+            response = secretsmanager.get_secret_value(SecretId=secret_name)
+        except secretsmanager.exceptions.NoSuchEntityException:
+            print("The requested secret was not found")
+            return None
+        except Exception as e:
+            print(f"An error occurred: {e}")
+            return None
+        else:
+            return response.get('SecretString')
+
+    def create_secret(self, secret_name, secret_value):
+        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+
+        try:
+            response = secretsmanager.create_secret(
+                Name=secret_name,
+                SecretString=json.dumps(secret_value),
+            )
+            print(f'Secret {secret_name} created successfully.')
+            return response['ARN']  # Return the ARN of the created secret
+        except BotoCoreError as e:
+            print(f'Error creating secret: {e}')
+            return None
+
+
+    def role_exists(self, role_name):
+        iam_client = boto3.client('iam')
+
+        try:
+            iam_client.get_role(RoleName=role_name)
+            return True
+        except iam_client.exceptions.NoSuchEntityException:
+            return False
+
+    def delete_role(self, role_name):
+        iam_client = boto3.client('iam')
+
+        try:
+            # Detach managed policies
+            policies = iam_client.list_attached_role_policies(RoleName=role_name)['AttachedPolicies']
+            for policy in policies:
+                iam_client.detach_role_policy(RoleName=role_name, PolicyArn=policy['PolicyArn'])
+            print(f'All managed policies detached from role {role_name}.')
+
+            # Delete inline policies
+            inline_policies = iam_client.list_role_policies(RoleName=role_name)['PolicyNames']
+            for policy_name in inline_policies:
+                iam_client.delete_role_policy(RoleName=role_name, PolicyName=policy_name)
+            print(f'All inline policies deleted from role {role_name}.')
+
+            # Now, delete the role
+            iam_client.delete_role(RoleName=role_name)
+            print(f'Role {role_name} deleted.')
+
+        except iam_client.exceptions.NoSuchEntityException:
+            print(f'Role {role_name} does not exist.')
+
+
+    def create_iam_role(self, role_name, trust_policy_json, inline_policy_json):
+        iam_client = boto3.client('iam')
+
+        try:
+            # Create the role with the trust policy
+            create_role_response = iam_client.create_role(
+                RoleName=role_name,
+                AssumeRolePolicyDocument=json.dumps(trust_policy_json),
+                Description='Role with custom trust and inline policies',
+            )
+
+            # Get the ARN of the newly created role
+            role_arn = create_role_response['Role']['Arn']
+
+            # Attach the inline policy to the role
+            iam_client.put_role_policy(
+                RoleName=role_name,
+                PolicyName='InlinePolicy',  # you can replace this with your preferred policy name
+                PolicyDocument=json.dumps(inline_policy_json)
+            )
+
+            print(f'Created role: {role_name}')
+            return role_arn
+
+        except Exception as e:
+            print(f"Error creating the role: {e}")
+            return None
+
+    def get_role_arn(self, role_name):
+        if not role_name:
+            return None
+        iam_client = boto3.client('iam')
+        try:
+            response = iam_client.get_role(RoleName=role_name)
+            # Return ARN of the role
+            return response['Role']['Arn']
+        except iam_client.exceptions.NoSuchEntityException:
+            print(f"The requested role {role_name} does not exist")
+            return None
+        except Exception as e:
+            print(f"An error occurred: {e}")
+            return None
+    
+    
+    def get_role_details(self, role_name):
+        iam = boto3.client('iam')
+
+        try:
+            response = iam.get_role(RoleName=role_name)
+            role = response['Role']
+
+            print(f"Role Name: {role['RoleName']}")
+            print(f"Role ID: {role['RoleId']}")
+            print(f"ARN: {role['Arn']}")
+            print(f"Creation Date: {role['CreateDate']}")
+            print("Assume Role Policy Document:")
+            print(json.dumps(role['AssumeRolePolicyDocument'], indent=4, sort_keys=True))
+
+            list_role_policies_response = iam.list_role_policies(RoleName=role_name)
+
+            for policy_name in list_role_policies_response['PolicyNames']:
+                get_role_policy_response = iam.get_role_policy(RoleName=role_name, PolicyName=policy_name)
+                print(f"Role Policy Name: {get_role_policy_response['PolicyName']}")
+                print("Role Policy Document:")
+                print(json.dumps(get_role_policy_response['PolicyDocument'], indent=4, sort_keys=True))
+
+        except iam.exceptions.NoSuchEntityException:
+            print(f'Role {role_name} does not exist.')
+
+    def map_iam_role_to_backend_role(self, iam_role_arn):
+        os_security_role = 'ml_full_access'  # Changed from 'all_access' to 'ml_full_access'
+        url = f'{self.opensearch_domain_url}/_plugins/_security/api/rolesmapping/{os_security_role}'
+
+        payload = {
+            "backend_roles": [iam_role_arn]
+        }
+        headers = {'Content-Type': 'application/json'}
+
+        response = requests.put(url, auth=(self.opensearch_domain_username, self.opensearch_domain_password),
+                                json=payload, headers=headers, verify=True)
+
+        if response.status_code == 200:
+            print(f"Successfully mapped IAM role to OpenSearch role '{os_security_role}'.")
+        else:
+            print(f"Failed to map IAM role to OpenSearch role '{os_security_role}'. Status code: {response.status_code}")
+            print(f"Response: {response.text}")
+
+    def assume_role(self, create_connector_role_arn, role_session_name="your_session_name"):
+        sts_client = boto3.client('sts')
+
+        #role_arn = f"arn:aws:iam::{aws_account_id}:role/{role_name}"
+        assumed_role_object = sts_client.assume_role(
+            RoleArn=create_connector_role_arn,
+            RoleSessionName=role_session_name,
+        )
+
+        # Obtain the temporary credentials from the assumed role 
+        temp_credentials = assumed_role_object["Credentials"]
+
+        return temp_credentials
+    
+    def get_ml_auth(self, create_connector_role_name):
+        """
+        Obtain AWS4Auth credentials for ML API calls using the specified IAM role.
+        """
+        create_connector_role_arn = self.get_role_arn(create_connector_role_name)
+        if not create_connector_role_arn:
+            raise Exception(f"IAM role '{create_connector_role_name}' not found.")
+
+        temp_credentials = self.assume_role(create_connector_role_arn)
+        awsauth = AWS4Auth(
+            temp_credentials["AccessKeyId"],
+            temp_credentials["SecretAccessKey"],
+            self.region,
+            'es',
+            session_token=temp_credentials["SessionToken"],
+        )
+        return awsauth
+
+    def create_connector(self, create_connector_role_name, payload):
+        create_connector_role_arn = self.get_role_arn(create_connector_role_name)
+        temp_credentials = self.assume_role(create_connector_role_arn)
+        awsauth = AWS4Auth(
+            temp_credentials["AccessKeyId"],
+            temp_credentials["SecretAccessKey"],
+            self.region,
+            'es',
+            session_token=temp_credentials["SessionToken"],
+        )
+
+        path = '/_plugins/_ml/connectors/_create'
+        url = self.opensearch_domain_url + path
+
+        headers = {"Content-Type": "application/json"}
+
+        r = requests.post(url, auth=awsauth, json=payload, headers=headers)
+        print(r.text)
+        connector_id = json.loads(r.text)['connector_id']
+        return connector_id
+    
+    def search_model_group(self, model_group_name):
+        payload = {
+            "query": {
+                "term": {
+                    "name.keyword": {
+                        "value": model_group_name
+                    }
+                }
+            }
+        }
+        headers = {"Content-Type": "application/json"}
+        
+        # Obtain temporary credentials
+        create_connector_role_arn = self.get_role_arn('my_test_create_bedrock_connector_role')  # Replace with actual role name
+        temp_credentials = self.assume_role(create_connector_role_arn)
+        awsauth = AWS4Auth(
+            temp_credentials["AccessKeyId"],
+            temp_credentials["SecretAccessKey"],
+            self.region,
+            'es',
+            session_token=temp_credentials["SessionToken"],
+        )
+        
+        r = requests.post(
+            f'{self.opensearch_domain_url}/_plugins/_ml/model_groups/_search',
+            auth=awsauth,
+            json=payload,
+            headers=headers
+        )
+        
+        response = json.loads(r.text)
+        return response
+    
+    def create_model_group(self, model_group_name, description, create_connector_role_name):
+        search_model_group_response = self.search_model_group(model_group_name)
+        print("Search Model Group Response:", search_model_group_response)
+        
+        if 'hits' in search_model_group_response and search_model_group_response['hits']['total']['value'] > 0:
+            return search_model_group_response['hits']['hits'][0]['_id']
+        
+        payload = {
+            "name": model_group_name,
+            "description": description
+        }
+        headers = {"Content-Type": "application/json"}
+        
+        # Obtain temporary credentials using the provided role name
+        create_connector_role_arn = self.get_role_arn(create_connector_role_name)
+        temp_credentials = self.assume_role(create_connector_role_arn)
+        awsauth = AWS4Auth(
+            temp_credentials["AccessKeyId"],
+            temp_credentials["SecretAccessKey"],
+            self.region,
+            'es',
+            session_token=temp_credentials["SessionToken"],
+        )
+        
+        r = requests.post(
+            f'{self.opensearch_domain_url}/_plugins/_ml/model_groups/_register',
+            auth=awsauth,
+            json=payload,
+            headers=headers
+        )
+        
+        print(r.text)
+        response = json.loads(r.text)
+        
+        if 'model_group_id' in response:
+            return response['model_group_id']
+        else:
+            # Handle error gracefully
+            raise KeyError("The response does not contain 'model_group_id'. Response content: {}".format(response))
+    
+    def get_task(self, task_id, create_connector_role_name):
+        try:
+            awsauth = self.get_ml_auth(create_connector_role_name)
+            r = requests.get(
+                f'{self.opensearch_domain_url}/_plugins/_ml/tasks/{task_id}',
+                auth=awsauth
+            )
+            print("Get Task Response:", r.text)
+            return r
+        except Exception as e:
+            print(f"Error in get_task: {e}")
+            raise
+    
+    def create_model(self, model_name, description, connector_id, create_connector_role_name, deploy=True):
+        try:
+            model_group_id = self.create_model_group(model_name, description, create_connector_role_name)
+            payload = {
+                "name": model_name,
+                "function_name": "remote",
+                "description": description,
+                "model_group_id": model_group_id,
+                "connector_id": connector_id
+            }
+            headers = {"Content-Type": "application/json"}
+            deploy_str = str(deploy).lower()
+
+            awsauth = self.get_ml_auth(create_connector_role_name)
+
+            r = requests.post(
+                f'{self.opensearch_domain_url}/_plugins/_ml/models/_register?deploy={deploy_str}',
+                auth=awsauth,
+                json=payload,
+                headers=headers
+            )
+
+            print("Create Model Response:", r.text)
+            response = json.loads(r.text)
+
+            if 'model_id' in response:
+                return response['model_id']
+            elif 'task_id' in response:
+                # Handle asynchronous task
+                time.sleep(2)  # Wait for task to complete
+                task_response = self.get_task(response['task_id'], create_connector_role_name)
+                print("Task Response:", task_response.text)
+                task_result = json.loads(task_response.text)
+                if 'model_id' in task_result:
+                    return task_result['model_id']
+                else:
+                    raise KeyError(f"'model_id' not found in task response: {task_result}")
+            elif 'error' in response:
+                raise Exception(f"Error creating model: {response['error']}")
+            else:
+                raise KeyError(f"The response does not contain 'model_id' or 'task_id'. Response content: {response}")
+        except Exception as e:
+            print(f"Error in create_model: {e}")
+            raise
+    
+    def deploy_model(self, model_id):
+        headers = {"Content-Type": "application/json"}
+        return requests.post(f'{self.opensearch_domain_url}/_plugins/_ml/models/{model_id}/_deploy',
+                             auth=HTTPBasicAuth(self.opensearch_domain_username, self.opensearch_domain_password),
+                             headers=headers)
+    
+    def predict(self, model_id, payload):
+        headers = {"Content-Type": "application/json"}
+        r = requests.post(
+            f'{self.opensearch_domain_url}/_plugins/_ml/models/{model_id}/_predict',
+            auth=HTTPBasicAuth(self.opensearch_domain_username, self.opensearch_domain_password),
+            json=payload,
+            headers=headers
+        )
+    
+    def create_connector_with_secret(self, secret_name, secret_value, connector_role_name, create_connector_role_name, create_connector_input, sleep_time_in_seconds=10):
+        # Step1: Create Secret
+        print('Step1: Create Secret')
+        if not self.secret_exists(secret_name):
+            secret_arn = self.create_secret(secret_name, secret_value)
+        else:
+            print('secret exists, skip creating')
+            secret_arn = self.get_secret_arn(secret_name)
+        #print(secret_arn)
+        print('----------')
+        
+        # Step2: Create IAM role configued in connector
+        trust_policy = {
+          "Version": "2012-10-17",
+          "Statement": [
+            {
+              "Effect": "Allow",
+              "Principal": {
+                "Service": "es.amazonaws.com"
+              },
+              "Action": "sts:AssumeRole"
+            }
+          ]
+        }
+
+        inline_policy = {
+            "Version": "2012-10-17",
+            "Statement": [
+                {
+                    "Action": [
+                        "secretsmanager:GetSecretValue",
+                        "secretsmanager:DescribeSecret"
+                    ],
+                    "Effect": "Allow",
+                    "Resource": secret_arn
+                }
+            ]
+        }
+
+        print('Step2: Create IAM role configued in connector')
+        if not self.role_exists(connector_role_name):
+            connector_role_arn = self.create_iam_role(connector_role_name, trust_policy, inline_policy)
+        else:
+            print('role exists, skip creating')
+            connector_role_arn = self.get_role_arn(connector_role_name)
+        #print(connector_role_arn)
+        print('----------')
+        
+        # Step 3: Configure IAM role in OpenSearch
+        # 3.1 Create IAM role for Signing create connector request
+        user_arn = self.get_user_arn(self.aws_user_name)
+        role_arn = self.get_role_arn(self.aws_role_name)
+        statements = []
+        if user_arn:
+            statements.append({
+                "Effect": "Allow",
+                "Principal": {
+                    "AWS": user_arn
+                },
+                "Action": "sts:AssumeRole"
+            })
+        if role_arn:
+            statements.append({
+                "Effect": "Allow",
+                "Principal": {
+                    "AWS": role_arn
+                },
+                "Action": "sts:AssumeRole"
+            })
+        trust_policy = {
+            "Version": "2012-10-17",
+            "Statement": statements
+        }
+
+        inline_policy = {
+            "Version": "2012-10-17",
+            "Statement": [
+                {
+                    "Effect": "Allow",
+                    "Action": "iam:PassRole",
+                    "Resource": connector_role_arn
+                },
+                {
+                    "Effect": "Allow",
+                    "Action": "es:ESHttpPost",
+                    "Resource": self.opensearch_domain_arn
+                }
+            ]
+        }
+
+        print('Step 3: Configure IAM role in OpenSearch')
+        print('Step 3.1: Create IAM role for Signing create connector request')
+        if not self.role_exists(create_connector_role_name):
+            create_connector_role_arn = self.create_iam_role(create_connector_role_name, trust_policy, inline_policy)
+        else:
+            print('role exists, skip creating')
+            create_connector_role_arn = self.get_role_arn(create_connector_role_name)
+        #print(create_connector_role_arn)
+        print('----------')
+        
+        # 3.2 Map backend role
+        print(f'Step 3.2: Map IAM role {create_connector_role_name} to OpenSearch permission role')
+        self.map_iam_role_to_backend_role(create_connector_role_arn)
+        print('----------')
+        
+        # 4. Create connector
+        print('Step 4: Create connector in OpenSearch')
+        # When you create an IAM role, it can take some time for the changes to propagate across AWS systems.
+        # During this time, some services might not immediately recognize the new role or its permissions.
+        # So we wait for some time before creating connector.
+        # If you see such error: ClientError: An error occurred (AccessDenied) when calling the AssumeRole operation
+        # you can rerun this function.
+        
+        # Wait for some time
+        time.sleep(sleep_time_in_seconds)
+        payload = create_connector_input
+        payload['credential'] = {
+            "secretArn": secret_arn,
+            "roleArn": connector_role_arn
+        }
+        connector_id = self.create_connector(create_connector_role_name, payload)
+        #print(connector_id)
+        print('----------')
+        return connector_id
+    
+    def create_connector_with_role(self, connector_role_inline_policy, connector_role_name, create_connector_role_name, create_connector_input, sleep_time_in_seconds=10):
+            # Step1: Create IAM role configued in connector
+            trust_policy = {
+            "Version": "2012-10-17",
+            "Statement": [
+                {
+                "Effect": "Allow",
+                "Principal": {
+                    "Service": "es.amazonaws.com"
+                },
+                "Action": "sts:AssumeRole"
+                }
+            ]
+            }
+
+            print('Step1: Create IAM role configued in connector')
+            if not self.role_exists(connector_role_name):
+                connector_role_arn = self.create_iam_role(connector_role_name, trust_policy, connector_role_inline_policy)
+            else:
+                print('role exists, skip creating')
+                connector_role_arn = self.get_role_arn(connector_role_name)
+            #print(connector_role_arn)
+            print('----------')
+
+            # Step 2: Configure IAM role in OpenSearch
+            # 2.1 Create IAM role for Signing create connector request
+            user_arn = self.get_user_arn(self.aws_user_name)
+            role_arn = self.get_role_arn(self.aws_role_name)
+            statements = []
+            if user_arn:
+                statements.append({
+                    "Effect": "Allow",
+                    "Principal": {
+                        "AWS": user_arn
+                    },
+                    "Action": "sts:AssumeRole"
+                })
+            if role_arn:
+                statements.append({
+                    "Effect": "Allow",
+                    "Principal": {
+                        "AWS": role_arn
+                    },
+                    "Action": "sts:AssumeRole"
+                })
+            trust_policy = {
+                "Version": "2012-10-17",
+                "Statement": statements
+            }
+
+            inline_policy = {
+                "Version": "2012-10-17",
+                "Statement": [
+                    {
+                        "Effect": "Allow",
+                        "Action": "iam:PassRole",
+                        "Resource": connector_role_arn
+                    },
+                    {
+                        "Effect": "Allow",
+                        "Action": "es:ESHttpPost",
+                        "Resource": self.opensearch_domain_arn
+                    }
+                ]
+            }
+
+            print('Step 2: Configure IAM role in OpenSearch')
+            print('Step 2.1: Create IAM role for Signing create connector request')
+            if not self.role_exists(create_connector_role_name):
+                create_connector_role_arn = self.create_iam_role(create_connector_role_name, trust_policy, inline_policy)
+            else:
+                print('role exists, skip creating')
+                create_connector_role_arn = self.get_role_arn(create_connector_role_name)
+            #print(create_connector_role_arn)
+            print('----------')
+
+            # 2.2 Map backend role
+            print(f'Step 2.2: Map IAM role {create_connector_role_name} to OpenSearch permission role')
+            self.map_iam_role_to_backend_role(create_connector_role_arn)
+            print('----------')
+
+            # 3. Create connector
+            print('Step 3: Create connector in OpenSearch')
+            # When you create an IAM role, it can take some time for the changes to propagate across AWS systems.
+            # During this time, some services might not immediately recognize the new role or its permissions.
+            # So we wait for some time before creating connector.
+            # If you see such error: ClientError: An error occurred (AccessDenied) when calling the AssumeRole operation
+            # you can rerun this function.
+
+            # Wait for some time
+            time.sleep(sleep_time_in_seconds)
+            payload = create_connector_input
+            payload['credential'] = {
+                "roleArn": connector_role_arn
+            }
+            connector_id = self.create_connector(create_connector_role_name, payload)
+            #print(connector_id)
+            print('----------')
+            return connector_id
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
index 6942e4ee..38103251 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -43,7 +43,6 @@
 init(autoreset=True)  # Initialize colorama
 
 class Ingest:
-    EMBEDDING_MODEL_ID = 'amazon.titan-embed-text-v2:0'
 
     def __init__(self, config):
         # Initialize the Ingest class with configuration
@@ -52,22 +51,22 @@ def __init__(self, config):
         self.index_name = config.get('index_name')
         self.bedrock_client = None
         self.opensearch = OpenSearchConnector(config)
+        self.embedding_model_id = config.get('embedding_model_id')
+
+        if not self.embedding_model_id:
+            print("Embedding model ID is not set. Please run setup first.")
+            return
 
     def initialize_clients(self):
-        # Initialize AWS Bedrock and OpenSearch clients
-        # Returns True if successful, False otherwise
-        try:
-            self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
-            if self.opensearch.initialize_opensearch_client():
-                print("Clients initialized successfully.")
-                return True
-            else:
-                print("Failed to initialize OpenSearch client.")
-                return False
-        except Exception as e:
-            print(f"Failed to initialize clients: {e}")
+        # Initialize OpenSearch client
+        if self.opensearch.initialize_opensearch_client():
+            print("OpenSearch client initialized successfully.")
+            return True
+        else:
+            print("Failed to initialize OpenSearch client.")
             return False
 
+
     def process_file(self, file_path: str) -> List[Dict[str, str]]:
         # Process a file based on its extension
         # Supports CSV, TXT, and PDF files
@@ -86,18 +85,16 @@ def process_file(self, file_path: str) -> List[Dict[str, str]]:
 
     def process_csv(self, file_path: str) -> List[Dict[str, str]]:
         # Process a CSV file
-        # Extracts information and formats it into a sentence
-        # Returns a list of dictionaries with the formatted text
+        # Extracts information and returns a list of dictionaries
+        # Each dictionary contains the entire row content
         documents = []
-        with open(file_path, 'r') as csvfile:
+        with open(file_path, 'r', newline='', encoding='utf-8') as csvfile:
             reader = csv.DictReader(csvfile)
             for row in reader:
-                text = f"{row['name']} got nominated under the category, {row['category']}, for the film {row['film']}"
-                if row.get('winner', '').lower() != 'true':
-                    text += " but did not win"
-                documents.append({"text": text})
+                documents.append({"text": json.dumps(row)})
         return documents
 
+
     def process_txt(self, file_path: str) -> List[Dict[str, str]]:
         # Process a TXT file
         # Reads the entire content of the file
@@ -120,40 +117,54 @@ def process_pdf(self, file_path: str) -> List[Dict[str, str]]:
         return documents
 
     def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
-        # Generate text embedding using AWS Bedrock
-        # Implements exponential backoff for retries in case of failures
-        # Returns the embedding if successful, None otherwise
-        if self.bedrock_client is None:
-            print("Bedrock client is not initialized. Please run setup first.")
+        if self.opensearch is None:
+            print("OpenSearch client is not initialized. Please run setup first.")
             return None
-        
+
         delay = initial_delay
         for attempt in range(max_retries):
             try:
-                payload = {"inputText": text}
-                response = self.bedrock_client.invoke_model(modelId=self.EMBEDDING_MODEL_ID, body=json.dumps(payload))
-                response_body = json.loads(response['body'].read())
-                embedding = response_body.get('embedding')
-                if embedding is None:
-                    print(f"No embedding returned for text: {text}")
-                    print(f"Response body: {response_body}")
+                payload = {
+                    "text_docs": [text]
+                }
+                response = self.opensearch.opensearch_client.transport.perform_request(
+                    method="POST",
+                    url=f"/_plugins/_ml/_predict/text_embedding/{self.embedding_model_id}",
+                    body=payload
+                )
+                inference_results = response.get('inference_results', [])
+                if not inference_results:
+                    print(f"No inference results returned for text: {text}")
                     return None
-                return embedding
-            except botocore.exceptions.ClientError as e:
-                error_code = e.response['Error']['Code']
-                error_message = e.response['Error']['Message']
-                print(f"ClientError on attempt {attempt + 1}: {error_code} - {error_message}")
-                if error_code == 'ThrottlingException':
-                    if attempt == max_retries - 1:
-                        raise
-                    time.sleep(delay + random.uniform(0, 1))
-                    delay *= backoff_factor
+                output = inference_results[0].get('output')
+
+                # Remove or comment out the debugging print statements
+                # print(f"Output type: {type(output)}")
+                # print(f"Output content: {output}")
+
+                # Adjust the extraction of embedding data
+                if isinstance(output, list) and len(output) > 0:
+                    embedding_dict = output[0]
+                    if isinstance(embedding_dict, dict) and 'data' in embedding_dict:
+                        embedding = embedding_dict['data']
+                    else:
+                        print(f"Unexpected embedding output format: {output}")
+                        return None
+                elif isinstance(output, dict) and 'data' in output:
+                    embedding = output['data']
                 else:
-                    raise
+                    print(f"Unexpected embedding output format: {output}")
+                    return None
+
+                # Optionally, you can also remove this print statement if you prefer
+                # print(f"Extracted embedding of length {len(embedding)}")
+                return embedding
             except Exception as ex:
-                print(f"Unexpected error on attempt {attempt + 1}: {ex}")
+                print(f"Error on attempt {attempt + 1}: {ex}")
                 if attempt == max_retries - 1:
                     raise
+                time.sleep(delay)
+                delay *= backoff_factor
         return None
 
     def process_and_ingest_data(self, file_paths: List[str]):
@@ -208,7 +219,7 @@ def process_and_ingest_data(self, file_paths: List[str]):
                     "_index": self.index_name,
                     "_source": {
                         "nominee_text": doc['text'],
-                        "nominee_vector": doc['embedding']
+                        "nominee_vector": doc['embedding']  # This is now a list of floats
                     }
                 }
                 actions.append(action)
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_class.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_class.py
deleted file mode 100644
index eca4619c..00000000
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_class.py
+++ /dev/null
@@ -1,127 +0,0 @@
-# opensearch_class.py
-
-from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth, exceptions as opensearch_exceptions
-import boto3
-from urllib.parse import urlparse
-from opensearchpy import helpers as opensearch_helpers
-
-class OpenSearchClass:
-    def __init__(self, config):
-        self.config = config
-        self.opensearch_client = None
-        self.aws_region = config.get('region')
-        self.index_name = config.get('index_name')
-        self.is_serverless = config.get('is_serverless', 'False') == 'True'
-        self.opensearch_endpoint = config.get('opensearch_endpoint')
-        self.opensearch_username = config.get('opensearch_username')
-        self.opensearch_password = config.get('opensearch_password')
-
-    def initialize_opensearch_client(self):
-        if not self.opensearch_endpoint:
-            print("OpenSearch endpoint not set. Please run setup first.")
-            return False
-        
-        parsed_url = urlparse(self.opensearch_endpoint)
-        host = parsed_url.hostname
-        port = parsed_url.port or 443
-
-        if self.is_serverless:
-            credentials = boto3.Session().get_credentials()
-            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
-        else:
-            if not self.opensearch_username or not self.opensearch_password:
-                print("OpenSearch username or password not set. Please run setup first.")
-                return False
-            auth = (self.opensearch_username, self.opensearch_password)
-
-        try:
-            self.opensearch_client = OpenSearch(
-                hosts=[{'host': host, 'port': port}],
-                http_auth=auth,
-                use_ssl=True,
-                verify_certs=True,
-                connection_class=RequestsHttpConnection,
-                pool_maxsize=20
-            )
-            print(f"Initialized OpenSearch client with host: {host} and port: {port}")
-            return True
-        except Exception as ex:
-            print(f"Error initializing OpenSearch client: {ex}")
-            return False
-
-    def create_index(self, embedding_dimension, space_type):
-        index_body = {
-            "mappings": {
-                "properties": {
-                    "nominee_text": {"type": "text"},
-                    "nominee_vector": {
-                        "type": "knn_vector",
-                        "dimension": embedding_dimension,
-                        "method": {
-                            "name": "hnsw",
-                            "space_type": space_type,
-                            "engine": "nmslib",
-                            "parameters": {"ef_construction": 512, "m": 16},
-                        },
-                    },
-                }
-            },
-            "settings": {
-                "index": {
-                    "number_of_shards": 2,
-                    "knn.algo_param": {"ef_search": 512},
-                    "knn": True,
-                }
-            },
-        }
-        try:
-            self.opensearch_client.indices.create(index=self.index_name, body=index_body)
-            print(f"KNN index '{self.index_name}' created successfully with dimension {embedding_dimension} and space type {space_type}.")
-        except opensearch_exceptions.RequestError as e:
-            if 'resource_already_exists_exception' in str(e).lower():
-                print(f"Index '{self.index_name}' already exists.")
-            else:
-                print(f"Error creating index '{self.index_name}': {e}")
-
-    def verify_and_create_index(self, embedding_dimension, space_type):
-        try:
-            index_exists = self.opensearch_client.indices.exists(index=self.index_name)
-            if index_exists:
-                print(f"KNN index '{self.index_name}' already exists.")
-            else:
-                self.create_index(embedding_dimension, space_type)
-            return True
-        except Exception as ex:
-            print(f"Error verifying or creating index: {ex}")
-            return False
-
-    def bulk_index(self, actions):
-        try:
-            success, failed = opensearch_helpers.bulk(self.opensearch_client, actions)
-            print(f"Indexed {success} documents successfully. Failed to index {failed} documents.")
-            return success, failed
-        except Exception as e:
-            print(f"Error during bulk indexing: {e}")
-            return 0, len(actions)
-
-    def search(self, vector, k=5):
-        try:
-            response = self.opensearch_client.search(
-                index=self.index_name,
-                body={
-                    "size": k,
-                    "_source": ["nominee_text"],
-                    "query": {
-                        "knn": {
-                            "nominee_vector": {
-                                "vector": vector,
-                                "k": k
-                            }
-                        }
-                    }
-                }
-            )
-            return response['hits']['hits']
-        except Exception as e:
-            print(f"Error during search: {e}")
-            return []
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
index 6fb0a5d5..40c48c85 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
@@ -36,7 +36,6 @@
 init(autoreset=True)  # Initialize colorama
 
 class Query:
-    EMBEDDING_MODEL_ID = 'amazon.titan-embed-text-v2:0'
     LLM_MODEL_ID = 'amazon.titan-text-express-v1'
 
     def __init__(self, config):
@@ -46,7 +45,7 @@ def __init__(self, config):
         self.index_name = config.get('index_name')
         self.bedrock_client = None
         self.opensearch = OpenSearchConnector(config)
-
+        self.embedding_model_id = config.get('embedding_model_id')
     def initialize_clients(self):
         # Initialize AWS Bedrock and OpenSearch clients
         # Returns True if successful, False otherwise
@@ -63,40 +62,55 @@ def initialize_clients(self):
             return False
 
     def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
-        # Generate text embedding using AWS Bedrock
-        # Implements exponential backoff for retries in case of failures
-        # Returns the embedding if successful, None otherwise
-        if self.bedrock_client is None:
-            print("Bedrock client is not initialized. Please run setup first.")
+        if self.opensearch is None:
+            print("OpenSearch client is not initialized. Please run setup first.")
             return None
-        
+
         delay = initial_delay
         for attempt in range(max_retries):
             try:
-                payload = {"inputText": text}
-                response = self.bedrock_client.invoke_model(modelId=self.EMBEDDING_MODEL_ID, body=json.dumps(payload))
-                response_body = json.loads(response['body'].read())
-                embedding = response_body.get('embedding')
-                if embedding is None:
-                    print(f"No embedding returned for text: {text}")
-                    print(f"Response body: {response_body}")
+                payload = {
+                    "text_docs": [text]
+                }
+                response = self.opensearch.opensearch_client.transport.perform_request(
+                    method="POST",
+                    url=f"/_plugins/_ml/_predict/text_embedding/{self.embedding_model_id}",
+                    body=payload
+                )
+                inference_results = response.get('inference_results', [])
+                if not inference_results:
+                    print(f"No inference results returned for text: {text}")
                     return None
-                return embedding
-            except botocore.exceptions.ClientError as e:
-                error_code = e.response['Error']['Code']
-                error_message = e.response['Error']['Message']
-                print(f"ClientError on attempt {attempt + 1}: {error_code} - {error_message}")
-                if error_code == 'ThrottlingException':
-                    if attempt == max_retries - 1:
-                        raise
-                    time.sleep(delay + random.uniform(0, 1))
-                    delay *= backoff_factor
+                output = inference_results[0].get('output')
+
+                # Adjust the extraction of embedding data
+                if isinstance(output, list) and len(output) > 0:
+                    embedding_dict = output[0]
+                    if isinstance(embedding_dict, dict) and 'data' in embedding_dict:
+                        embedding = embedding_dict['data']
+                    else:
+                        print(f"Unexpected embedding output format: {output}")
+                        return None
+                elif isinstance(output, dict) and 'data' in output:
+                    embedding = output['data']
                 else:
-                    raise
+                    print(f"Unexpected embedding output format: {output}")
+                    return None
+
+                # Verify that embedding is a list of floats
+                if not isinstance(embedding, list) or not all(isinstance(x, (float, int)) for x in embedding):
+                    print(f"Embedding is not a list of floats: {embedding}")
+                    return None
+
+                # Optionally, remove debugging print statements
+                # print(f"Extracted embedding of length {len(embedding)}")
+                return embedding
             except Exception as ex:
-                print(f"Unexpected error on attempt {attempt + 1}: {ex}")
+                print(f"Error on attempt {attempt + 1}: {ex}")
                 if attempt == max_retries - 1:
                     raise
+                time.sleep(delay)
+                delay *= backoff_factor
         return None
 
     def bulk_query(self, queries, k=5):
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
index b9b09ef1..4335f606 100755
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
@@ -26,7 +26,6 @@
 #  under the License.
 
 
-
 """
 Main CLI script for OpenSearch with Bedrock Integration
 """
@@ -55,7 +54,7 @@ def save_config(config):
 def main():
     # Set up argument parser for CLI
     parser = argparse.ArgumentParser(description="RAG Pipeline CLI")
-    parser.add_argument('command', choices=['setup', 'ingest', 'query'], help='Command to run')
+    parser.add_argument('command', choices=['setup', 'register_model', 'ingest', 'query'], help='Command to run')
     parser.add_argument('--paths', nargs='+', help='Paths to files or directories for ingestion')
     parser.add_argument('--queries', nargs='+', help='Query texts for search and answer generation')
     parser.add_argument('--num_results', type=int, default=5, help='Number of top results to retrieve for each query')
@@ -70,6 +69,11 @@ def main():
         setup = Setup()
         setup.setup_command()
         save_config(setup.config)
+    elif args.command == 'register_model':
+        # Run model registration process
+        setup = Setup()
+        setup.register_model_command()
+        save_config(setup.config)
     elif args.command == 'ingest':
         # Handle ingestion command
         if not args.paths:
@@ -103,4 +107,4 @@ def main():
         parser.print_help()
 
 if __name__ == "__main__":
-    main()
+    main()
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index d75d8eb7..e32f7746 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -36,6 +36,7 @@
 import sys
 from urllib.parse import urlparse
 from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth
+from AIConnectorHelper import AIConnectorHelper
 
 # [Existing license and import statements remain unchanged]
 
@@ -45,18 +46,22 @@ class Setup:
     SERVICE_BEDROCK = 'bedrock-runtime'
 
     def __init__(self):
-        # Initialize setup variables
-        self.aws_region = None
-        self.iam_principal = None
-        self.index_name = None
-        self.collection_name = None
-        self.opensearch_endpoint = None
-        self.is_serverless = None
-        self.opensearch_username = None
-        self.opensearch_password = None
-        self.aoss_client = None
-        self.bedrock_client = None
-        self.opensearch_client = None
+            # Initialize setup variables
+            self.config = self.load_config()
+            self.aws_region = self.config.get('region')
+            self.iam_principal = self.config.get('iam_principal')
+            self.index_name = self.config.get('index_name')
+            self.collection_name = self.config.get('collection_name', '')
+            self.opensearch_endpoint = self.config.get('opensearch_endpoint', '')
+            self.is_serverless = self.config.get('is_serverless', 'False') == 'True'
+            self.opensearch_username = self.config.get('opensearch_username', '')
+            self.opensearch_password = self.config.get('opensearch_password', '')
+            self.aoss_client = None
+            self.bedrock_client = None
+            self.opensearch_client = None
+
+            # Initialize opensearch_domain_name
+            self.opensearch_domain_name = self.get_opensearch_domain_name()
 
     def check_and_configure_aws(self):
         # Check if AWS credentials are configured and offer to reconfigure if needed
@@ -309,6 +314,39 @@ def get_collection_id(self, collection_name):
         except Exception as ex:
             print(f"Error getting collection ID: {ex}")
         return None
+    def get_opensearch_domain_name(self):
+        """
+        Extract the domain name from the OpenSearch endpoint URL.
+        """
+        if self.opensearch_endpoint:
+            parsed_url = urlparse(self.opensearch_endpoint)
+            hostname = parsed_url.hostname  # e.g., 'search-your-domain-name-uniqueid.region.es.amazonaws.com'
+            if hostname:
+                # Split the hostname into parts
+                parts = hostname.split('.')
+                domain_part = parts[0]  # e.g., 'search-your-domain-name-uniqueid'
+                # Remove the 'search-' prefix if present
+                if domain_part.startswith('search-'):
+                    domain_part = domain_part[len('search-'):]
+                # Remove the unique ID suffix after the domain name
+                domain_name = domain_part.rsplit('-', 1)[0]
+                print(f"Extracted domain name: {domain_name}")
+                return domain_name
+        return None
+    def get_opensearch_domain_info(region, domain_name):
+        """
+        Retrieve the OpenSearch domain endpoint and ARN based on the domain name and region.
+        """
+        try:
+            client = boto3.client('opensearch', region_name=region)
+            response = client.describe_domain(DomainName=domain_name)
+            domain_status = response['DomainStatus']
+            domain_endpoint = domain_status.get('Endpoint') or domain_status.get('Endpoints', {}).get('vpc')
+            domain_arn = domain_status['ARN']
+            return domain_endpoint, domain_arn
+        except Exception as e:
+            print(f"Error retrieving OpenSearch domain info: {e}")
+            return None, None
 
     def wait_for_collection_active(self, collection_id, max_wait_minutes=30):
         # Wait for the collection to become active
@@ -361,7 +399,16 @@ def get_collection_endpoint(self):
         except Exception as ex:
             print(f"Error retrieving collection endpoint: {ex}")
             return None
-
+    def get_iam_user_name_from_arn(self, iam_principal_arn):
+        """
+        Extract the IAM user name from the IAM principal ARN.
+        """
+        # IAM user ARN format: arn:aws:iam::123456789012:user/user-name
+        if iam_principal_arn and ':user/' in iam_principal_arn:
+            return iam_principal_arn.split(':user/')[-1]
+        else:
+            return None
+        
     def initialize_opensearch_client(self):
         # Initialize the OpenSearch client
         if not self.opensearch_endpoint:
@@ -529,6 +576,9 @@ def setup_command(self):
                         return
                     else:
                         self.config['opensearch_endpoint'] = self.opensearch_endpoint
+                        self.save_config(self.config)
+                        # Initialize opensearch_domain_name after setting opensearch_endpoint
+                        self.opensearch_domain_name = self.get_opensearch_domain_name()
                 else:
                     print("Collection is not active. Setup incomplete.")
                     return
@@ -536,6 +586,9 @@ def setup_command(self):
             if not self.opensearch_endpoint:
                 print("OpenSearch endpoint not set. Setup incomplete.")
                 return
+            else:
+                # Initialize opensearch_domain_name after setting opensearch_endpoint
+                self.opensearch_domain_name = self.get_opensearch_domain_name()
         
         if self.initialize_opensearch_client():
             print("OpenSearch client initialized successfully. Proceeding with index creation...")
@@ -545,7 +598,353 @@ def setup_command(self):
                 self.config['embedding_dimension'] = str(embedding_dimension)
                 self.config['space_type'] = space_type
                 self.config['ef_construction'] = str(ef_construction)
+                self.save_config(self.config)
             else:
                 print("Index verification failed. Please check your index name and permissions.")
         else:
-            print("Failed to initialize OpenSearch client. Setup incomplete.")
\ No newline at end of file
+            print("Failed to initialize OpenSearch client. Setup incomplete.")
+
+    def register_model_command(self):
+        """
+        Command method to register a new embedding model.
+        Prompts the user to select a model and gathers necessary inputs.
+        """
+        # Load existing config
+        self.config = self.load_config()
+
+        # Initialize clients
+        if not self.initialize_clients():
+            print("Failed to initialize AWS clients. Cannot proceed.")
+            return
+
+        # Ensure opensearch_endpoint is set
+        if not self.opensearch_endpoint:
+            self.opensearch_endpoint = self.config.get('opensearch_endpoint')
+            if not self.opensearch_endpoint:
+                print("OpenSearch endpoint not set. Please run 'setup' command first.")
+                return
+
+        # Initialize opensearch_domain_name
+        self.opensearch_domain_name = self.get_opensearch_domain_name()
+
+        # Extract the IAM user name from the IAM principal ARN
+        aws_user_name = self.get_iam_user_name_from_arn(self.iam_principal)
+
+        if not aws_user_name:
+            print("Could not extract IAM user name from IAM principal ARN.")
+            aws_user_name = input("Enter your AWS IAM user name: ")
+
+        # Instantiate AIConnectorHelper
+        helper = AIConnectorHelper(
+            region=self.aws_region,
+            opensearch_domain_name=self.opensearch_domain_name,
+            opensearch_domain_username=self.opensearch_username,
+            opensearch_domain_password=self.opensearch_password,
+            aws_user_name=aws_user_name,
+            aws_role_name=None  # Set to None or provide if applicable
+        )
+        
+
+        # Prompt user to select a model
+        print("Please select an embedding model to register:")
+        print("1. Bedrock Titan Embedding Model")
+        print("2. SageMaker Embedding Model")
+        print("3. Cohere Embedding Model")
+        print("4. OpenAI Embedding Model")
+        model_choice = input("Enter your choice (1-4): ")
+
+        # Call the appropriate method based on the user's choice
+        if model_choice == '1':
+            self.register_bedrock_model(helper)
+        elif model_choice == '2':
+            self.register_sagemaker_model(helper)
+        elif model_choice == '3':
+            self.register_cohere_model(helper)
+        elif model_choice == '4':
+            self.register_openai_model(helper)
+        else:
+            print("Invalid choice. Exiting.")
+            return
+        
+    def register_bedrock_model(self, helper):
+        """
+        Register a Bedrock embedding model by creating the necessary connector and model in OpenSearch.
+        """
+        # Prompt for necessary inputs
+        bedrock_region = input(f"Enter your Bedrock region [{self.aws_region}]: ") or self.aws_region
+        connector_role_name = "my_test_bedrock_connector_role"
+        create_connector_role_name = "my_test_create_bedrock_connector_role"
+
+        # Set up connector role inline policy
+        connector_role_inline_policy = {
+            "Version": "2012-10-17",
+            "Statement": [
+                {
+                    "Action": ["bedrock:InvokeModel"],
+                    "Effect": "Allow",
+                    "Resource": "arn:aws:bedrock:*::foundation-model/amazon.titan-embed-text-v1"
+                }
+            ]
+        }
+
+        # Create connector input
+        create_connector_input = {
+            "name": "Amazon Bedrock Connector: titan embedding v1",
+            "description": "The connector to Bedrock Titan embedding model",
+            "version": 1,
+            "protocol": "aws_sigv4",
+            "parameters": {
+                "region": bedrock_region,
+                "service_name": "bedrock"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "url": f"https://bedrock-runtime.{bedrock_region}.amazonaws.com/model/amazon.titan-embed-text-v1/invoke",
+                    "headers": {
+                        "content-type": "application/json",
+                        "x-amz-content-sha256": "required"
+                    },
+                    "request_body": "{ \"inputText\": \"${parameters.inputText}\" }",
+                    "pre_process_function": "\n    StringBuilder builder = new StringBuilder();\n    builder.append(\"\\\"\");\n    String first = params.text_docs[0];\n    builder.append(first);\n    builder.append(\"\\\"\");\n    def parameters = \"{\" +\"\\\"inputText\\\":\" + builder + \"}\";\n    return  \"{\" +\"\\\"parameters\\\":\" + parameters + \"}\";",
+                    "post_process_function": "\n      def name = \"sentence_embedding\";\n      def dataType = \"FLOAT32\";\n      if (params.embedding == null || params.embedding.length == 0) {\n        return params.message;\n      }\n      def shape = [params.embedding.length];\n      def json = \"{\" +\n                 \"\\\"name\\\":\\\"\" + name + \"\\\",\" +\n                 \"\\\"data_type\\\":\\\"\" + dataType + \"\\\",\" +\n                 \"\\\"shape\\\":\" + shape + \",\" +\n                 \"\\\"data\\\":\" + params.embedding +\n                 \"}\";\n      return json;\n    "
+                }
+            ]
+        }
+
+        # Create connector
+        connector_id = helper.create_connector_with_role(
+            connector_role_inline_policy,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print("Failed to create connector. Aborting.")
+            return
+
+        # Register model
+# Register model
+        model_name = 'Bedrock embedding model'
+        description = 'Bedrock embedding model for semantic search'
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print("Failed to create model. Aborting.")
+            return
+
+        # Save model_id to config
+        self.config['embedding_model_id'] = model_id
+        self.save_config(self.config)
+        print(f"Model registered successfully. Model ID: {model_id}")
+
+    def register_sagemaker_model(self, helper):
+        """
+        Register a SageMaker embedding model by creating the necessary connector and model in OpenSearch.
+        """
+        # Prompt for necessary inputs
+        sagemaker_endpoint_arn = input("Enter your SageMaker inference endpoint ARN: ")
+        sagemaker_endpoint_url = input("Enter your SageMaker inference endpoint URL: ")
+        sagemaker_region = input(f"Enter your SageMaker region [{self.aws_region}]: ") or self.aws_region
+        connector_role_name = "my_test_sagemaker_connector_role"
+        create_connector_role_name = "my_test_create_sagemaker_connector_role"
+
+        # Set up connector role inline policy
+        connector_role_inline_policy = {
+            "Version": "2012-10-17",
+            "Statement": [
+                {
+                    "Action": ["sagemaker:InvokeEndpoint"],
+                    "Effect": "Allow",
+                    "Resource": sagemaker_endpoint_arn
+                }
+            ]
+        }
+
+        # Create connector input
+        create_connector_input = {
+            "name": "SageMaker embedding model connector",
+            "description": "Connector for my SageMaker embedding model",
+            "version": "1.0",
+            "protocol": "aws_sigv4",
+            "parameters": {
+                "region": sagemaker_region,
+                "service_name": "sagemaker"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "headers": {
+                        "content-type": "application/json"
+                    },
+                    "url": sagemaker_endpoint_url,
+                    "request_body": "${parameters.input}",
+                    "pre_process_function": "connector.pre_process.default.embedding",
+                    "post_process_function": "connector.post_process.default.embedding"
+                }
+            ]
+        }
+
+        # Create connector
+        connector_id = helper.create_connector_with_role(
+            connector_role_inline_policy,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print("Failed to create connector. Aborting.")
+            return
+
+        # Register model
+        model_name = 'SageMaker embedding model'
+        description = 'SageMaker embedding model for semantic search'
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print("Failed to create model. Aborting.")
+            return
+
+        # Save model_id to config
+        self.config['embedding_model_id'] = model_id
+        self.save_config(self.config)
+        print(f"Model registered successfully. Model ID: {model_id}")
+
+    def register_cohere_model(self, helper):
+        """
+        Register a Cohere embedding model by creating the necessary connector and model in OpenSearch.
+        """
+        # Prompt for necessary inputs
+        secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
+        secret_key = 'cohere_api_key'
+        cohere_api_key = input("Enter your Cohere API key: ")
+        secret_value = {secret_key: cohere_api_key}
+
+        connector_role_name = "my_test_cohere_connector_role"
+        create_connector_role_name = "my_test_create_cohere_connector_role"
+
+        # Create connector input
+        create_connector_input = {
+            "name": "Cohere Embedding Model Connector",
+            "description": "Connector for Cohere embedding model",
+            "version": "1.0",
+            "protocol": "http",
+            "parameters": {
+                "model": "embed-english-v3.0",
+                "input_type": "search_document",
+                "truncate": "END"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "url": "https://api.cohere.ai/v1/embed",
+                    "headers": {
+                        "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
+                        "Request-Source": "unspecified:opensearch"
+                    },
+                    "request_body": "{ \"texts\": ${parameters.texts}, \"truncate\": \"${parameters.truncate}\", \"model\": \"${parameters.model}\", \"input_type\": \"${parameters.input_type}\" }",
+                    "pre_process_function": "connector.pre_process.cohere.embedding",
+                    "post_process_function": "connector.post_process.cohere.embedding"
+                }
+            ]
+        }
+
+        # Create connector
+        connector_id = helper.create_connector_with_secret(
+            secret_name,
+            secret_value,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print("Failed to create connector. Aborting.")
+            return
+
+        # Register model
+        model_name = 'Cohere embedding model'
+        description = 'Cohere embedding model for semantic search'
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print("Failed to create model. Aborting.")
+            return
+
+        # Save model_id to config
+        self.config['embedding_model_id'] = model_id
+        self.save_config(self.config)
+        print(f"Model registered successfully. Model ID: {model_id}")
+
+    def register_openai_model(self, helper):
+        """
+        Register an OpenAI embedding model by creating the necessary connector and model in OpenSearch.
+        """
+        # Prompt for necessary inputs
+        secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
+        secret_key = 'openai_api_key'
+        openai_api_key = input("Enter your OpenAI API key: ")
+        secret_value = {secret_key: openai_api_key}
+
+        connector_role_name = "my_test_openai_connector_role"
+        create_connector_role_name = "my_test_create_openai_connector_role"
+
+        # Create connector input
+        create_connector_input = {
+            "name": "OpenAI Embedding Model Connector",
+            "description": "Connector for OpenAI embedding model",
+            "version": "1.0",
+            "protocol": "http",
+            "parameters": {
+                "model": "text-embedding-ada-002"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "url": "https://api.openai.com/v1/embeddings",
+                    "headers": {
+                        "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
+                    },
+                    "request_body": "{ \"input\": ${parameters.input}, \"model\": \"${parameters.model}\" }",
+                    "pre_process_function": "connector.pre_process.openai.embedding",
+                    "post_process_function": "connector.post_process.openai.embedding"
+                }
+            ]
+        }
+
+        # Create connector
+        connector_id = helper.create_connector_with_secret(
+            secret_name,
+            secret_value,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print("Failed to create connector. Aborting.")
+            return
+
+        # Register model
+        model_name = 'OpenAI embedding model'
+        description = 'OpenAI embedding model for semantic search'
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print("Failed to create model. Aborting.")
+            return
+
+        # Save model_id to config
+        self.config['embedding_model_id'] = model_id
+        self.save_config(self.config)
+        print(f"Model registered successfully. Model ID: {model_id}")
\ No newline at end of file

From 263575139a905b002e92f95a64bedafe1ad0eb81 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Thu, 21 Nov 2024 01:57:16 -0800
Subject: [PATCH 07/42] Sign-off on all previous work

This commit serves as a blanket sign-off for all previous commits in this pull request,
in compliance with the Developer Certificate of Origin (DCO).

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>

From 88cf68b17ec52277a946efa14c48dd5e600968f7 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 22 Nov 2024 01:51:22 -0800
Subject: [PATCH 08/42] Enhance RAG pipeline functionality and user experience

- Add functionality for users to upload entire folders by specifying a file path, enabling batch processing of multiple files
- Show path to config file
- Implement a visual confirmation system for setup completion, using red/green indicators similar to the document ingestion process
- Combine the RAG setup and model registration into one unified process, prompting users if they want to register a model, offering options or if CX wants to use their already made custom model ID input, and providing clear confirmation when a model ID is saved, all while streamlining the overall setup for improved user experience
- Update user interface starting from setup

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/ingest.py     |   4 +-
 .../ml_commons/rag_pipeline/rag/rag.py        | 161 ++++++++++++++----
 .../ml_commons/rag_pipeline/rag/rag_setup.py  |  94 ++++++----
 3 files changed, 188 insertions(+), 71 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
index 38103251..c1372505 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -236,7 +236,9 @@ def ingest_command(self, paths: List[str]):
             if os.path.isfile(path):
                 all_files.append(path)
             elif os.path.isdir(path):
-                all_files.extend(glob.glob(os.path.join(path, '*')))
+                for root, dirs, files in os.walk(path):
+                    for file in files:
+                        all_files.append(os.path.join(root, file))
             else:
                 print(f"{Fore.YELLOW}Invalid path: {path}{Style.RESET_ALL}")
         
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
index 4335f606..0e86bf15 100755
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
@@ -4,27 +4,25 @@
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
-# Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
+# Any modifications Copyright OpenSearch Contributors.
+# See GitHub history for details.
 
-
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
+# Licensed to Elasticsearch B.V. under one or more contributor
+# license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright
+# ownership. Elasticsearch B.V. licenses this file to you under
+# the Apache License, Version 2.0 (the "License"); you may
+# not use this file except in compliance with the License.
+# You may obtain a copy of the License at
 #
-# 	http://www.apache.org/licenses/LICENSE-2.0
+#   http://www.apache.org/licenses/LICENSE-2.0
 #
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
 
 """
 Main CLI script for OpenSearch with Bedrock Integration
@@ -32,60 +30,144 @@
 
 import argparse
 import configparser
+import sys
+from colorama import Fore, Style, init
+from rich.console import Console
+from rich.prompt import Prompt
 from rag_setup import Setup
 from ingest import Ingest
 from query import Query
 
+# Initialize colorama
+init(autoreset=True)
+
+# Initialize Rich console
+console = Console()
+
 CONFIG_FILE = 'config.ini'
 
+
 def load_config():
-    # Load configuration from the config file
+    """
+    Load configuration from the config file.
+    """
     config = configparser.ConfigParser()
     config.read(CONFIG_FILE)
+    if 'DEFAULT' not in config:
+        console.print(f"[{Fore.RED}ERROR{Style.RESET_ALL}] 'DEFAULT' section missing in {CONFIG_FILE}. Please run the setup command first.")
+        sys.exit(1)
     return config['DEFAULT']
 
+
 def save_config(config):
-    # Save configuration to the config file
+    """
+    Save configuration to the config file.
+    """
     parser = configparser.ConfigParser()
     parser['DEFAULT'] = config
-    with open(CONFIG_FILE, 'w') as f:
-        parser.write(f)
-    
+    try:
+        with open(CONFIG_FILE, 'w') as f:
+            parser.write(f)
+        console.print(f"[{Fore.GREEN}SUCCESS{Style.RESET_ALL}] Configuration saved to {CONFIG_FILE}.")
+    except Exception as e:
+        console.print(f"[{Fore.RED}ERROR{Style.RESET_ALL}] Failed to save configuration: {e}")
+
+
 def main():
-    # Set up argument parser for CLI
-    parser = argparse.ArgumentParser(description="RAG Pipeline CLI")
-    parser.add_argument('command', choices=['setup', 'register_model', 'ingest', 'query'], help='Command to run')
-    parser.add_argument('--paths', nargs='+', help='Paths to files or directories for ingestion')
-    parser.add_argument('--queries', nargs='+', help='Query texts for search and answer generation')
-    parser.add_argument('--num_results', type=int, default=5, help='Number of top results to retrieve for each query')
+    """
+    Main function to parse arguments and execute commands.
+    """
+    # Set up argument parser for CLI with Rich help formatting
+    parser = argparse.ArgumentParser(
+        description="RAG Pipeline CLI",
+        formatter_class=argparse.RawTextHelpFormatter,
+        epilog="""
+Examples:
+Initialize the setup:
+  rag setup
+
+Ingest documents from multiple paths:
+  rag ingest --paths /data/docs /data/reports
+
+Execute queries with default number of results:
+  rag query --queries "What is OpenSearch?" "How does Bedrock work?"
 
+Execute queries with a specified number of results:
+  rag query --queries "What is OpenSearch?" --num_results 3
+"""
+    )
+    subparsers = parser.add_subparsers(title="Available Commands", dest="command")
+
+    # Setup command
+    setup_parser = subparsers.add_parser(
+        'setup',
+        help='Initialize and configure the RAG pipeline.'
+    )
+
+    # Ingest command
+    ingest_parser = subparsers.add_parser(
+        'ingest',
+        help='Ingest documents into OpenSearch.'
+    )
+    ingest_parser.add_argument(
+        '--paths',
+        nargs='+',
+        help='Paths to files or directories for ingestion.'
+    )
+
+    # Query command
+    query_parser = subparsers.add_parser(
+        'query',
+        help='Execute queries and generate answers.'
+    )
+    query_parser.add_argument(
+        '--queries',
+        nargs='+',
+        help='Query texts for search and answer generation.'
+    )
+    query_parser.add_argument(
+        '--num_results',
+        type=int,
+        default=5,
+        help='Number of top results to retrieve for each query. (default: 5)'
+    )
+
+    # Parse arguments
     args = parser.parse_args()
 
+    # Only display the banner if no command is executed
+    if not args.command:
+        console.print("[bold cyan]Welcome to the RAG Pipeline[/bold cyan]")
+        console.print("Use [bold blue]rag setup[/bold blue], [bold blue]rag ingest[/bold blue], or [bold blue]rag query[/bold blue] to begin.\n")
+
     # Load existing configuration
-    config = load_config()
+    if args.command != 'setup' and args.command:
+        config = load_config()
+    else:
+        config = None  # Setup may create the config
 
+    # Handle commands
     if args.command == 'setup':
         # Run setup process
         setup = Setup()
+        console.print("[bold blue]Starting setup process...[/bold blue]")
         setup.setup_command()
         save_config(setup.config)
-    elif args.command == 'register_model':
-        # Run model registration process
-        setup = Setup()
-        setup.register_model_command()
-        save_config(setup.config)
     elif args.command == 'ingest':
         # Handle ingestion command
         if not args.paths:
             # If no paths provided as arguments, prompt user for input
             paths = []
             while True:
-                path = input("Enter a file or directory path (or press Enter to finish): ")
+                path = Prompt.ask("Enter a file or directory path (or press Enter to finish)", default="", show_default=False)
                 if not path:
                     break
                 paths.append(path)
         else:
             paths = args.paths
+        if not paths:
+            console.print(f"[{Fore.RED}ERROR{Style.RESET_ALL}] No paths provided for ingestion. Aborting.")
+            sys.exit(1)
         ingest = Ingest(config)
         ingest.ingest_command(paths)
     elif args.command == 'query':
@@ -94,17 +176,22 @@ def main():
             # If no queries provided as arguments, prompt user for input
             queries = []
             while True:
-                query = input("Enter a query (or press Enter to finish): ")
+                query = Prompt.ask("Enter a query (or press Enter to finish)", default="", show_default=False)
                 if not query:
                     break
                 queries.append(query)
         else:
             queries = args.queries
+        if not queries:
+            console.print(f"[{Fore.RED}ERROR{Style.RESET_ALL}] No queries provided. Aborting.")
+            sys.exit(1)
         query = Query(config)
         query.query_command(queries, num_results=args.num_results)
     else:
         # If an invalid command is provided, print help
         parser.print_help()
+        sys.exit(1)
+
 
 if __name__ == "__main__":
     main()
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index e32f7746..983ef7e9 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -37,9 +37,9 @@
 from urllib.parse import urlparse
 from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth
 from AIConnectorHelper import AIConnectorHelper
+from colorama import Fore, Style, init
 
-# [Existing license and import statements remain unchanged]
-
+init(autoreset=True)
 class Setup:
     CONFIG_FILE = 'config.ini'
     SERVICE_AOSS = 'opensearchserverless'
@@ -59,8 +59,6 @@ def __init__(self):
             self.aoss_client = None
             self.bedrock_client = None
             self.opensearch_client = None
-
-            # Initialize opensearch_domain_name
             self.opensearch_domain_name = self.get_opensearch_domain_name()
 
     def check_and_configure_aws(self):
@@ -558,21 +556,21 @@ def setup_command(self):
         self.setup_configuration()
         
         if not self.initialize_clients():
-            print("Failed to initialize AWS clients. Setup incomplete.")
+            print(f"{Fore.RED}Failed to initialize AWS clients. Setup incomplete.{Style.RESET_ALL}")
             return
         
         if self.is_serverless:
             self.create_security_policies()
             collection_id = self.get_collection_id(self.collection_name)
             if not collection_id:
-                print(f"Collection '{self.collection_name}' not found. Attempting to create it...")
+                print(f"{Fore.YELLOW}Collection '{self.collection_name}' not found. Attempting to create it...{Style.RESET_ALL}")
                 collection_id = self.create_collection(self.collection_name)
             
             if collection_id:
                 if self.wait_for_collection_active(collection_id):
                     self.opensearch_endpoint = self.get_collection_endpoint()
                     if not self.opensearch_endpoint:
-                        print("Failed to retrieve OpenSearch endpoint. Setup incomplete.")
+                        print(f"{Fore.RED}Failed to retrieve OpenSearch endpoint. Setup incomplete.{Style.RESET_ALL}")
                         return
                     else:
                         self.config['opensearch_endpoint'] = self.opensearch_endpoint
@@ -580,48 +578,75 @@ def setup_command(self):
                         # Initialize opensearch_domain_name after setting opensearch_endpoint
                         self.opensearch_domain_name = self.get_opensearch_domain_name()
                 else:
-                    print("Collection is not active. Setup incomplete.")
+                    print(f"{Fore.RED}Collection is not active. Setup incomplete.{Style.RESET_ALL}")
                     return
         else:
             if not self.opensearch_endpoint:
-                print("OpenSearch endpoint not set. Setup incomplete.")
+                print(f"{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}")
                 return
             else:
                 # Initialize opensearch_domain_name after setting opensearch_endpoint
                 self.opensearch_domain_name = self.get_opensearch_domain_name()
         
         if self.initialize_opensearch_client():
-            print("OpenSearch client initialized successfully. Proceeding with index creation...")
+            print(f"{Fore.GREEN}OpenSearch client initialized successfully. Proceeding with index creation...{Style.RESET_ALL}")
             embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
             if self.verify_and_create_index(embedding_dimension, space_type, ef_construction):
-                print("Setup completed successfully.")
+                print(f"{Fore.GREEN}KNN index setup completed successfully.{Style.RESET_ALL}")
                 self.config['embedding_dimension'] = str(embedding_dimension)
                 self.config['space_type'] = space_type
                 self.config['ef_construction'] = str(ef_construction)
                 self.save_config(self.config)
+                config_file_path = os.path.abspath(self.CONFIG_FILE)
+                print(f"{Fore.GREEN}Configuration saved successfully at {config_file_path}{Style.RESET_ALL}")
+                
+                # Ask the user if they want to register a model
+                self.prompt_model_registration()
+            else:
+                print(f"{Fore.RED}Index verification failed. Please check your index name and permissions.{Style.RESET_ALL}")
+        else:
+            print(f"{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}")
+
+    def prompt_model_registration(self):
+        """
+        Prompt the user to register a model or input an existing model ID.
+        """
+        print("\nWould you like to register an embedding model now?")
+        print("1. Yes, register a new model")
+        print("2. No, I already have a model ID")
+        print("3. Skip this step")
+        choice = input("Enter your choice (1-2): ").strip()
+
+        if choice == '1':
+            self.register_model_interactive()
+        elif choice == '2':
+            model_id = input("Please enter your existing embedding model ID: ").strip()
+            if model_id:
+                self.config['embedding_model_id'] = model_id
+                self.save_config(self.config)
+                print(f"{Fore.GREEN}Model ID '{model_id}' saved successfully in configuration.{Style.RESET_ALL}")
             else:
-                print("Index verification failed. Please check your index name and permissions.")
+                print(f"{Fore.RED}No model ID provided. Skipping model registration.{Style.RESET_ALL}")
         else:
-            print("Failed to initialize OpenSearch client. Setup incomplete.")
+            print("Skipping model registration.")
 
-    def register_model_command(self):
+    def register_model_interactive(self):
         """
-        Command method to register a new embedding model.
-        Prompts the user to select a model and gathers necessary inputs.
+        Interactive method to register a new embedding model during setup.
         """
         # Load existing config
         self.config = self.load_config()
 
         # Initialize clients
         if not self.initialize_clients():
-            print("Failed to initialize AWS clients. Cannot proceed.")
+            print(f"{Fore.RED}Failed to initialize AWS clients. Cannot proceed.{Style.RESET_ALL}")
             return
 
         # Ensure opensearch_endpoint is set
         if not self.opensearch_endpoint:
             self.opensearch_endpoint = self.config.get('opensearch_endpoint')
             if not self.opensearch_endpoint:
-                print("OpenSearch endpoint not set. Please run 'setup' command first.")
+                print(f"{Fore.RED}OpenSearch endpoint not set. Please run 'setup' command first.{Style.RESET_ALL}")
                 return
 
         # Initialize opensearch_domain_name
@@ -643,7 +668,6 @@ def register_model_command(self):
             aws_user_name=aws_user_name,
             aws_role_name=None  # Set to None or provide if applicable
         )
-        
 
         # Prompt user to select a model
         print("Please select an embedding model to register:")
@@ -663,7 +687,7 @@ def register_model_command(self):
         elif model_choice == '4':
             self.register_openai_model(helper)
         else:
-            print("Invalid choice. Exiting.")
+            print(f"{Fore.RED}Invalid choice. Exiting model registration.{Style.RESET_ALL}")
             return
         
     def register_bedrock_model(self, helper):
@@ -714,6 +738,7 @@ def register_bedrock_model(self, helper):
         }
 
         # Create connector
+        print("Creating connector...")
         connector_id = helper.create_connector_with_role(
             connector_role_inline_policy,
             connector_role_name,
@@ -723,23 +748,24 @@ def register_bedrock_model(self, helper):
         )
 
         if not connector_id:
-            print("Failed to create connector. Aborting.")
+            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
             return
 
         # Register model
-# Register model
+        print("Registering model...")
         model_name = 'Bedrock embedding model'
         description = 'Bedrock embedding model for semantic search'
         model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
 
         if not model_id:
-            print("Failed to create model. Aborting.")
+            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
             return
 
         # Save model_id to config
         self.config['embedding_model_id'] = model_id
         self.save_config(self.config)
-        print(f"Model registered successfully. Model ID: {model_id}")
+        print(f"{Fore.GREEN}Model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
+
 
     def register_sagemaker_model(self, helper):
         """
@@ -799,7 +825,7 @@ def register_sagemaker_model(self, helper):
         )
 
         if not connector_id:
-            print("Failed to create connector. Aborting.")
+            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
             return
 
         # Register model
@@ -808,13 +834,14 @@ def register_sagemaker_model(self, helper):
         model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
 
         if not model_id:
-            print("Failed to create model. Aborting.")
+            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
             return
 
         # Save model_id to config
         self.config['embedding_model_id'] = model_id
         self.save_config(self.config)
-        print(f"Model registered successfully. Model ID: {model_id}")
+        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")
+
 
     def register_cohere_model(self, helper):
         """
@@ -867,7 +894,7 @@ def register_cohere_model(self, helper):
         )
 
         if not connector_id:
-            print("Failed to create connector. Aborting.")
+            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
             return
 
         # Register model
@@ -876,13 +903,14 @@ def register_cohere_model(self, helper):
         model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
 
         if not model_id:
-            print("Failed to create model. Aborting.")
+            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
             return
 
         # Save model_id to config
         self.config['embedding_model_id'] = model_id
         self.save_config(self.config)
-        print(f"Model registered successfully. Model ID: {model_id}")
+        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")
+
 
     def register_openai_model(self, helper):
         """
@@ -932,7 +960,7 @@ def register_openai_model(self, helper):
         )
 
         if not connector_id:
-            print("Failed to create connector. Aborting.")
+            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
             return
 
         # Register model
@@ -941,10 +969,10 @@ def register_openai_model(self, helper):
         model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
 
         if not model_id:
-            print("Failed to create model. Aborting.")
+            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
             return
 
         # Save model_id to config
         self.config['embedding_model_id'] = model_id
         self.save_config(self.config)
-        print(f"Model registered successfully. Model ID: {model_id}")
\ No newline at end of file
+        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")

From ad1ea973974245c21ac793ec9e57d6706a66381f Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Sun, 24 Nov 2024 20:06:23 -0800
Subject: [PATCH 09/42] Created Ingest Pipline for chunking.- Merge custom
 setup.py with the pre-existing one, allowing users to run a single setup
 process - Update requirements.txt to support RAG dependencies

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/ingest.py     | 39 ++++++++++++++++++-
 requirements.txt                              | 17 ++++++--
 setup.py                                      | 39 ++++++++++++++-----
 3 files changed, 81 insertions(+), 14 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
index c1372505..7b766939 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -36,6 +36,7 @@
 import botocore
 import time
 import random
+from opensearchpy import exceptions as opensearch_exceptions 
 
 
 from opensearch_connector import OpenSearchConnector
@@ -166,6 +167,38 @@ def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2)
                 time.sleep(delay)
                 delay *= backoff_factor
         return None
+    def create_ingest_pipeline(self):
+        pipeline_id = 'text-chunking-ingest-pipeline'
+        # Check if pipeline exists
+        try:
+            response = self.opensearch.opensearch_client.ingest.get_pipeline(id=pipeline_id)
+            print(f"Ingest pipeline '{pipeline_id}' already exists.")
+        except opensearch_exceptions.NotFoundError:
+            # Pipeline does not exist, create it
+            pipeline_body = {
+                "description": "A text chunking ingest pipeline",
+                "processors": [
+                    {
+                        "text_chunking": {
+                            "algorithm": {
+                                "fixed_token_length": {
+                                    "token_limit": 384,
+                                    "overlap_rate": 0.2,
+                                    "tokenizer": "standard"
+                                }
+                            },
+                            "field_map": {
+                                "nominee_text": "passage_chunk"
+                            }
+                        }
+                    }
+                ]
+            }
+            self.opensearch.opensearch_client.ingest.put_pipeline(id=pipeline_id, body=pipeline_body)
+            print(f"Ingest pipeline '{pipeline_id}' created successfully.")
+        except Exception as e:
+            print(f"Error checking or creating ingest pipeline: {e}")
+
 
     def process_and_ingest_data(self, file_paths: List[str]):
         # Process and ingest data from multiple files
@@ -175,6 +208,9 @@ def process_and_ingest_data(self, file_paths: List[str]):
             print("Failed to initialize clients. Aborting ingestion.")
             return
 
+        # Create the ingest pipeline
+        self.create_ingest_pipeline()
+
         all_documents = []
         for file_path in file_paths:
             print(f"Processing file: {file_path}")
@@ -220,7 +256,8 @@ def process_and_ingest_data(self, file_paths: List[str]):
                     "_source": {
                         "nominee_text": doc['text'],
                         "nominee_vector": doc['embedding']  # This is now a list of floats
-                    }
+                    },
+                    "_pipeline": 'text-chunking-ingest-pipeline'  # Specify the ingest pipeline here
                 }
                 actions.append(action)
         
diff --git a/requirements.txt b/requirements.txt
index cddfe801..3a455e4e 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,7 +1,5 @@
-#
 # Basic requirements
-#
-pandas>=1.5.2,<2
+pandas>=1.5.2,<3
 matplotlib>=3.6.2,<4
 numpy>=1.24.0,<2
 opensearch-py>=2.2.0
@@ -9,6 +7,17 @@ torch>=2.0.1,<2.1.0
 onnx>=1.15.0
 accelerate>=0.27
 sentence_transformers>=2.5.0,<2.6
-tqdm>4.66.0,<5
+tqdm>=4.66.0,<5
 transformers>=4.36.0,<5
 deprecated>=1.2.14,<2
+
+# Additional requirements for the RAG pipeline
+boto3>=1.26.0
+botocore>=1.29.0
+requests>=2.28.0
+requests-aws4auth>=1.1.0
+colorama>=0.4.6
+PyPDF2>=3.0.1
+rich>=13.5.2
+tiktoken>=0.5.0
+# termios is a standard library module; no need to include it in requirements
\ No newline at end of file
diff --git a/setup.py b/setup.py
index 9146b250..b1ecb39b 100644
--- a/setup.py
+++ b/setup.py
@@ -25,11 +25,10 @@
 
 # flake8: noqa
 
+from setuptools import setup, find_packages, find_namespace_packages
 from codecs import open
 from os import path
 
-from setuptools import find_packages, setup
-
 here = path.abspath(path.dirname(__file__))
 about = {}
 with open(path.join(here, "opensearch_py_ml", "_version.py"), "r", "utf-8") as f:
@@ -71,27 +70,49 @@
     long_description_content_type="text/markdown",
     url=about["__url__"],
     author=about["__author__"],
-    author_email=about["__author_email__"],
+    author_email=about["__author_email"],
     maintainer=about["__maintainer__"],
-    maintainer_email=about["__maintainer_email__"],
+    maintainer_email=about["__maintainer_email"],
     license="Apache-2.0",
     classifiers=CLASSIFIERS,
     keywords="Opensearch opensearch_py_ml pandas python",
-    packages=find_packages(include=["opensearch_py_ml", "opensearch_py_ml.*"]),
+    packages=find_namespace_packages(include=["opensearch_py_ml", "opensearch_py_ml.*"]),
     project_urls={
         "Source Code": "https://github.com/opensearch-project/opensearch-py-ml",
         "Issue Tracker": "https://github.com/opensearch-project/opensearch-py-ml/issues",
     },
     install_requires=[
-        "opensearch-py>=2",
-        "pandas>=1.5,<3",
-        "matplotlib>=3.6.0,<4",
+        "opensearch-py>=2.2.0",
+        "pandas>=1.5.2,<3",
+        "matplotlib>=3.6.2,<4",
         "numpy>=1.24.0,<2",
+        "torch>=2.0.1,<2.1.0",
+        "onnx>=1.15.0",
+        "accelerate>=0.27",
+        "sentence_transformers>=2.5.0,<2.6",
+        "tqdm>=4.66.0,<5",
+        "transformers>=4.36.0,<5",
         "deprecated>=1.2.14,<2",
+        # Additional dependencies for the RAG pipeline
+        "boto3>=1.26.0",
+        "botocore>=1.29.0",
+        "requests>=2.28.0",
+        "requests-aws4auth>=1.1.0",
+        "colorama>=0.4.6",
+        "PyPDF2>=3.0.1",
+        "rich>=13.5.2",
+        "tiktoken>=0.5.0",
+        "termios>=1.0",
     ],
     python_requires=">=3.8",
     package_data={"opensearch_py_ml": ["py.typed"]},
     include_package_data=True,
     zip_safe=False,
     extras_require=extras,
-)
+    # Entry points for console scripts
+    entry_points={
+        'console_scripts': [
+            'rag=opensearch_py_ml.ml_commons.rag_pipeline.rag:main',
+        ],
+    },
+)
\ No newline at end of file

From da0ce7ce3fa667811dd0ab3e5f7dd1f59aa1317f Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Thu, 28 Nov 2024 22:49:30 -0800
Subject: [PATCH 10/42] Removed hard coded LLM model, allowed for Opensoure
 integration, users can now specify their model payload through JSON object

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../rag_pipeline/rag/AIConnectorHelper.py     |  546 +++------
 .../rag_pipeline/rag/IAMRoleHelper.py         |  190 +++
 .../rag_pipeline/rag/SecretsHelper.py         |   81 ++
 .../ml_commons/rag_pipeline/rag/ingest.py     |    8 +-
 .../rag_pipeline/rag/model_register.py        | 1058 +++++++++++++++++
 .../rag_pipeline/rag/opensearch_connector.py  |   46 +-
 .../ml_commons/rag_pipeline/rag/query.py      |  273 ++---
 .../ml_commons/rag_pipeline/rag/rag.py        |    2 +-
 .../ml_commons/rag_pipeline/rag/rag_setup.py  |  565 +++------
 9 files changed, 1778 insertions(+), 991 deletions(-)
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
index efe62896..1218a589 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
@@ -5,7 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-
 #  Licensed to Elasticsearch B.V. under one or more contributor
 #  license agreements. See the NOTICE file distributed with
 #  this work for additional information regarding copyright
@@ -23,9 +22,7 @@
 #  specific language governing permissions and limitations
 #  under the License.
 
-
 import boto3
-from botocore.exceptions import BotoCoreError
 import json
 import requests
 from requests.auth import HTTPBasicAuth
@@ -33,7 +30,9 @@
 import time
 from opensearchpy import OpenSearch, RequestsHttpConnection
 
-# This Python code is compatible with AWS OpenSearch versions 2.9 and higher.
+from IAMRoleHelper import IAMRoleHelper
+from SecretsHelper import SecretHelper
+
 class AIConnectorHelper:
     def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
                  opensearch_domain_password, aws_user_name, aws_role_name):
@@ -70,6 +69,20 @@ def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
             verify_certs=True,
             connection_class=RequestsHttpConnection
         )
+
+        # Initialize IAMRoleHelper and SecretHelper
+        self.iam_helper = IAMRoleHelper(
+            region=self.region,
+            opensearch_domain_url=self.opensearch_domain_url,
+            opensearch_domain_username=self.opensearch_domain_username,
+            opensearch_domain_password=self.opensearch_domain_password,
+            aws_user_name=self.aws_user_name,
+            aws_role_name=self.aws_role_name,
+            opensearch_domain_arn=self.opensearch_domain_arn
+        )
+
+        self.secret_helper = SecretHelper(self.region)
+
     @staticmethod
     def get_opensearch_domain_info(region, domain_name):
         """
@@ -85,217 +98,16 @@ def get_opensearch_domain_info(region, domain_name):
         except Exception as e:
             print(f"Error retrieving OpenSearch domain info: {e}")
             return None, None
-        
-    def get_user_arn(self, username):
-        if not username:
-            return None
-        # Create a boto3 client for IAM
-        iam_client = boto3.client('iam')
-
-        try:
-            # Get information about the IAM user
-            response = iam_client.get_user(UserName=username)
-            user_arn = response['User']['Arn']
-            return user_arn
-        except iam_client.exceptions.NoSuchEntityException:
-            print(f"IAM user '{username}' not found.")
-            return None
-
-    def secret_exists(self, secret_name):
-        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
-        try:
-            # Try to get the secret
-            secretsmanager.get_secret_value(SecretId=secret_name)
-            # If no exception was raised by get_secret_value, the secret exists
-            return True
-        except secretsmanager.exceptions.ResourceNotFoundException:
-            # If a ResourceNotFoundException was raised, the secret does not exist
-            return False
-
-    def get_secret_arn(self, secret_name):
-        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
-        try:
-            response = secretsmanager.describe_secret(SecretId=secret_name)
-            # Return ARN of the secret 
-            return response['ARN']
-        except secretsmanager.exceptions.ResourceNotFoundException:
-            print(f"The requested secret {secret_name} was not found")
-            return None
-        except Exception as e:
-            print(f"An error occurred: {e}")
-            return None
-        
-    def get_secret(self, secret_name):
-        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
-        try:
-            response = secretsmanager.get_secret_value(SecretId=secret_name)
-        except secretsmanager.exceptions.NoSuchEntityException:
-            print("The requested secret was not found")
-            return None
-        except Exception as e:
-            print(f"An error occurred: {e}")
-            return None
-        else:
-            return response.get('SecretString')
-
-    def create_secret(self, secret_name, secret_value):
-        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
-
-        try:
-            response = secretsmanager.create_secret(
-                Name=secret_name,
-                SecretString=json.dumps(secret_value),
-            )
-            print(f'Secret {secret_name} created successfully.')
-            return response['ARN']  # Return the ARN of the created secret
-        except BotoCoreError as e:
-            print(f'Error creating secret: {e}')
-            return None
-
-
-    def role_exists(self, role_name):
-        iam_client = boto3.client('iam')
-
-        try:
-            iam_client.get_role(RoleName=role_name)
-            return True
-        except iam_client.exceptions.NoSuchEntityException:
-            return False
-
-    def delete_role(self, role_name):
-        iam_client = boto3.client('iam')
-
-        try:
-            # Detach managed policies
-            policies = iam_client.list_attached_role_policies(RoleName=role_name)['AttachedPolicies']
-            for policy in policies:
-                iam_client.detach_role_policy(RoleName=role_name, PolicyArn=policy['PolicyArn'])
-            print(f'All managed policies detached from role {role_name}.')
-
-            # Delete inline policies
-            inline_policies = iam_client.list_role_policies(RoleName=role_name)['PolicyNames']
-            for policy_name in inline_policies:
-                iam_client.delete_role_policy(RoleName=role_name, PolicyName=policy_name)
-            print(f'All inline policies deleted from role {role_name}.')
-
-            # Now, delete the role
-            iam_client.delete_role(RoleName=role_name)
-            print(f'Role {role_name} deleted.')
-
-        except iam_client.exceptions.NoSuchEntityException:
-            print(f'Role {role_name} does not exist.')
-
-
-    def create_iam_role(self, role_name, trust_policy_json, inline_policy_json):
-        iam_client = boto3.client('iam')
-
-        try:
-            # Create the role with the trust policy
-            create_role_response = iam_client.create_role(
-                RoleName=role_name,
-                AssumeRolePolicyDocument=json.dumps(trust_policy_json),
-                Description='Role with custom trust and inline policies',
-            )
-
-            # Get the ARN of the newly created role
-            role_arn = create_role_response['Role']['Arn']
-
-            # Attach the inline policy to the role
-            iam_client.put_role_policy(
-                RoleName=role_name,
-                PolicyName='InlinePolicy',  # you can replace this with your preferred policy name
-                PolicyDocument=json.dumps(inline_policy_json)
-            )
-
-            print(f'Created role: {role_name}')
-            return role_arn
-
-        except Exception as e:
-            print(f"Error creating the role: {e}")
-            return None
-
-    def get_role_arn(self, role_name):
-        if not role_name:
-            return None
-        iam_client = boto3.client('iam')
-        try:
-            response = iam_client.get_role(RoleName=role_name)
-            # Return ARN of the role
-            return response['Role']['Arn']
-        except iam_client.exceptions.NoSuchEntityException:
-            print(f"The requested role {role_name} does not exist")
-            return None
-        except Exception as e:
-            print(f"An error occurred: {e}")
-            return None
-    
-    
-    def get_role_details(self, role_name):
-        iam = boto3.client('iam')
-
-        try:
-            response = iam.get_role(RoleName=role_name)
-            role = response['Role']
-
-            print(f"Role Name: {role['RoleName']}")
-            print(f"Role ID: {role['RoleId']}")
-            print(f"ARN: {role['Arn']}")
-            print(f"Creation Date: {role['CreateDate']}")
-            print("Assume Role Policy Document:")
-            print(json.dumps(role['AssumeRolePolicyDocument'], indent=4, sort_keys=True))
-
-            list_role_policies_response = iam.list_role_policies(RoleName=role_name)
 
-            for policy_name in list_role_policies_response['PolicyNames']:
-                get_role_policy_response = iam.get_role_policy(RoleName=role_name, PolicyName=policy_name)
-                print(f"Role Policy Name: {get_role_policy_response['PolicyName']}")
-                print("Role Policy Document:")
-                print(json.dumps(get_role_policy_response['PolicyDocument'], indent=4, sort_keys=True))
-
-        except iam.exceptions.NoSuchEntityException:
-            print(f'Role {role_name} does not exist.')
-
-    def map_iam_role_to_backend_role(self, iam_role_arn):
-        os_security_role = 'ml_full_access'  # Changed from 'all_access' to 'ml_full_access'
-        url = f'{self.opensearch_domain_url}/_plugins/_security/api/rolesmapping/{os_security_role}'
-
-        payload = {
-            "backend_roles": [iam_role_arn]
-        }
-        headers = {'Content-Type': 'application/json'}
-
-        response = requests.put(url, auth=(self.opensearch_domain_username, self.opensearch_domain_password),
-                                json=payload, headers=headers, verify=True)
-
-        if response.status_code == 200:
-            print(f"Successfully mapped IAM role to OpenSearch role '{os_security_role}'.")
-        else:
-            print(f"Failed to map IAM role to OpenSearch role '{os_security_role}'. Status code: {response.status_code}")
-            print(f"Response: {response.text}")
-
-    def assume_role(self, create_connector_role_arn, role_session_name="your_session_name"):
-        sts_client = boto3.client('sts')
-
-        #role_arn = f"arn:aws:iam::{aws_account_id}:role/{role_name}"
-        assumed_role_object = sts_client.assume_role(
-            RoleArn=create_connector_role_arn,
-            RoleSessionName=role_session_name,
-        )
-
-        # Obtain the temporary credentials from the assumed role 
-        temp_credentials = assumed_role_object["Credentials"]
-
-        return temp_credentials
-    
     def get_ml_auth(self, create_connector_role_name):
         """
         Obtain AWS4Auth credentials for ML API calls using the specified IAM role.
         """
-        create_connector_role_arn = self.get_role_arn(create_connector_role_name)
+        create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
         if not create_connector_role_arn:
             raise Exception(f"IAM role '{create_connector_role_name}' not found.")
 
-        temp_credentials = self.assume_role(create_connector_role_arn)
+        temp_credentials = self.iam_helper.assume_role(create_connector_role_arn)
         awsauth = AWS4Auth(
             temp_credentials["AccessKeyId"],
             temp_credentials["SecretAccessKey"],
@@ -306,8 +118,8 @@ def get_ml_auth(self, create_connector_role_name):
         return awsauth
 
     def create_connector(self, create_connector_role_name, payload):
-        create_connector_role_arn = self.get_role_arn(create_connector_role_name)
-        temp_credentials = self.assume_role(create_connector_role_arn)
+        create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
+        temp_credentials = self.iam_helper.assume_role(create_connector_role_arn)
         awsauth = AWS4Auth(
             temp_credentials["AccessKeyId"],
             temp_credentials["SecretAccessKey"],
@@ -325,8 +137,8 @@ def create_connector(self, create_connector_role_name, payload):
         print(r.text)
         connector_id = json.loads(r.text)['connector_id']
         return connector_id
-    
-    def search_model_group(self, model_group_name):
+
+    def search_model_group(self, model_group_name, create_connector_role_name):
         payload = {
             "query": {
                 "term": {
@@ -337,68 +149,52 @@ def search_model_group(self, model_group_name):
             }
         }
         headers = {"Content-Type": "application/json"}
-        
+
         # Obtain temporary credentials
-        create_connector_role_arn = self.get_role_arn('my_test_create_bedrock_connector_role')  # Replace with actual role name
-        temp_credentials = self.assume_role(create_connector_role_arn)
-        awsauth = AWS4Auth(
-            temp_credentials["AccessKeyId"],
-            temp_credentials["SecretAccessKey"],
-            self.region,
-            'es',
-            session_token=temp_credentials["SessionToken"],
-        )
-        
+        awsauth = self.get_ml_auth(create_connector_role_name)
+
         r = requests.post(
             f'{self.opensearch_domain_url}/_plugins/_ml/model_groups/_search',
             auth=awsauth,
             json=payload,
             headers=headers
         )
-        
+
         response = json.loads(r.text)
         return response
-    
+
     def create_model_group(self, model_group_name, description, create_connector_role_name):
-        search_model_group_response = self.search_model_group(model_group_name)
+        search_model_group_response = self.search_model_group(model_group_name, create_connector_role_name)
         print("Search Model Group Response:", search_model_group_response)
-        
+
         if 'hits' in search_model_group_response and search_model_group_response['hits']['total']['value'] > 0:
             return search_model_group_response['hits']['hits'][0]['_id']
-        
+
         payload = {
             "name": model_group_name,
             "description": description
         }
         headers = {"Content-Type": "application/json"}
-        
+
         # Obtain temporary credentials using the provided role name
-        create_connector_role_arn = self.get_role_arn(create_connector_role_name)
-        temp_credentials = self.assume_role(create_connector_role_arn)
-        awsauth = AWS4Auth(
-            temp_credentials["AccessKeyId"],
-            temp_credentials["SecretAccessKey"],
-            self.region,
-            'es',
-            session_token=temp_credentials["SessionToken"],
-        )
-        
+        awsauth = self.get_ml_auth(create_connector_role_name)
+
         r = requests.post(
             f'{self.opensearch_domain_url}/_plugins/_ml/model_groups/_register',
             auth=awsauth,
             json=payload,
             headers=headers
         )
-        
+
         print(r.text)
         response = json.loads(r.text)
-        
+
         if 'model_group_id' in response:
             return response['model_group_id']
         else:
             # Handle error gracefully
             raise KeyError("The response does not contain 'model_group_id'. Response content: {}".format(response))
-    
+
     def get_task(self, task_id, create_connector_role_name):
         try:
             awsauth = self.get_ml_auth(create_connector_role_name)
@@ -411,7 +207,7 @@ def get_task(self, task_id, create_connector_role_name):
         except Exception as e:
             print(f"Error in get_task: {e}")
             raise
-    
+
     def create_model(self, model_name, description, connector_id, create_connector_role_name, deploy=True):
         try:
             model_group_id = self.create_model_group(model_name, description, create_connector_role_name)
@@ -456,13 +252,17 @@ def create_model(self, model_name, description, connector_id, create_connector_r
         except Exception as e:
             print(f"Error in create_model: {e}")
             raise
-    
+
     def deploy_model(self, model_id):
         headers = {"Content-Type": "application/json"}
-        return requests.post(f'{self.opensearch_domain_url}/_plugins/_ml/models/{model_id}/_deploy',
-                             auth=HTTPBasicAuth(self.opensearch_domain_username, self.opensearch_domain_password),
-                             headers=headers)
-    
+        response = requests.post(
+            f'{self.opensearch_domain_url}/_plugins/_ml/models/{model_id}/_deploy',
+            auth=HTTPBasicAuth(self.opensearch_domain_username, self.opensearch_domain_password),
+            headers=headers
+        )
+        print(f"Deploy Model Response: {response.text}")
+        return response
+
     def predict(self, model_id, payload):
         headers = {"Content-Type": "application/json"}
         r = requests.post(
@@ -471,30 +271,32 @@ def predict(self, model_id, payload):
             json=payload,
             headers=headers
         )
-    
-    def create_connector_with_secret(self, secret_name, secret_value, connector_role_name, create_connector_role_name, create_connector_input, sleep_time_in_seconds=10):
+        print("Predict Response:", r.text)
+        return r
+
+    def create_connector_with_secret(self, secret_name, secret_value, connector_role_name, create_connector_role_name,
+                                     create_connector_input, sleep_time_in_seconds=10):
         # Step1: Create Secret
         print('Step1: Create Secret')
-        if not self.secret_exists(secret_name):
-            secret_arn = self.create_secret(secret_name, secret_value)
+        if not self.secret_helper.secret_exists(secret_name):
+            secret_arn = self.secret_helper.create_secret(secret_name, secret_value)
         else:
-            print('secret exists, skip creating')
-            secret_arn = self.get_secret_arn(secret_name)
-        #print(secret_arn)
+            print('Secret exists, skipping creation.')
+            secret_arn = self.secret_helper.get_secret_arn(secret_name)
         print('----------')
-        
-        # Step2: Create IAM role configued in connector
+
+        # Step2: Create IAM role configured in connector
         trust_policy = {
-          "Version": "2012-10-17",
-          "Statement": [
-            {
-              "Effect": "Allow",
-              "Principal": {
-                "Service": "es.amazonaws.com"
-              },
-              "Action": "sts:AssumeRole"
-            }
-          ]
+            "Version": "2012-10-17",
+            "Statement": [
+                {
+                    "Effect": "Allow",
+                    "Principal": {
+                        "Service": "es.amazonaws.com"
+                    },
+                    "Action": "sts:AssumeRole"
+                }
+            ]
         }
 
         inline_policy = {
@@ -511,19 +313,18 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
             ]
         }
 
-        print('Step2: Create IAM role configued in connector')
-        if not self.role_exists(connector_role_name):
-            connector_role_arn = self.create_iam_role(connector_role_name, trust_policy, inline_policy)
+        print('Step2: Create IAM role configured in connector')
+        if not self.iam_helper.role_exists(connector_role_name):
+            connector_role_arn = self.iam_helper.create_iam_role(connector_role_name, trust_policy, inline_policy)
         else:
-            print('role exists, skip creating')
-            connector_role_arn = self.get_role_arn(connector_role_name)
-        #print(connector_role_arn)
+            print('Role exists, skipping creation.')
+            connector_role_arn = self.iam_helper.get_role_arn(connector_role_name)
         print('----------')
-        
+
         # Step 3: Configure IAM role in OpenSearch
         # 3.1 Create IAM role for Signing create connector request
-        user_arn = self.get_user_arn(self.aws_user_name)
-        role_arn = self.get_role_arn(self.aws_role_name)
+        user_arn = self.iam_helper.get_user_arn(self.aws_user_name)
+        role_arn = self.iam_helper.get_role_arn(self.aws_role_name)
         statements = []
         if user_arn:
             statements.append({
@@ -564,19 +365,19 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
 
         print('Step 3: Configure IAM role in OpenSearch')
         print('Step 3.1: Create IAM role for Signing create connector request')
-        if not self.role_exists(create_connector_role_name):
-            create_connector_role_arn = self.create_iam_role(create_connector_role_name, trust_policy, inline_policy)
+        if not self.iam_helper.role_exists(create_connector_role_name):
+            create_connector_role_arn = self.iam_helper.create_iam_role(create_connector_role_name, trust_policy,
+                                                                       inline_policy)
         else:
-            print('role exists, skip creating')
-            create_connector_role_arn = self.get_role_arn(create_connector_role_name)
-        #print(create_connector_role_arn)
+            print('Role exists, skipping creation.')
+            create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
         print('----------')
-        
+
         # 3.2 Map backend role
         print(f'Step 3.2: Map IAM role {create_connector_role_name} to OpenSearch permission role')
-        self.map_iam_role_to_backend_role(create_connector_role_arn)
+        self.iam_helper.map_iam_role_to_backend_role(create_connector_role_arn)
         print('----------')
-        
+
         # 4. Create connector
         print('Step 4: Create connector in OpenSearch')
         # When you create an IAM role, it can take some time for the changes to propagate across AWS systems.
@@ -584,7 +385,7 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
         # So we wait for some time before creating connector.
         # If you see such error: ClientError: An error occurred (AccessDenied) when calling the AssumeRole operation
         # you can rerun this function.
-        
+
         # Wait for some time
         time.sleep(sleep_time_in_seconds)
         payload = create_connector_input
@@ -593,106 +394,105 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
             "roleArn": connector_role_arn
         }
         connector_id = self.create_connector(create_connector_role_name, payload)
-        #print(connector_id)
         print('----------')
         return connector_id
-    
-    def create_connector_with_role(self, connector_role_inline_policy, connector_role_name, create_connector_role_name, create_connector_input, sleep_time_in_seconds=10):
-            # Step1: Create IAM role configued in connector
-            trust_policy = {
+
+    def create_connector_with_role(self, connector_role_inline_policy, connector_role_name, create_connector_role_name,
+                                   create_connector_input, sleep_time_in_seconds=10):
+        # Step1: Create IAM role configured in connector
+        trust_policy = {
             "Version": "2012-10-17",
             "Statement": [
                 {
+                    "Effect": "Allow",
+                    "Principal": {
+                        "Service": "es.amazonaws.com"
+                    },
+                    "Action": "sts:AssumeRole"
+                }
+            ]
+        }
+
+        print('Step1: Create IAM role configured in connector')
+        if not self.iam_helper.role_exists(connector_role_name):
+            connector_role_arn = self.iam_helper.create_iam_role(connector_role_name, trust_policy,
+                                                                 connector_role_inline_policy)
+        else:
+            print('Role exists, skipping creation.')
+            connector_role_arn = self.iam_helper.get_role_arn(connector_role_name)
+        print('----------')
+
+        # Step 2: Configure IAM role in OpenSearch
+        # 2.1 Create IAM role for Signing create connector request
+        user_arn = self.iam_helper.get_user_arn(self.aws_user_name)
+        role_arn = self.iam_helper.get_role_arn(self.aws_role_name)
+        statements = []
+        if user_arn:
+            statements.append({
                 "Effect": "Allow",
                 "Principal": {
-                    "Service": "es.amazonaws.com"
+                    "AWS": user_arn
                 },
                 "Action": "sts:AssumeRole"
-                }
-            ]
-            }
+            })
+        if role_arn:
+            statements.append({
+                "Effect": "Allow",
+                "Principal": {
+                    "AWS": role_arn
+                },
+                "Action": "sts:AssumeRole"
+            })
+        trust_policy = {
+            "Version": "2012-10-17",
+            "Statement": statements
+        }
 
-            print('Step1: Create IAM role configued in connector')
-            if not self.role_exists(connector_role_name):
-                connector_role_arn = self.create_iam_role(connector_role_name, trust_policy, connector_role_inline_policy)
-            else:
-                print('role exists, skip creating')
-                connector_role_arn = self.get_role_arn(connector_role_name)
-            #print(connector_role_arn)
-            print('----------')
-
-            # Step 2: Configure IAM role in OpenSearch
-            # 2.1 Create IAM role for Signing create connector request
-            user_arn = self.get_user_arn(self.aws_user_name)
-            role_arn = self.get_role_arn(self.aws_role_name)
-            statements = []
-            if user_arn:
-                statements.append({
+        inline_policy = {
+            "Version": "2012-10-17",
+            "Statement": [
+                {
                     "Effect": "Allow",
-                    "Principal": {
-                        "AWS": user_arn
-                    },
-                    "Action": "sts:AssumeRole"
-                })
-            if role_arn:
-                statements.append({
+                    "Action": "iam:PassRole",
+                    "Resource": connector_role_arn
+                },
+                {
                     "Effect": "Allow",
-                    "Principal": {
-                        "AWS": role_arn
-                    },
-                    "Action": "sts:AssumeRole"
-                })
-            trust_policy = {
-                "Version": "2012-10-17",
-                "Statement": statements
-            }
+                    "Action": "es:ESHttpPost",
+                    "Resource": self.opensearch_domain_arn
+                }
+            ]
+        }
 
-            inline_policy = {
-                "Version": "2012-10-17",
-                "Statement": [
-                    {
-                        "Effect": "Allow",
-                        "Action": "iam:PassRole",
-                        "Resource": connector_role_arn
-                    },
-                    {
-                        "Effect": "Allow",
-                        "Action": "es:ESHttpPost",
-                        "Resource": self.opensearch_domain_arn
-                    }
-                ]
-            }
+        print('Step 2: Configure IAM role in OpenSearch')
+        print('Step 2.1: Create IAM role for Signing create connector request')
+        if not self.iam_helper.role_exists(create_connector_role_name):
+            create_connector_role_arn = self.iam_helper.create_iam_role(create_connector_role_name, trust_policy,
+                                                                       inline_policy)
+        else:
+            print('Role exists, skipping creation.')
+            create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
+        print('----------')
 
-            print('Step 2: Configure IAM role in OpenSearch')
-            print('Step 2.1: Create IAM role for Signing create connector request')
-            if not self.role_exists(create_connector_role_name):
-                create_connector_role_arn = self.create_iam_role(create_connector_role_name, trust_policy, inline_policy)
-            else:
-                print('role exists, skip creating')
-                create_connector_role_arn = self.get_role_arn(create_connector_role_name)
-            #print(create_connector_role_arn)
-            print('----------')
-
-            # 2.2 Map backend role
-            print(f'Step 2.2: Map IAM role {create_connector_role_name} to OpenSearch permission role')
-            self.map_iam_role_to_backend_role(create_connector_role_arn)
-            print('----------')
-
-            # 3. Create connector
-            print('Step 3: Create connector in OpenSearch')
-            # When you create an IAM role, it can take some time for the changes to propagate across AWS systems.
-            # During this time, some services might not immediately recognize the new role or its permissions.
-            # So we wait for some time before creating connector.
-            # If you see such error: ClientError: An error occurred (AccessDenied) when calling the AssumeRole operation
-            # you can rerun this function.
-
-            # Wait for some time
-            time.sleep(sleep_time_in_seconds)
-            payload = create_connector_input
-            payload['credential'] = {
-                "roleArn": connector_role_arn
-            }
-            connector_id = self.create_connector(create_connector_role_name, payload)
-            #print(connector_id)
-            print('----------')
-            return connector_id
\ No newline at end of file
+        # 2.2 Map backend role
+        print(f'Step 2.2: Map IAM role {create_connector_role_name} to OpenSearch permission role')
+        self.iam_helper.map_iam_role_to_backend_role(create_connector_role_arn)
+        print('----------')
+
+        # 3. Create connector
+        print('Step 3: Create connector in OpenSearch')
+        # When you create an IAM role, it can take some time for the changes to propagate across AWS systems.
+        # During this time, some services might not immediately recognize the new role or its permissions.
+        # So we wait for some time before creating connector.
+        # If you see such error: ClientError: An error occurred (AccessDenied) when calling the AssumeRole operation
+        # you can rerun this function.
+
+        # Wait for some time
+        time.sleep(sleep_time_in_seconds)
+        payload = create_connector_input
+        payload['credential'] = {
+            "roleArn": connector_role_arn
+        }
+        connector_id = self.create_connector(create_connector_role_name, payload)
+        print('----------')
+        return connector_id
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
new file mode 100644
index 00000000..9f0d85f6
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
@@ -0,0 +1,190 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+import boto3
+import json
+from botocore.exceptions import BotoCoreError
+import requests
+
+class IAMRoleHelper:
+    def __init__(self, region, opensearch_domain_url=None, opensearch_domain_username=None,
+                 opensearch_domain_password=None, aws_user_name=None, aws_role_name=None, opensearch_domain_arn=None):
+        self.region = region
+        self.opensearch_domain_url = opensearch_domain_url
+        self.opensearch_domain_username = opensearch_domain_username
+        self.opensearch_domain_password = opensearch_domain_password
+        self.aws_user_name = aws_user_name
+        self.aws_role_name = aws_role_name
+        self.opensearch_domain_arn = opensearch_domain_arn
+
+    def role_exists(self, role_name):
+        iam_client = boto3.client('iam')
+
+        try:
+            iam_client.get_role(RoleName=role_name)
+            return True
+        except iam_client.exceptions.NoSuchEntityException:
+            return False
+
+    def delete_role(self, role_name):
+        iam_client = boto3.client('iam')
+
+        try:
+            # Detach managed policies
+            policies = iam_client.list_attached_role_policies(RoleName=role_name)['AttachedPolicies']
+            for policy in policies:
+                iam_client.detach_role_policy(RoleName=role_name, PolicyArn=policy['PolicyArn'])
+            print(f'All managed policies detached from role {role_name}.')
+
+            # Delete inline policies
+            inline_policies = iam_client.list_role_policies(RoleName=role_name)['PolicyNames']
+            for policy_name in inline_policies:
+                iam_client.delete_role_policy(RoleName=role_name, PolicyName=policy_name)
+            print(f'All inline policies deleted from role {role_name}.')
+
+            # Now, delete the role
+            iam_client.delete_role(RoleName=role_name)
+            print(f'Role {role_name} deleted.')
+
+        except iam_client.exceptions.NoSuchEntityException:
+            print(f'Role {role_name} does not exist.')
+
+    def create_iam_role(self, role_name, trust_policy_json, inline_policy_json):
+        iam_client = boto3.client('iam')
+
+        try:
+            # Create the role with the trust policy
+            create_role_response = iam_client.create_role(
+                RoleName=role_name,
+                AssumeRolePolicyDocument=json.dumps(trust_policy_json),
+                Description='Role with custom trust and inline policies',
+            )
+
+            # Get the ARN of the newly created role
+            role_arn = create_role_response['Role']['Arn']
+
+            # Attach the inline policy to the role
+            iam_client.put_role_policy(
+                RoleName=role_name,
+                PolicyName='InlinePolicy',  # you can replace this with your preferred policy name
+                PolicyDocument=json.dumps(inline_policy_json)
+            )
+
+            print(f'Created role: {role_name}')
+            return role_arn
+
+        except Exception as e:
+            print(f"Error creating the role: {e}")
+            return None
+
+    def get_role_arn(self, role_name):
+        if not role_name:
+            return None
+        iam_client = boto3.client('iam')
+        try:
+            response = iam_client.get_role(RoleName=role_name)
+            # Return ARN of the role
+            return response['Role']['Arn']
+        except iam_client.exceptions.NoSuchEntityException:
+            print(f"The requested role {role_name} does not exist")
+            return None
+        except Exception as e:
+            print(f"An error occurred: {e}")
+            return None
+
+    def get_role_details(self, role_name):
+        iam = boto3.client('iam')
+
+        try:
+            response = iam.get_role(RoleName=role_name)
+            role = response['Role']
+
+            print(f"Role Name: {role['RoleName']}")
+            print(f"Role ID: {role['RoleId']}")
+            print(f"ARN: {role['Arn']}")
+            print(f"Creation Date: {role['CreateDate']}")
+            print("Assume Role Policy Document:")
+            print(json.dumps(role['AssumeRolePolicyDocument'], indent=4, sort_keys=True))
+
+            list_role_policies_response = iam.list_role_policies(RoleName=role_name)
+
+            for policy_name in list_role_policies_response['PolicyNames']:
+                get_role_policy_response = iam.get_role_policy(RoleName=role_name, PolicyName=policy_name)
+                print(f"Role Policy Name: {get_role_policy_response['PolicyName']}")
+                print("Role Policy Document:")
+                print(json.dumps(get_role_policy_response['PolicyDocument'], indent=4, sort_keys=True))
+
+        except iam.exceptions.NoSuchEntityException:
+            print(f'Role {role_name} does not exist.')
+
+    def get_user_arn(self, username):
+        if not username:
+            return None
+        # Create a boto3 client for IAM
+        iam_client = boto3.client('iam')
+
+        try:
+            # Get information about the IAM user
+            response = iam_client.get_user(UserName=username)
+            user_arn = response['User']['Arn']
+            return user_arn
+        except iam_client.exceptions.NoSuchEntityException:
+            print(f"IAM user '{username}' not found.")
+            return None
+
+    def assume_role(self, role_arn, role_session_name="your_session_name"):
+        sts_client = boto3.client('sts')
+
+        assumed_role_object = sts_client.assume_role(
+            RoleArn=role_arn,
+            RoleSessionName=role_session_name,
+        )
+
+        # Obtain the temporary credentials from the assumed role 
+        temp_credentials = assumed_role_object["Credentials"]
+
+        return temp_credentials
+
+    def map_iam_role_to_backend_role(self, iam_role_arn):
+        os_security_role = 'ml_full_access'  # Changed from 'all_access' to 'ml_full_access'
+        url = f'{self.opensearch_domain_url}/_plugins/_security/api/rolesmapping/{os_security_role}'
+
+        payload = {
+            "backend_roles": [iam_role_arn]
+        }
+        headers = {'Content-Type': 'application/json'}
+
+        response = requests.put(
+            url,
+            auth=(self.opensearch_domain_username, self.opensearch_domain_password),
+            json=payload,
+            headers=headers,
+            verify=True
+        )
+
+        if response.status_code == 200:
+            print(f"Successfully mapped IAM role to OpenSearch role '{os_security_role}'.")
+        else:
+            print(f"Failed to map IAM role to OpenSearch role '{os_security_role}'. Status code: {response.status_code}")
+            print(f"Response: {response.text}")
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py
new file mode 100644
index 00000000..03825eeb
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py
@@ -0,0 +1,81 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+import boto3
+import json
+from botocore.exceptions import BotoCoreError
+
+class SecretHelper:
+    def __init__(self, region):
+        self.region = region
+
+    def secret_exists(self, secret_name):
+        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+        try:
+            # Try to get the secret
+            secretsmanager.get_secret_value(SecretId=secret_name)
+            # If no exception was raised by get_secret_value, the secret exists
+            return True
+        except secretsmanager.exceptions.ResourceNotFoundException:
+            # If a ResourceNotFoundException was raised, the secret does not exist
+            return False
+
+    def get_secret_arn(self, secret_name):
+        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+        try:
+            response = secretsmanager.describe_secret(SecretId=secret_name)
+            # Return ARN of the secret 
+            return response['ARN']
+        except secretsmanager.exceptions.ResourceNotFoundException:
+            print(f"The requested secret {secret_name} was not found")
+            return None
+        except Exception as e:
+            print(f"An error occurred: {e}")
+            return None
+
+    def get_secret(self, secret_name):
+        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+        try:
+            response = secretsmanager.get_secret_value(SecretId=secret_name)
+        except secretsmanager.exceptions.NoSuchEntityException:
+            print("The requested secret was not found")
+            return None
+        except Exception as e:
+            print(f"An error occurred: {e}")
+            return None
+        else:
+            return response.get('SecretString')
+
+    def create_secret(self, secret_name, secret_value):
+        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+
+        try:
+            response = secretsmanager.create_secret(
+                Name=secret_name,
+                SecretString=json.dumps(secret_value),
+            )
+            print(f'Secret {secret_name} created successfully.')
+            return response['ARN']  # Return the ARN of the created secret
+        except BotoCoreError as e:
+            print(f'Error creating secret: {e}')
+            return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
index 7b766939..2be1ed06 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -201,9 +201,6 @@ def create_ingest_pipeline(self):
 
 
     def process_and_ingest_data(self, file_paths: List[str]):
-        # Process and ingest data from multiple files
-        # Generates embeddings for each document and ingests into OpenSearch
-        # Displays progress and results of the ingestion process
         if not self.initialize_clients():
             print("Failed to initialize clients. Aborting ingestion.")
             return
@@ -255,16 +252,15 @@ def process_and_ingest_data(self, file_paths: List[str]):
                     "_index": self.index_name,
                     "_source": {
                         "nominee_text": doc['text'],
-                        "nominee_vector": doc['embedding']  # This is now a list of floats
+                        "nominee_vector": doc['embedding']
                     },
-                    "_pipeline": 'text-chunking-ingest-pipeline'  # Specify the ingest pipeline here
+                    "pipeline": 'text-chunking-ingest-pipeline'  # Use "pipeline" instead of "_pipeline"
                 }
                 actions.append(action)
         
         success, failed = self.opensearch.bulk_index(actions)
         print(f"{Fore.GREEN}Successfully ingested {success} documents.{Style.RESET_ALL}")
         print(f"{Fore.RED}Failed to ingest {failed} documents.{Style.RESET_ALL}")
-
     def ingest_command(self, paths: List[str]):
         # Main ingestion command
         # Processes all valid files in the given paths and initiates ingestion
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
new file mode 100644
index 00000000..876c22d4
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
@@ -0,0 +1,1058 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+
+
+import os
+import json
+import time
+import boto3
+from urllib.parse import urlparse
+from colorama import Fore, Style, init
+from AIConnectorHelper import AIConnectorHelper  # Ensure this module is accessible
+import sys
+
+init(autoreset=True)
+
+class ModelRegister:
+    def __init__(self, config, opensearch_client, opensearch_domain_name):
+        # Initialize ModelRegister with necessary configurations
+        self.config = config
+        self.aws_region = config.get('region')
+        self.opensearch_client = opensearch_client
+        self.opensearch_domain_name = opensearch_domain_name
+        self.opensearch_username = config.get('opensearch_username')
+        self.opensearch_password = config.get('opensearch_password')
+        self.iam_principal = config.get('iam_principal')
+        self.embedding_dimension = int(config.get('embedding_dimension', 768))
+        self.service_type = config.get('service_type', 'managed')
+        self.bedrock_client = None
+        if self.service_type != 'open-source':
+            self.initialize_clients()
+
+    def initialize_clients(self):
+        # Initialize AWS clients only if necessary
+        if self.service_type in ['managed', 'serverless']:
+            try:
+                self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
+                # Add any other clients initialization if needed
+                time.sleep(7)
+                print("AWS clients initialized successfully.")
+                return True
+            except Exception as e:
+                print(f"Failed to initialize AWS clients: {e}")
+                return False
+        else:
+            # No AWS clients needed for open-source
+            return True
+
+    def prompt_model_registration(self):
+        """
+        Prompt the user to register a model or input an existing model ID.
+        """
+        print("\nTo proceed, you need to configure an embedding model.")
+        print("1. Register a new embedding model")
+        print("2. Use an existing embedding model ID")
+        choice = input("Enter your choice (1-2): ").strip()
+
+        if choice == '1':
+            self.register_model_interactive()
+        elif choice == '2':
+            model_id = input("Please enter your existing embedding model ID: ").strip()
+            if model_id:
+                self.config['embedding_model_id'] = model_id
+                self.save_config(self.config)
+                print(f"{Fore.GREEN}Model ID '{model_id}' saved successfully in configuration.{Style.RESET_ALL}")
+            else:
+                print(f"{Fore.RED}No model ID provided. Cannot proceed without an embedding model.{Style.RESET_ALL}")
+                sys.exit(1)  # Exit the setup as we cannot proceed without a model ID
+        else:
+            print(f"{Fore.RED}Invalid choice. Please run setup again and select a valid option.{Style.RESET_ALL}")
+            sys.exit(1)  # Exit the setup as we cannot proceed without a valid choice
+    def get_custom_model_details(self, default_input):
+        """
+        Prompt the user to enter custom model details or use default.
+        Returns a dictionary with the model details.
+        """
+        print("\nDo you want to use the default configuration or provide custom model settings?")
+        print("1. Use default configuration")
+        print("2. Provide custom model settings")
+        choice = input("Enter your choice (1-2): ").strip()
+
+        if choice == '1':
+            return default_input
+        elif choice == '2':
+            print("Please enter your model details as a JSON object.")
+            print("Example:")
+            print(json.dumps(default_input, indent=2))
+            json_input = input("Enter your JSON object: ").strip()
+            try:
+                custom_details = json.loads(json_input)
+                return custom_details
+            except json.JSONDecodeError as e:
+                print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
+                return None
+        else:
+            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            return None
+        
+    def save_config(self, config):
+        # Save configuration to the config file
+        import configparser
+        parser = configparser.ConfigParser()
+        parser['DEFAULT'] = config
+        with open('config.ini', 'w') as f:
+            parser.write(f)
+
+    def register_model_interactive(self):
+        """
+        Interactive method to register a new embedding model during setup.
+        """
+        # Initialize clients
+        if not self.initialize_clients():
+            print(f"{Fore.RED}Failed to initialize AWS clients. Cannot proceed.{Style.RESET_ALL}")
+            return
+
+        # Ensure opensearch_endpoint is set
+        if not self.config.get('opensearch_endpoint'):
+            print(f"{Fore.RED}OpenSearch endpoint not set. Please run 'setup' command first.{Style.RESET_ALL}")
+            return
+
+        # Extract the IAM user name from the IAM principal ARN
+        aws_user_name = self.get_iam_user_name_from_arn(self.iam_principal)
+
+        if not aws_user_name:
+            print("Could not extract IAM user name from IAM principal ARN.")
+            aws_user_name = input("Enter your AWS IAM user name: ")
+
+        # Instantiate AIConnectorHelper
+        helper = AIConnectorHelper(
+            region=self.aws_region,
+            opensearch_domain_name=self.opensearch_domain_name,
+            opensearch_domain_username=self.opensearch_username,
+            opensearch_domain_password=self.opensearch_password,
+            aws_user_name=aws_user_name,
+            aws_role_name=None  # Set to None or provide if applicable
+        )
+
+        # Prompt user to select a model
+        print("Please select an embedding model to register:")
+        print("1. Bedrock Titan Embedding Model")
+        print("2. SageMaker Embedding Model")
+        print("3. Cohere Embedding Model")
+        print("4. OpenAI Embedding Model")
+        model_choice = input("Enter your choice (1-4): ")
+
+        # Call the appropriate method based on the user's choice
+        if model_choice == '1':
+            self.register_bedrock_model(helper)
+        elif model_choice == '2':
+            self.register_sagemaker_model(helper)
+        elif model_choice == '3':
+            self.register_cohere_model(helper)
+        elif model_choice == '4':
+            self.register_openai_model(helper)
+        else:
+            print(f"{Fore.RED}Invalid choice. Exiting model registration.{Style.RESET_ALL}")
+            return
+
+    def get_iam_user_name_from_arn(self, iam_principal_arn):
+        """
+        Extract the IAM user name from the IAM principal ARN.
+        """
+        # IAM user ARN format: arn:aws:iam::123456789012:user/user-name
+        if iam_principal_arn and ':user/' in iam_principal_arn:
+            return iam_principal_arn.split(':user/')[-1]
+        else:
+            return None
+
+    def register_bedrock_model(self, helper):
+        """
+        Register a Bedrock embedding model by creating the necessary connector and model in OpenSearch.
+        """
+        # Prompt for necessary inputs
+        bedrock_region = input(f"Enter your Bedrock region [{self.aws_region}]: ") or self.aws_region
+        connector_role_name = "my_test_bedrock_connector_role"
+        create_connector_role_name = "my_test_create_bedrock_connector_role"
+
+        # Set up connector role inline policy
+        connector_role_inline_policy = {
+            "Version": "2012-10-17",
+            "Statement": [
+                {
+                    "Action": ["bedrock:InvokeModel"],
+                    "Effect": "Allow",
+                    "Resource": "arn:aws:bedrock:*::foundation-model/amazon.titan-embed-text-v1"
+                }
+            ]
+        }
+
+        # Default connector input
+        default_connector_input = {
+            "name": "Amazon Bedrock Connector: titan embedding v1",
+            "description": "The connector to Bedrock Titan embedding model",
+            "version": 1,
+            "protocol": "aws_sigv4",
+            "parameters": {
+                "region": bedrock_region,
+                "service_name": "bedrock"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "url": f"https://bedrock-runtime.{bedrock_region}.amazonaws.com/model/amazon.titan-embed-text-v1/invoke",
+                    "headers": {
+                        "content-type": "application/json",
+                        "x-amz-content-sha256": "required"
+                    },
+                    "request_body": "{ \"inputText\": \"${parameters.inputText}\" }",
+                    "pre_process_function": "\n    StringBuilder builder = new StringBuilder();\n    builder.append(\"\\\"\");\n    String first = params.text_docs[0];\n    builder.append(first);\n    builder.append(\"\\\"\");\n    def parameters = \"{\" +\"\\\"inputText\\\":\" + builder + \"}\";\n    return  \"{\" +\"\\\"parameters\\\":\" + parameters + \"}\";",
+                    "post_process_function": "\n      def name = \"sentence_embedding\";\n      def dataType = \"FLOAT32\";\n      if (params.embedding == null || params.embedding.length == 0) {\n        return params.message;\n      }\n      def shape = [params.embedding.length];\n      def json = \"{\" +\n                 \"\\\"name\\\":\\\"\" + name + \"\\\",\" +\n                 \"\\\"data_type\\\":\\\"\" + dataType + \"\\\",\" +\n                 \"\\\"shape\\\":\" + shape + \",\" +\n                 \"\\\"data\\\":\" + params.embedding +\n                 \"}\";\n      return json;\n    "
+                }
+            ]
+        }
+
+        # Get model details from user
+        create_connector_input = self.get_custom_model_details(default_connector_input)
+        if not create_connector_input:
+            return  # Abort if no valid input
+
+        # Create connector
+        print("Creating connector...")
+        connector_id = helper.create_connector_with_role(
+            connector_role_inline_policy,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Register model
+        print("Registering model...")
+        model_name = create_connector_input.get('name', 'Bedrock embedding model')
+        description = create_connector_input.get('description', 'Bedrock embedding model for semantic search')
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Save model_id to config
+        self.config['embedding_model_id'] = model_id
+        self.save_config(self.config)
+        print(f"{Fore.GREEN}Model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
+        
+    def register_sagemaker_model(self, helper):
+        """
+        Register a SageMaker embedding model by creating the necessary connector and model in OpenSearch.
+        """
+        # Prompt for necessary inputs
+        sagemaker_endpoint_arn = input("Enter your SageMaker inference endpoint ARN: ")
+        sagemaker_endpoint_url = input("Enter your SageMaker inference endpoint URL: ")
+        sagemaker_region = input(f"Enter your SageMaker region [{self.aws_region}]: ") or self.aws_region
+        connector_role_name = "my_test_sagemaker_connector_role"
+        create_connector_role_name = "my_test_create_sagemaker_connector_role"
+
+        # Set up connector role inline policy
+        connector_role_inline_policy = {
+            "Version": "2012-10-17",
+            "Statement": [
+                {
+                    "Action": ["sagemaker:InvokeEndpoint"],
+                    "Effect": "Allow",
+                    "Resource": sagemaker_endpoint_arn
+                }
+            ]
+        }
+
+        # Create connector input
+        create_connector_input = {
+            "name": "SageMaker embedding model connector",
+            "description": "Connector for my SageMaker embedding model",
+            "version": "1.0",
+            "protocol": "aws_sigv4",
+            "parameters": {
+                "region": sagemaker_region,
+                "service_name": "sagemaker"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "headers": {
+                        "content-type": "application/json"
+                    },
+                    "url": sagemaker_endpoint_url,
+                    "request_body": "${parameters.input}",
+                    "pre_process_function": "connector.pre_process.default.embedding",
+                    "post_process_function": "connector.post_process.default.embedding"
+                }
+            ]
+        }
+
+        # Create connector
+        connector_id = helper.create_connector_with_role(
+            connector_role_inline_policy,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Register model
+        model_name = 'SageMaker embedding model'
+        description = 'SageMaker embedding model for semantic search'
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Save model_id to config
+        self.config['embedding_model_id'] = model_id
+        self.save_config(self.config)
+        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")
+
+    def register_cohere_model(self, helper):
+        """
+        Register a Cohere embedding model by creating the necessary connector and model in OpenSearch.
+        """
+        # Prompt for necessary inputs
+        secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
+        secret_key = 'cohere_api_key'
+        cohere_api_key = input("Enter your Cohere API key: ")
+        secret_value = {secret_key: cohere_api_key}
+
+        connector_role_name = "my_test_cohere_connector_role"
+        create_connector_role_name = "my_test_create_cohere_connector_role"
+
+        # Default connector input
+        default_connector_input = {
+            "name": "Cohere Embedding Model Connector",
+            "description": "Connector for Cohere embedding model",
+            "version": "1.0",
+            "protocol": "http",
+            "parameters": {
+                "model": "embed-english-v3.0",
+                "input_type": "search_document",
+                "truncate": "END"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "url": "https://api.cohere.ai/v1/embed",
+                    "headers": {
+                        "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
+                        "Request-Source": "unspecified:opensearch"
+                    },
+                    "request_body": "{ \"texts\": ${parameters.texts}, \"truncate\": \"${parameters.truncate}\", \"model\": \"${parameters.model}\", \"input_type\": \"${parameters.input_type}\" }",
+                    "pre_process_function": "connector.pre_process.cohere.embedding",
+                    "post_process_function": "connector.post_process.cohere.embedding"
+                }
+            ]
+        }
+
+        # Get model details from user
+        create_connector_input = self.get_custom_model_details(default_connector_input)
+        if not create_connector_input:
+            return  # Abort if no valid input
+
+        # Create connector
+        connector_id = helper.create_connector_with_secret(
+            secret_name,
+            secret_value,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Register model
+        model_name = create_connector_input.get('name', 'Cohere embedding model')
+        description = create_connector_input.get('description', 'Cohere embedding model for semantic search')
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Save model_id to config
+        self.config['embedding_model_id'] = model_id
+        self.save_config(self.config)
+        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")
+
+    def register_openai_model(self, helper):
+        """
+        Register an OpenAI embedding model by creating the necessary connector and model in OpenSearch.
+        """
+        # Prompt for necessary inputs
+        secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
+        secret_key = 'openai_api_key'
+        openai_api_key = input("Enter your OpenAI API key: ")
+        secret_value = {secret_key: openai_api_key}
+
+        connector_role_name = "my_test_openai_connector_role"
+        create_connector_role_name = "my_test_create_openai_connector_role"
+
+        # Default connector input
+        default_connector_input = {
+            "name": "OpenAI Embedding Model Connector",
+            "description": "Connector for OpenAI embedding model",
+            "version": "1.0",
+            "protocol": "http",
+            "parameters": {
+                "model": "text-embedding-ada-002"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "url": "https://api.openai.com/v1/embeddings",
+                    "headers": {
+                        "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
+                        "Content-Type": "application/json"
+                    },
+                    "request_body": "{ \"input\": ${parameters.input}, \"model\": \"${parameters.model}\" }",
+                    "pre_process_function": "connector.pre_process.openai.embedding",
+                    "post_process_function": "connector.post_process.openai.embedding"
+                }
+            ]
+        }
+
+        # Get model details from user
+        create_connector_input = self.get_custom_model_details(default_connector_input)
+        if not create_connector_input:
+            return  # Abort if no valid input
+
+        # Create connector
+        connector_id = helper.create_connector_with_secret(
+            secret_name,
+            secret_value,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Register model
+        model_name = create_connector_input.get('name', 'OpenAI embedding model')
+        description = create_connector_input.get('description', 'OpenAI embedding model for semantic search')
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Save model_id to config
+        self.config['embedding_model_id'] = model_id
+        self.save_config(self.config)
+        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")
+
+    def prompt_opensource_model_registration(self):
+        """
+        Handle model registration for open-source OpenSearch.
+        """
+        print("\nWould you like to register an embedding model now?")
+        print("1. Yes, register a new model")
+        print("2. No, I will register the model later")
+        choice = input("Enter your choice (1-2): ").strip()
+
+        if choice == '1':
+            self.register_model_opensource_interactive()
+        elif choice == '2':
+            print("Skipping model registration. You can register models later using the appropriate commands.")
+        else:
+            print(f"{Fore.RED}Invalid choice. Skipping model registration.{Style.RESET_ALL}")
+
+    def register_model_opensource_interactive(self):
+        """
+        Interactive method to register a new embedding model for open-source OpenSearch.
+        """
+        # Ensure OpenSearch client is initialized
+        if not self.opensearch_client:
+            print(f"{Fore.RED}OpenSearch client is not initialized. Please run setup again.{Style.RESET_ALL}")
+            return
+
+        # Prompt user to select a model
+        print("\nPlease select an embedding model to register:")
+        print("1. Cohere Embedding Model")
+        print("2. OpenAI Embedding Model")
+        print("3. Hugging Face Transformers Model")
+        print("4. Custom PyTorch Model")
+        model_choice = input("Enter your choice (1-4): ")
+
+        if model_choice == '1':
+            self.register_cohere_model_opensource()
+        elif model_choice == '2':
+            self.register_openai_model_opensource()
+        elif model_choice == '3':
+            self.register_huggingface_model()
+        elif model_choice == '4':
+            self.register_custom_pytorch_model()
+        else:
+            print(f"{Fore.RED}Invalid choice. Exiting model registration.{Style.RESET_ALL}")
+            return
+
+    def register_cohere_model_opensource(self):
+        """
+        Register a Cohere embedding model in open-source OpenSearch.
+        """
+        cohere_api_key = input("Enter your Cohere API key: ").strip()
+        if not cohere_api_key:
+            print(f"{Fore.RED}API key is required. Aborting.{Style.RESET_ALL}")
+            return
+
+        print("\nDo you want to use the default configuration or provide custom settings?")
+        print("1. Use default configuration")
+        print("2. Provide custom settings")
+        config_choice = input("Enter your choice (1-2): ").strip()
+
+        if config_choice == '1':
+            # Use default configurations
+            connector_payload = {
+                "name": "Cohere Embedding Connector",
+                "description": "Connector for Cohere embedding model",
+                "version": "1.0",
+                "protocol": "http",
+                "parameters": {
+                    "model": "embed-english-v3.0",
+                    "input_type": "search_document",
+                    "truncate": "END"
+                },
+                "credential": {
+                    "cohere_key": cohere_api_key
+                },
+                "actions": [
+                    {
+                        "action_type": "predict",
+                        "method": "POST",
+                        "url": "https://api.cohere.ai/v1/embed",
+                        "headers": {
+                            "Authorization": "Bearer ${credential.cohere_key}",
+                            "Request-Source": "unspecified:opensearch"
+                        },
+                        "request_body": "{ \"texts\": ${parameters.texts}, \"truncate\": \"${parameters.truncate}\", \"model\": \"${parameters.model}\", \"input_type\": \"${parameters.input_type}\" }",
+                        "pre_process_function": "connector.pre_process.cohere.embedding",
+                        "post_process_function": "connector.post_process.cohere.embedding"
+                    }
+                ]
+            }
+            model_group_payload = {
+                "name": f"cohere_model_group_{int(time.time())}",
+                "description": "Model group for Cohere models"
+            }
+        elif config_choice == '2':
+            # Get custom configurations
+            print("\nPlease enter your connector details as a JSON object.")
+            connector_payload = self.get_custom_json_input()
+            if not connector_payload:
+                return
+
+            print("\nPlease enter your model group details as a JSON object.")
+            model_group_payload = self.get_custom_json_input()
+            if not model_group_payload:
+                return
+        else:
+            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            return
+
+        # Register the connector
+        try:
+            connector_response = self.opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/connectors/_create",
+                body=connector_payload
+            )
+            connector_id = connector_response.get('connector_id')
+            if not connector_id:
+                print(f"{Fore.RED}Failed to register connector. Response: {connector_response}{Style.RESET_ALL}")
+                return
+            print(f"{Fore.GREEN}Connector registered successfully. Connector ID: {connector_id}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error registering connector: {ex}{Style.RESET_ALL}")
+            return
+
+        # Create model group
+        try:
+            model_group_response = self.opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/model_groups/_register",
+                body=model_group_payload
+            )
+            model_group_id = model_group_response.get('model_group_id')
+            if not model_group_id:
+                print(f"{Fore.RED}Failed to create model group. Response: {model_group_response}{Style.RESET_ALL}")
+                return
+            print(f"{Fore.GREEN}Model group created successfully. Model Group ID: {model_group_id}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error creating model group: {ex}{Style.RESET_ALL}")
+            if 'illegal_argument_exception' in str(ex) and 'already being used' in str(ex):
+                print(f"{Fore.YELLOW}A model group with this name already exists. Using the existing group.{Style.RESET_ALL}")
+                model_group_id = str(ex).split('ID: ')[-1].strip("'.")
+            else:
+                return
+
+        # Create model payload
+        model_payload = {
+            "name": connector_payload.get('name', 'Cohere embedding model'),
+            "function_name": "REMOTE",
+            "model_group_id": model_group_id,
+            "description": connector_payload.get('description', 'Cohere embedding model for semantic search'),
+            "connector_id": connector_id
+        }
+
+        # Register the model
+        try:
+            response = self.opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/models/_register",
+                body=model_payload
+            )
+            task_id = response.get('task_id')
+            if task_id:
+                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+                # Wait for the task to complete and retrieve the model_id
+                model_id = self.wait_for_model_registration(task_id)
+                if model_id:
+                    # Deploy the model
+                    deploy_response = self.opensearch_client.transport.perform_request(
+                        method="POST",
+                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    )
+                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
+                    self.config['embedding_model_id'] = model_id
+                    self.save_config(self.config)
+                else:
+                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+            else:
+                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
+
+    def register_openai_model_opensource(self):
+        """
+        Register an OpenAI embedding model in open-source OpenSearch.
+        """
+        openai_api_key = input("Enter your OpenAI API key: ").strip()
+        if not openai_api_key:
+            print(f"{Fore.RED}API key is required. Aborting.{Style.RESET_ALL}")
+            return
+
+        print("\nDo you want to use the default configuration or provide custom settings?")
+        print("1. Use default configuration")
+        print("2. Provide custom settings")
+        config_choice = input("Enter your choice (1-2): ").strip()
+
+        if config_choice == '1':
+            # Use default configurations
+            connector_payload = {
+                "name": "OpenAI Embedding Connector",
+                "description": "Connector for OpenAI embedding model",
+                "version": "1",
+                "protocol": "http",
+                "parameters": {
+                    "model": "text-embedding-ada-002"
+                },
+                "credential": {
+                    "openAI_key": openai_api_key
+                },
+                "actions": [
+                    {
+                        "action_type": "predict",
+                        "method": "POST",
+                        "url": "https://api.openai.com/v1/embeddings",
+                        "headers": {
+                            "Authorization": "Bearer ${credential.openAI_key}",
+                            "Content-Type": "application/json"
+                        },
+                        "request_body": "{ \"input\": ${parameters.input}, \"model\": \"${parameters.model}\" }",
+                        "pre_process_function": "connector.pre_process.openai.embedding",
+                        "post_process_function": "connector.post_process.openai.embedding"
+                    }
+                ]
+            }
+            model_group_payload = {
+                "name": f"openai_model_group_{int(time.time())}",
+                "description": "Model group for OpenAI models"
+            }
+        elif config_choice == '2':
+            # Get custom configurations
+            print("\nPlease enter your connector details as a JSON object.")
+            connector_payload = self.get_custom_json_input()
+            if not connector_payload:
+                return
+
+            print("\nPlease enter your model group details as a JSON object.")
+            model_group_payload = self.get_custom_json_input()
+            if not model_group_payload:
+                return
+        else:
+            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            return
+
+        # Register the connector
+        try:
+            connector_response = self.opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/connectors/_create",
+                body=connector_payload
+            )
+            connector_id = connector_response.get('connector_id')
+            if not connector_id:
+                print(f"{Fore.RED}Failed to register connector. Response: {connector_response}{Style.RESET_ALL}")
+                return
+            print(f"{Fore.GREEN}Connector registered successfully. Connector ID: {connector_id}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error registering connector: {ex}{Style.RESET_ALL}")
+            return
+
+        # Create model group
+        try:
+            model_group_response = self.opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/model_groups/_register",
+                body=model_group_payload
+            )
+            model_group_id = model_group_response.get('model_group_id')
+            if not model_group_id:
+                print(f"{Fore.RED}Failed to create model group. Response: {model_group_response}{Style.RESET_ALL}")
+                return
+            print(f"{Fore.GREEN}Model group created successfully. Model Group ID: {model_group_id}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error creating model group: {ex}{Style.RESET_ALL}")
+            if 'illegal_argument_exception' in str(ex) and 'already being used' in str(ex):
+                print(f"{Fore.YELLOW}A model group with this name already exists. Using the existing group.{Style.RESET_ALL}")
+                model_group_id = str(ex).split('ID: ')[-1].strip("'.")
+            else:
+                return
+
+        # Create model payload
+        model_payload = {
+            "name": connector_payload.get('name', 'OpenAI embedding model'),
+            "function_name": "REMOTE",
+            "model_group_id": model_group_id,
+            "description": connector_payload.get('description', 'OpenAI embedding model for semantic search'),
+            "connector_id": connector_id
+        }
+
+        # Register the model
+        try:
+            response = self.opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/models/_register",
+                body=model_payload
+            )
+            task_id = response.get('task_id')
+            if task_id:
+                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+                # Wait for the task to complete and retrieve the model_id
+                model_id = self.wait_for_model_registration(task_id)
+                if model_id:
+                    # Deploy the model
+                    deploy_response = self.opensearch_client.transport.perform_request(
+                        method="POST",
+                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    )
+                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
+                    self.config['embedding_model_id'] = model_id
+                    self.save_config(self.config)
+                else:
+                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+            else:
+                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
+
+    def get_custom_json_input(self):
+        """Helper method to get custom JSON input from the user."""
+        json_input = input("Enter your JSON object: ").strip()
+        try:
+            return json.loads(json_input)
+        except json.JSONDecodeError as e:
+            print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
+            return None
+
+
+    def get_model_id_from_task(self, task_id, timeout=600, interval=10):
+        """
+        Wait for the model registration task to complete and return the model_id.
+        """
+        import time
+        end_time = time.time() + timeout
+        while time.time() < end_time:
+            try:
+                response = self.opensearch_client.transport.perform_request(
+                    method="GET",
+                    url=f"/_plugins/_ml/tasks/{task_id}"
+                )
+                state = response.get('state')
+                if state == 'COMPLETED':
+                    model_id = response.get('model_id')
+                    return model_id
+                elif state in ['FAILED', 'STOPPED']:
+                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
+                    return None
+                else:
+                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
+                    time.sleep(interval)
+            except Exception as ex:
+                print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
+                time.sleep(interval)
+        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
+        return None
+
+    def register_huggingface_model(self):
+        """
+        Register a Hugging Face Transformers model in open-source OpenSearch.
+        """
+        print("\nDo you want to use the default configuration or provide custom settings?")
+        print("1. Use default configuration")
+        print("2. Provide custom settings")
+        config_choice = input("Enter your choice (1-2): ").strip()
+
+        if config_choice == '1':
+            # Use default configurations
+            model_name = "sentence-transformers/all-MiniLM-L6-v2"
+            model_payload = {
+                "name": f"huggingface_{model_name.split('/')[-1]}",
+                "model_format": "TORCH_SCRIPT",
+                "model_config": {
+                    "embedding_dimension": self.embedding_dimension,
+                    "framework_type": "SENTENCE_TRANSFORMERS",
+                    "model_type": "bert",
+                    "embedding_model": model_name
+                },
+                "description": f"Hugging Face Transformers model: {model_name}"
+            }
+        elif config_choice == '2':
+            # Get custom configurations
+            model_name = input("Enter the Hugging Face model ID (e.g., 'sentence-transformers/all-MiniLM-L6-v2'): ").strip()
+            if not model_name:
+                print(f"{Fore.RED}Model ID is required. Aborting.{Style.RESET_ALL}")
+                return
+
+            print("\nPlease enter your model details as a JSON object.")
+            print("Example:")
+            example_payload = {
+                "name": f"huggingface_{model_name.split('/')[-1]}",
+                "model_format": "TORCH_SCRIPT",
+                "model_config": {
+                    "embedding_dimension": self.embedding_dimension,
+                    "framework_type": "SENTENCE_TRANSFORMERS",
+                    "model_type": "bert",
+                    "embedding_model": model_name
+                },
+                "description": f"Hugging Face Transformers model: {model_name}"
+            }
+            print(json.dumps(example_payload, indent=2))
+            
+            model_payload = self.get_custom_json_input()
+            if not model_payload:
+                return
+        else:
+            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            return
+
+        # Register the model
+        try:
+            response = self.opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/models/_register",
+                body=model_payload
+            )
+            task_id = response.get('task_id')
+            if task_id:
+                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+                # Wait for the task to complete and retrieve the model_id
+                model_id = self.wait_for_model_registration(task_id)
+                if model_id:
+                    # Deploy the model
+                    deploy_response = self.opensearch_client.transport.perform_request(
+                        method="POST",
+                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    )
+                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
+                    self.config['embedding_model_id'] = model_id
+                    self.save_config(self.config)
+                else:
+                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+            else:
+                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
+
+    def wait_for_model_registration(self, task_id, timeout=600, interval=10):
+        """
+        Wait for the model registration task to complete and return the model_id.
+        """
+        import time
+        end_time = time.time() + timeout
+        while time.time() < end_time:
+            try:
+                response = self.opensearch_client.transport.perform_request(
+                    method="GET",
+                    url=f"/_plugins/_ml/tasks/{task_id}"
+                )
+                state = response.get('state')
+                if state == 'COMPLETED':
+                    model_id = response.get('model_id')
+                    return model_id
+                elif state in ['FAILED', 'STOPPED']:
+                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
+                    return None
+                else:
+                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
+                    time.sleep(interval)
+            except Exception as ex:
+                print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
+                time.sleep(interval)
+        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
+        return None
+
+def register_custom_pytorch_model(self):
+    """
+    Register a custom PyTorch model in open-source OpenSearch.
+    """
+    print("\nDo you want to use the default configuration or provide custom settings?")
+    print("1. Use default configuration")
+    print("2. Provide custom settings")
+    config_choice = input("Enter your choice (1-2): ").strip()
+
+    if config_choice == '1':
+        # Use default configurations
+        model_path = input("Enter the path to your PyTorch model file (.pt or .pth): ").strip()
+        if not os.path.isfile(model_path):
+            print(f"{Fore.RED}Model file not found at '{model_path}'. Aborting.{Style.RESET_ALL}")
+            return
+
+        model_name = os.path.basename(model_path).split('.')[0]
+        model_payload = {
+            "name": f"custom_pytorch_{model_name}",
+            "model_format": "TORCH_SCRIPT",
+            "model_config": {
+                "embedding_dimension": self.embedding_dimension,
+                "framework_type": "CUSTOM",
+                "model_type": "bert"
+            },
+            "description": f"Custom PyTorch model: {model_name}"
+        }
+    elif config_choice == '2':
+        # Get custom configurations
+        model_path = input("Enter the path to your PyTorch model file (.pt or .pth): ").strip()
+        if not os.path.isfile(model_path):
+            print(f"{Fore.RED}Model file not found at '{model_path}'. Aborting.{Style.RESET_ALL}")
+            return
+
+        print("\nPlease enter your model details as a JSON object.")
+        print("Example:")
+        example_payload = {
+            "name": "custom_pytorch_model",
+            "model_format": "TORCH_SCRIPT",
+            "model_config": {
+                "embedding_dimension": self.embedding_dimension,
+                "framework_type": "CUSTOM",
+                "model_type": "bert"
+            },
+            "description": "Custom PyTorch model for semantic search"
+        }
+        print(json.dumps(example_payload, indent=2))
+        
+        model_payload = self.get_custom_json_input()
+        if not model_payload:
+            return
+    else:
+        print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+        return
+
+    # Upload the model file to OpenSearch
+    try:
+        with open(model_path, 'rb') as f:
+            model_content = f.read()
+
+        # Use the ML plugin's model upload API
+        upload_response = self.opensearch_client.transport.perform_request(
+            method="POST",
+            url="/_plugins/_ml/models/_upload",
+            params={"model_name": model_payload['name']},
+            body=model_content,
+            headers={'Content-Type': 'application/octet-stream'}
+        )
+        if 'model_id' not in upload_response:
+            print(f"{Fore.RED}Failed to upload model. Response: {upload_response}{Style.RESET_ALL}")
+            return
+        model_id = upload_response['model_id']
+        print(f"{Fore.GREEN}Model uploaded successfully. Model ID: {model_id}{Style.RESET_ALL}")
+    except Exception as ex:
+        print(f"{Fore.RED}Error uploading model: {ex}{Style.RESET_ALL}")
+        return
+
+    # Add the model_id to the payload
+    model_payload['model_id'] = model_id
+
+    # Register the model
+    try:
+        response = self.opensearch_client.transport.perform_request(
+            method="POST",
+            url="/_plugins/_ml/models/_register",
+            body=model_payload
+        )
+        task_id = response.get('task_id')
+        if task_id:
+            print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+            # Wait for the task to complete and retrieve the model_id
+            registered_model_id = self.wait_for_model_registration(task_id)
+            if registered_model_id:
+                # Deploy the model
+                deploy_response = self.opensearch_client.transport.perform_request(
+                    method="POST",
+                    url=f"/_plugins/_ml/models/{registered_model_id}/_deploy"
+                )
+                print(f"{Fore.GREEN}Model deployed successfully. Model ID: {registered_model_id}{Style.RESET_ALL}")
+                self.config['embedding_model_id'] = registered_model_id
+                self.save_config(self.config)
+            else:
+                print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+        else:
+            print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+    except Exception as ex:
+        print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
index 73b23a7b..3e3ec1d8 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
@@ -5,7 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-
 #  Licensed to Elasticsearch B.V. under one or more contributor
 #  license agreements. See the NOTICE file distributed with
 #  this work for additional information regarding copyright
@@ -39,34 +38,41 @@ def __init__(self, config):
         self.opensearch_endpoint = config.get('opensearch_endpoint')
         self.opensearch_username = config.get('opensearch_username')
         self.opensearch_password = config.get('opensearch_password')
+        self.service_type = config.get('service_type')
 
     def initialize_opensearch_client(self):
         # Initialize the OpenSearch client
-        # Handles both serverless and non-serverless configurations
-        # Returns True if successful, False otherwise
         if not self.opensearch_endpoint:
             print("OpenSearch endpoint not set. Please run setup first.")
             return False
-        
+
         parsed_url = urlparse(self.opensearch_endpoint)
         host = parsed_url.hostname
-        port = parsed_url.port or 443
+        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)  # Default ports
 
-        if self.is_serverless:
+        if self.service_type == 'serverless':
             credentials = boto3.Session().get_credentials()
             auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
-        else:
+        elif self.service_type == 'managed':
             if not self.opensearch_username or not self.opensearch_password:
                 print("OpenSearch username or password not set. Please run setup first.")
                 return False
             auth = (self.opensearch_username, self.opensearch_password)
+        elif self.service_type == 'open-source':
+            if self.opensearch_username and self.opensearch_password:
+                auth = (self.opensearch_username, self.opensearch_password)
+            else:
+                auth = None  # No authentication
+        else:
+            print("Invalid service type. Please check your configuration.")
+            return False
 
         try:
             self.opensearch_client = OpenSearch(
                 hosts=[{'host': host, 'port': port}],
                 http_auth=auth,
-                use_ssl=True,
-                verify_certs=True,
+                use_ssl=parsed_url.scheme == 'https',
+                verify_certs=False if parsed_url.scheme == 'https' else True,
                 connection_class=RequestsHttpConnection,
                 pool_maxsize=20
             )
@@ -77,12 +83,11 @@ def initialize_opensearch_client(self):
             return False
 
     def create_index(self, embedding_dimension, space_type):
-        # Create a new KNN index in OpenSearch
-        # Sets up the mapping for nominee_text and nominee_vector fields
         index_body = {
             "mappings": {
                 "properties": {
                     "nominee_text": {"type": "text"},
+                    "passage_chunk": {"type": "text"},
                     "nominee_vector": {
                         "type": "knn_vector",
                         "dimension": embedding_dimension,
@@ -138,19 +143,18 @@ def bulk_index(self, actions):
             print(f"Error during bulk indexing: {e}")
             return 0, len(actions)
 
-    def search(self, vector, k=5):
-        # Perform a KNN search using the provided vector
-        # Returns the top k matching documents
+    def search(self, query_text, model_id, k=5):
         try:
             response = self.opensearch_client.search(
                 index=self.index_name,
                 body={
                     "size": k,
-                    "_source": ["nominee_text"],
+                    "_source": ["passage_chunk"],
                     "query": {
-                        "knn": {
+                        "neural": {
                             "nominee_vector": {
-                                "vector": vector,
+                                "query_text": query_text,
+                                "model_id": model_id,
                                 "k": k
                             }
                         }
@@ -161,3 +165,11 @@ def search(self, vector, k=5):
         except Exception as e:
             print(f"Error during search: {e}")
             return []
+
+    def check_connection(self):
+        try:
+            self.opensearch_client.info()
+            return True
+        except Exception as e:
+            print(f"Error connecting to OpenSearch: {e}")
+            return False
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
index 40c48c85..d1092203 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
@@ -5,7 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-
 #  Licensed to Elasticsearch B.V. under one or more contributor
 #  license agreements. See the NOTICE file distributed with
 #  this work for additional information regarding copyright
@@ -24,216 +23,132 @@
 #  under the License.
 
 import json
-import tiktoken
 from colorama import Fore, Style, init
 from typing import List
-import boto3
-import botocore
-import time
-import random
 from opensearch_connector import OpenSearchConnector
+import requests
+import os
+import urllib3
+
+urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
 
 init(autoreset=True)  # Initialize colorama
 
 class Query:
-    LLM_MODEL_ID = 'amazon.titan-text-express-v1'
-
     def __init__(self, config):
         # Initialize the Query class with configuration
         self.config = config
-        self.aws_region = config.get('region')
         self.index_name = config.get('index_name')
-        self.bedrock_client = None
         self.opensearch = OpenSearchConnector(config)
         self.embedding_model_id = config.get('embedding_model_id')
-    def initialize_clients(self):
-        # Initialize AWS Bedrock and OpenSearch clients
-        # Returns True if successful, False otherwise
-        try:
-            self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
-            if self.opensearch.initialize_opensearch_client():
-                print("Clients initialized successfully.")
-                return True
-            else:
-                print("Failed to initialize OpenSearch client.")
-                return False
-        except Exception as e:
-            print(f"Failed to initialize clients: {e}")
-            return False
 
-    def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
-        if self.opensearch is None:
-            print("OpenSearch client is not initialized. Please run setup first.")
-            return None
-
-        delay = initial_delay
-        for attempt in range(max_retries):
-            try:
-                payload = {
-                    "text_docs": [text]
-                }
-                response = self.opensearch.opensearch_client.transport.perform_request(
-                    method="POST",
-                    url=f"/_plugins/_ml/_predict/text_embedding/{self.embedding_model_id}",
-                    body=payload
-                )
-                inference_results = response.get('inference_results', [])
-                if not inference_results:
-                    print(f"No inference results returned for text: {text}")
-                    return None
-                output = inference_results[0].get('output')
-
-                # Adjust the extraction of embedding data
-                if isinstance(output, list) and len(output) > 0:
-                    embedding_dict = output[0]
-                    if isinstance(embedding_dict, dict) and 'data' in embedding_dict:
-                        embedding = embedding_dict['data']
-                    else:
-                        print(f"Unexpected embedding output format: {output}")
-                        return None
-                elif isinstance(output, dict) and 'data' in output:
-                    embedding = output['data']
-                else:
-                    print(f"Unexpected embedding output format: {output}")
-                    return None
+        # Initialize OpenSearch client
+        if not self.initialize_clients():
+            print("Failed to initialize clients. Aborting.")
+            return
 
-                # Verify that embedding is a list of floats
-                if not isinstance(embedding, list) or not all(isinstance(x, (float, int)) for x in embedding):
-                    print(f"Embedding is not a list of floats: {embedding}")
-                    return None
+        # Check OpenSearch connection
+        if not self.opensearch.check_connection():
+            print("Failed to connect to OpenSearch. Please check your configuration.")
+            return
 
-                # Optionally, remove debugging print statements
-                # print(f"Extracted embedding of length {len(embedding)}")
-                return embedding
-            except Exception as ex:
-                print(f"Error on attempt {attempt + 1}: {ex}")
-                if attempt == max_retries - 1:
-                    raise
-                time.sleep(delay)
-                delay *= backoff_factor
-        return None
+    def initialize_clients(self):
+        # Initialize OpenSearch client only
+        if self.opensearch.initialize_opensearch_client():
+            print("OpenSearch client initialized successfully.")
+            return True
+        else:
+            print("Failed to initialize OpenSearch client.")
+            return False
 
     def bulk_query(self, queries, k=5):
-        # Perform bulk semantic search for multiple queries
-        # Generates embeddings for queries and searches OpenSearch index
-        # Returns a list of results containing query, context, and number of results
-        print("Generating embeddings for queries...")
-        query_vectors = []
-        for query in queries:
-            embedding = self.text_embedding(query)
-            if embedding:
-                query_vectors.append(embedding)
-            else:
-                print(f"{Fore.RED}Failed to generate embedding for query: {query}{Style.RESET_ALL}")
-                query_vectors.append(None)
-        
         print("Performing bulk semantic search...")
+
         results = []
-        for i, vector in enumerate(query_vectors):
-            if vector is None:
-                results.append({
-                    'query': queries[i],
-                    'context': "",
-                    'num_results': 0
-                })
-                continue
+        for query_text in queries:
             try:
-                hits = self.opensearch.search(vector, k)
-                context = '\n'.join([hit['_source']['nominee_text'] for hit in hits])
+                hits = self.opensearch.search(query_text, self.embedding_model_id, k)
+                if hits:
+                    # Collect the content from the retrieved documents
+                    documents = []
+                    for hit in hits:
+                        source = hit['_source']
+                        document = {
+                            'score': hit['_score'],
+                            'source': source
+                        }
+                        documents.append(document)
+                    num_results = len(hits)
+                else:
+                    documents = []
+                    num_results = 0
+                    print(f"{Fore.YELLOW}Warning: No hits found for query '{query_text}'.{Style.RESET_ALL}")
+
                 results.append({
-                    'query': queries[i],
-                    'context': context,
-                    'num_results': len(hits)
+                    'query': query_text,
+                    'documents': documents,
+                    'num_results': num_results
                 })
             except Exception as ex:
-                print(f"{Fore.RED}Error performing search for query '{queries[i]}': {ex}{Style.RESET_ALL}")
+                print(f"{Fore.RED}Error performing search for query '{query_text}': {str(ex)}{Style.RESET_ALL}")
                 results.append({
-                    'query': queries[i],
-                    'context': "",
+                    'query': query_text,
+                    'documents': [],
                     'num_results': 0
                 })
-        
+
         return results
 
-    def generate_answer(self, prompt, config):
-        # Generate an answer using the LLM model
-        # Handles token limit and configures LLM parameters
-        # Returns the generated answer or None if an error occurs
-        try:
-            max_input_tokens = 8192  # Max tokens for the model
-            expected_output_tokens = config.get('maxTokenCount', 1000)
-            encoding = tiktoken.get_encoding("cl100k_base")  # Use appropriate encoding
-
-            prompt_tokens = encoding.encode(prompt)
-            allowable_input_tokens = max_input_tokens - expected_output_tokens
-
-            if len(prompt_tokens) > allowable_input_tokens:
-                # Truncate the prompt to fit within the model's token limit
-                prompt_tokens = prompt_tokens[:allowable_input_tokens]
-                prompt = encoding.decode(prompt_tokens)
-                print(f"Prompt truncated to {allowable_input_tokens} tokens.")
-
-            # Simplified LLM config with only supported parameters
-            llm_config = {
-                'maxTokenCount': expected_output_tokens,
-                'temperature': config.get('temperature', 0.7),
-                'topP': config.get('topP', 1.0),
-                'stopSequences': config.get('stopSequences', [])
-            }
-
-            body = json.dumps({
-                'inputText': prompt,
-                'textGenerationConfig': llm_config
-            })
-            response = self.bedrock_client.invoke_model(modelId=self.LLM_MODEL_ID, body=body)
-            response_body = json.loads(response['body'].read())
-            results = response_body.get('results', [])
-            if not results:
-                print("No results returned from LLM.")
-                return None
-            answer = results[0].get('outputText', '').strip()
-            return answer
-        except Exception as ex:
-            print(f"Error generating answer from LLM: {ex}")
-            return None
 
+    def extract_relevant_sentences(self, query, text):
+        # Lowercase and remove punctuation from query
+        query_processed = ''.join(c.lower() if c.isalnum() or c.isspace() else ' ' for c in query)
+        query_words = set(query_processed.split())
+
+        # Split text into sentences based on punctuation and newlines
+        import re
+        sentences = re.split(r'[\n.!?]+', text)
+
+        sentence_scores = []
+        for sentence in sentences:
+            sentence = sentence.strip()
+            if not sentence:
+                continue
+            # Lowercase and remove punctuation from sentence
+            sentence_processed = ''.join(c.lower() if c.isalnum() or c.isspace() else ' ' for c in sentence)
+            sentence_words = set(sentence_processed.split())
+            common_words = query_words.intersection(sentence_words)
+            score = len(common_words) / (len(query_words) + 1e-6)  # Normalized score
+            if score > 0:
+                sentence_scores.append((score, sentence))
+
+        # Sort sentences by score in descending order
+        sentence_scores.sort(reverse=True)
+
+        # Return the sentences with highest scores
+        top_sentences = [sentence for score, sentence in sentence_scores]
+        return top_sentences
     def query_command(self, queries: List[str], num_results=5):
-        # Main query command to process multiple queries
-        # Performs semantic search and generates answers using LLM
-        # Prints results for each query
-        if not self.initialize_clients():
-            print("Failed to initialize clients. Aborting query.")
-            return
-        
         results = self.bulk_query(queries, k=num_results)
-        
-        llm_config = {
-            "maxTokenCount": 1000,
-            "temperature": 0.7,
-            "topP": 0.9,
-            "stopSequences": []
-        }
-        
+
         for result in results:
             print(f"\nQuery: {result['query']}")
-            print(f"Found {result['num_results']} results.")
-            
-            if not result['context']:
-                print(f"{Fore.RED}No context available for this query.{Style.RESET_ALL}")
-                continue
-            
-            augmented_prompt = f"""Context: {result['context']}
-Based on the above context, please provide a detailed and insightful answer to the following question. Feel free to make reasonable inferences or connections if the context doesn't provide all the information:
-
-Question: {result['query']}
-
-Answer:"""
-        
-            print("Generating answer using LLM...")
-            answer = self.generate_answer(augmented_prompt, llm_config)
-        
-            if answer:
-                print("Generated Answer:")
-                print(answer)
+            if result['documents']:
+                all_relevant_sentences = []
+                for doc in result['documents']:
+                    passage_chunks = doc['source'].get('passage_chunk', [])
+                    if not passage_chunks:
+                        continue
+                    for passage in passage_chunks:
+                        relevant_sentences = self.extract_relevant_sentences(result['query'], passage)
+                        all_relevant_sentences.extend(relevant_sentences)
+
+                if all_relevant_sentences:
+                    # Output the top relevant sentences
+                    print("Answer:")
+                    for sentence in all_relevant_sentences[:1]:  # Display the top sentence
+                        print(sentence)
+                else:
+                    print("No relevant sentences found.")
             else:
-                print("Failed to generate an answer.")
+                print("No documents found for this query.")
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
index 0e86bf15..e4d51b04 100755
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
@@ -25,7 +25,7 @@
 # under the License.
 
 """
-Main CLI script for OpenSearch with Bedrock Integration
+Main CLI script for OpenSearch PY ML
 """
 
 import argparse
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index 983ef7e9..ee8aa66f 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -5,7 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-
 #  Licensed to Elasticsearch B.V. under one or more contributor
 #  license agreements. See the NOTICE file distributed with
 #  this work for additional information regarding copyright
@@ -37,7 +36,9 @@
 from urllib.parse import urlparse
 from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth
 from AIConnectorHelper import AIConnectorHelper
+from model_register import ModelRegister
 from colorama import Fore, Style, init
+import ssl
 
 init(autoreset=True)
 class Setup:
@@ -46,20 +47,21 @@ class Setup:
     SERVICE_BEDROCK = 'bedrock-runtime'
 
     def __init__(self):
-            # Initialize setup variables
-            self.config = self.load_config()
-            self.aws_region = self.config.get('region')
-            self.iam_principal = self.config.get('iam_principal')
-            self.index_name = self.config.get('index_name')
-            self.collection_name = self.config.get('collection_name', '')
-            self.opensearch_endpoint = self.config.get('opensearch_endpoint', '')
-            self.is_serverless = self.config.get('is_serverless', 'False') == 'True'
-            self.opensearch_username = self.config.get('opensearch_username', '')
-            self.opensearch_password = self.config.get('opensearch_password', '')
-            self.aoss_client = None
-            self.bedrock_client = None
-            self.opensearch_client = None
-            self.opensearch_domain_name = self.get_opensearch_domain_name()
+        # Initialize setup variables
+        self.config = self.load_config()
+        self.aws_region = self.config.get('region')
+        self.iam_principal = self.config.get('iam_principal')
+        self.collection_name = self.config.get('collection_name', '')
+        self.opensearch_endpoint = self.config.get('opensearch_endpoint', '')
+        self.service_type = self.config.get('service_type', 'managed')
+        self.is_serverless = self.service_type == 'serverless'
+        self.opensearch_username = self.config.get('opensearch_username', '')
+        self.opensearch_password = self.config.get('opensearch_password', '')
+        self.aoss_client = None
+        self.bedrock_client = None
+        self.opensearch_client = None
+        self.opensearch_domain_name = self.get_opensearch_domain_name()
+        self.model_register = None
 
     def check_and_configure_aws(self):
         # Check if AWS credentials are configured and offer to reconfigure if needed
@@ -170,7 +172,6 @@ def get_password_with_asterisks(self, prompt="Enter password: "):
                         sys.stdout.flush()
             finally:
                 termios.tcsetattr(fd, termios.TCSADRAIN, old_settings)
-
     def setup_configuration(self):
         # Set up the configuration by prompting the user for various settings
         config = self.load_config()
@@ -178,28 +179,54 @@ def setup_configuration(self):
         self.aws_region = input(f"Enter your AWS Region [{config.get('region', 'us-west-2')}]: ") or config.get('region', 'us-west-2')
         self.iam_principal = input(f"Enter your IAM Principal ARN [{config.get('iam_principal', '')}]: ") or config.get('iam_principal', '')
 
-        service_type = input("Choose OpenSearch service type (1 for Serverless, 2 for Managed): ")
-        self.is_serverless = service_type == '1'
+        print("Choose OpenSearch service type:")
+        print("1. Serverless")
+        print("2. Managed")
+        print("3. Open-source")
+        service_choice = input("Enter your choice (1-3): ")
+
+        if service_choice == '1':
+            self.service_type = 'serverless'
+        elif service_choice == '2':
+            self.service_type = 'managed'
+        elif service_choice == '3':
+            self.service_type = 'open-source'
+        else:
+            print("Invalid choice. Defaulting to 'managed'")
+            self.service_type = 'managed'
 
-        if self.is_serverless:
-            self.index_name = input("Enter a name for your KNN index in OpenSearch: ")
+        if self.service_type == 'serverless':
             self.collection_name = input("Enter the name for your OpenSearch collection: ")
             self.opensearch_endpoint = None
             self.opensearch_username = None
             self.opensearch_password = None
-        else:
-            self.index_name = input("Enter a name for your KNN index in OpenSearch: ")
+        elif self.service_type == 'managed':
             self.opensearch_endpoint = input("Enter your OpenSearch domain endpoint: ")
             self.opensearch_username = input("Enter your OpenSearch username: ")
             self.opensearch_password = self.get_password_with_asterisks("Enter your OpenSearch password: ")
             self.collection_name = ''
+        elif self.service_type == 'open-source':
+            # For open-source, allow default endpoint
+            default_endpoint = 'https://localhost:9200'
+            self.opensearch_endpoint = input(f"Press Enter to use the default endpoint(or type your custom endpoint) [{default_endpoint}]: ").strip() or default_endpoint
+            auth_required = input("Does your OpenSearch instance require authentication? (yes/no): ").strip().lower()
+            if auth_required == 'yes':
+                self.opensearch_username = input("Enter your OpenSearch username: ")
+                self.opensearch_password = self.get_password_with_asterisks("Enter your OpenSearch password: ")
+            else:
+                self.opensearch_username = None
+                self.opensearch_password = None
+            self.collection_name = ''
+            # For open-source, we may not need AWS region and IAM principal
+            self.aws_region = ''
+            self.iam_principal = ''
 
+        # Remove index_name from configuration at this point
         self.config = {
             'region': self.aws_region,
             'iam_principal': self.iam_principal,
-            'index_name': self.index_name,
             'collection_name': self.collection_name if self.collection_name else '',
-            'is_serverless': str(self.is_serverless),
+            'service_type': self.service_type,
             'opensearch_endpoint': self.opensearch_endpoint if self.opensearch_endpoint else '',
             'opensearch_username': self.opensearch_username if self.opensearch_username else '',
             'opensearch_password': self.opensearch_password if self.opensearch_password else ''
@@ -412,10 +439,10 @@ def initialize_opensearch_client(self):
         if not self.opensearch_endpoint:
             print("OpenSearch endpoint not set. Please run setup first.")
             return False
-        
+
         parsed_url = urlparse(self.opensearch_endpoint)
         host = parsed_url.hostname
-        port = 443
+        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)  # Default ports
 
         if self.is_serverless:
             credentials = boto3.Session().get_credentials()
@@ -426,12 +453,25 @@ def initialize_opensearch_client(self):
                 return False
             auth = (self.opensearch_username, self.opensearch_password)
 
+        use_ssl = parsed_url.scheme == 'https'
+        verify_certs = False if use_ssl else True
+
+        # Create an SSL context that does not verify certificates
+        if use_ssl and not verify_certs:
+            ssl_context = ssl.create_default_context()
+            ssl_context.check_hostname = False
+            ssl_context.verify_mode = ssl.CERT_NONE
+        else:
+            ssl_context = None
+
         try:
             self.opensearch_client = OpenSearch(
                 hosts=[{'host': host, 'port': port}],
                 http_auth=auth,
-                use_ssl=True,
-                verify_certs=True,
+                use_ssl=use_ssl,
+                verify_certs=verify_certs,
+                ssl_show_warn=False,          # Suppress SSL warnings
+                ssl_context=ssl_context,      # Use the custom SSL context
                 connection_class=RequestsHttpConnection,
                 pool_maxsize=20
             )
@@ -551,15 +591,14 @@ def get_truncated_name(self, base_name, max_length=32):
         return base_name[:max_length-3] + "..."
 
     def setup_command(self):
-        # Main setup command that orchestrates the entire setup process
         self.check_and_configure_aws()
         self.setup_configuration()
         
-        if not self.initialize_clients():
+        if self.service_type != 'open-source' and not self.initialize_clients():
             print(f"{Fore.RED}Failed to initialize AWS clients. Setup incomplete.{Style.RESET_ALL}")
             return
         
-        if self.is_serverless:
+        if self.service_type == 'serverless':
             self.create_security_policies()
             collection_id = self.get_collection_id(self.collection_name)
             if not collection_id:
@@ -575,404 +614,100 @@ def setup_command(self):
                     else:
                         self.config['opensearch_endpoint'] = self.opensearch_endpoint
                         self.save_config(self.config)
-                        # Initialize opensearch_domain_name after setting opensearch_endpoint
                         self.opensearch_domain_name = self.get_opensearch_domain_name()
                 else:
                     print(f"{Fore.RED}Collection is not active. Setup incomplete.{Style.RESET_ALL}")
                     return
-        else:
+        elif self.service_type == 'managed':
             if not self.opensearch_endpoint:
                 print(f"{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}")
                 return
             else:
-                # Initialize opensearch_domain_name after setting opensearch_endpoint
                 self.opensearch_domain_name = self.get_opensearch_domain_name()
-        
+        elif self.service_type == 'open-source':
+            # Open-source setup
+            if not self.opensearch_endpoint:
+                print(f"{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}")
+                return
+            else:
+                self.opensearch_domain_name = None  # Not required for open-source
+
+        # Initialize OpenSearch client
         if self.initialize_opensearch_client():
-            print(f"{Fore.GREEN}OpenSearch client initialized successfully. Proceeding with index creation...{Style.RESET_ALL}")
-            embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
-            if self.verify_and_create_index(embedding_dimension, space_type, ef_construction):
-                print(f"{Fore.GREEN}KNN index setup completed successfully.{Style.RESET_ALL}")
-                self.config['embedding_dimension'] = str(embedding_dimension)
-                self.config['space_type'] = space_type
-                self.config['ef_construction'] = str(ef_construction)
+            print(f"{Fore.GREEN}OpenSearch client initialized successfully.{Style.RESET_ALL}")
+            
+            # Prompt user to choose between creating a new index or using an existing one
+            print("\nDo you want to create a new KNN index or use an existing one?")
+            print("1. Create a new KNN index")
+            print("2. Use an existing KNN index")
+            index_choice = input("Enter your choice (1-2): ").strip()
+            
+            if index_choice == '1':
+                # Proceed to create a new index
+                self.index_name = input("Enter a name for your new KNN index in OpenSearch: ").strip()
+        
+                # Save the index name in the configuration
+                self.config['index_name'] = self.index_name
                 self.save_config(self.config)
-                config_file_path = os.path.abspath(self.CONFIG_FILE)
-                print(f"{Fore.GREEN}Configuration saved successfully at {config_file_path}{Style.RESET_ALL}")
+        
+                print("Proceeding with index creation...")
+                embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
                 
-                # Ask the user if they want to register a model
-                self.prompt_model_registration()
-            else:
-                print(f"{Fore.RED}Index verification failed. Please check your index name and permissions.{Style.RESET_ALL}")
-        else:
-            print(f"{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}")
-
-    def prompt_model_registration(self):
-        """
-        Prompt the user to register a model or input an existing model ID.
-        """
-        print("\nWould you like to register an embedding model now?")
-        print("1. Yes, register a new model")
-        print("2. No, I already have a model ID")
-        print("3. Skip this step")
-        choice = input("Enter your choice (1-2): ").strip()
-
-        if choice == '1':
-            self.register_model_interactive()
-        elif choice == '2':
-            model_id = input("Please enter your existing embedding model ID: ").strip()
-            if model_id:
-                self.config['embedding_model_id'] = model_id
+                if self.verify_and_create_index(embedding_dimension, space_type, ef_construction):
+                    print(f"{Fore.GREEN}KNN index '{self.index_name}' created successfully.{Style.RESET_ALL}")
+                    # Save index details to config
+                    self.config['embedding_dimension'] = str(embedding_dimension)
+                    self.config['space_type'] = space_type
+                    self.config['ef_construction'] = str(ef_construction)
+                    self.save_config(self.config)
+                else:
+                    print(f"{Fore.RED}Index creation failed. Please check your permissions and try again.{Style.RESET_ALL}")
+                    return
+            elif index_choice == '2':
+                # Use existing index
+                existing_index_name = input("Enter the name of your existing KNN index: ").strip()
+                if not existing_index_name:
+                    print(f"{Fore.RED}Index name cannot be empty. Aborting.{Style.RESET_ALL}")
+                    return
+                self.index_name = existing_index_name
+                self.config['index_name'] = self.index_name
                 self.save_config(self.config)
-                print(f"{Fore.GREEN}Model ID '{model_id}' saved successfully in configuration.{Style.RESET_ALL}")
+                # Load index details from config or prompt for them
+                if 'embedding_dimension' in self.config and 'space_type' in self.config and 'ef_construction' in self.config:
+                    embedding_dimension = int(self.config['embedding_dimension'])
+                    space_type = self.config['space_type']
+                    ef_construction = int(self.config['ef_construction'])
+                    print(f"Using existing index '{self.index_name}' with embedding dimension {embedding_dimension}, space type '{space_type}', and ef_construction {ef_construction}.")
+                else:
+                    print("Index details not found in configuration.")
+                    embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
+                    # Save index details to config
+                    self.config['embedding_dimension'] = str(embedding_dimension)
+                    self.config['space_type'] = space_type
+                    self.config['ef_construction'] = str(ef_construction)
+                    self.save_config(self.config)
+                # Verify that the index exists
+                if not self.opensearch_client.indices.exists(index=self.index_name):
+                    print(f"{Fore.RED}Index '{self.index_name}' does not exist in OpenSearch. Aborting.{Style.RESET_ALL}")
+                    return
             else:
-                print(f"{Fore.RED}No model ID provided. Skipping model registration.{Style.RESET_ALL}")
-        else:
-            print("Skipping model registration.")
-
-    def register_model_interactive(self):
-        """
-        Interactive method to register a new embedding model during setup.
-        """
-        # Load existing config
-        self.config = self.load_config()
-
-        # Initialize clients
-        if not self.initialize_clients():
-            print(f"{Fore.RED}Failed to initialize AWS clients. Cannot proceed.{Style.RESET_ALL}")
-            return
-
-        # Ensure opensearch_endpoint is set
-        if not self.opensearch_endpoint:
-            self.opensearch_endpoint = self.config.get('opensearch_endpoint')
-            if not self.opensearch_endpoint:
-                print(f"{Fore.RED}OpenSearch endpoint not set. Please run 'setup' command first.{Style.RESET_ALL}")
+                print(f"{Fore.RED}Invalid choice. Please run setup again and select a valid option.{Style.RESET_ALL}")
                 return
 
-        # Initialize opensearch_domain_name
-        self.opensearch_domain_name = self.get_opensearch_domain_name()
-
-        # Extract the IAM user name from the IAM principal ARN
-        aws_user_name = self.get_iam_user_name_from_arn(self.iam_principal)
-
-        if not aws_user_name:
-            print("Could not extract IAM user name from IAM principal ARN.")
-            aws_user_name = input("Enter your AWS IAM user name: ")
-
-        # Instantiate AIConnectorHelper
-        helper = AIConnectorHelper(
-            region=self.aws_region,
-            opensearch_domain_name=self.opensearch_domain_name,
-            opensearch_domain_username=self.opensearch_username,
-            opensearch_domain_password=self.opensearch_password,
-            aws_user_name=aws_user_name,
-            aws_role_name=None  # Set to None or provide if applicable
-        )
-
-        # Prompt user to select a model
-        print("Please select an embedding model to register:")
-        print("1. Bedrock Titan Embedding Model")
-        print("2. SageMaker Embedding Model")
-        print("3. Cohere Embedding Model")
-        print("4. OpenAI Embedding Model")
-        model_choice = input("Enter your choice (1-4): ")
-
-        # Call the appropriate method based on the user's choice
-        if model_choice == '1':
-            self.register_bedrock_model(helper)
-        elif model_choice == '2':
-            self.register_sagemaker_model(helper)
-        elif model_choice == '3':
-            self.register_cohere_model(helper)
-        elif model_choice == '4':
-            self.register_openai_model(helper)
+            # Proceed with model registration
+            # Initialize ModelRegister now that OpenSearch client and domain name are available
+            self.model_register = ModelRegister(
+                self.config,
+                self.opensearch_client,
+                self.opensearch_domain_name
+            )
+            
+            # Model Registration
+            if self.service_type != 'open-source':
+                # AWS-managed OpenSearch: Proceed with model registration
+                self.model_register.prompt_model_registration()
+            else:
+                # Open-source OpenSearch: Provide instructions or automate model registration
+                self.model_register.prompt_opensource_model_registration()
         else:
-            print(f"{Fore.RED}Invalid choice. Exiting model registration.{Style.RESET_ALL}")
-            return
-        
-    def register_bedrock_model(self, helper):
-        """
-        Register a Bedrock embedding model by creating the necessary connector and model in OpenSearch.
-        """
-        # Prompt for necessary inputs
-        bedrock_region = input(f"Enter your Bedrock region [{self.aws_region}]: ") or self.aws_region
-        connector_role_name = "my_test_bedrock_connector_role"
-        create_connector_role_name = "my_test_create_bedrock_connector_role"
-
-        # Set up connector role inline policy
-        connector_role_inline_policy = {
-            "Version": "2012-10-17",
-            "Statement": [
-                {
-                    "Action": ["bedrock:InvokeModel"],
-                    "Effect": "Allow",
-                    "Resource": "arn:aws:bedrock:*::foundation-model/amazon.titan-embed-text-v1"
-                }
-            ]
-        }
-
-        # Create connector input
-        create_connector_input = {
-            "name": "Amazon Bedrock Connector: titan embedding v1",
-            "description": "The connector to Bedrock Titan embedding model",
-            "version": 1,
-            "protocol": "aws_sigv4",
-            "parameters": {
-                "region": bedrock_region,
-                "service_name": "bedrock"
-            },
-            "actions": [
-                {
-                    "action_type": "predict",
-                    "method": "POST",
-                    "url": f"https://bedrock-runtime.{bedrock_region}.amazonaws.com/model/amazon.titan-embed-text-v1/invoke",
-                    "headers": {
-                        "content-type": "application/json",
-                        "x-amz-content-sha256": "required"
-                    },
-                    "request_body": "{ \"inputText\": \"${parameters.inputText}\" }",
-                    "pre_process_function": "\n    StringBuilder builder = new StringBuilder();\n    builder.append(\"\\\"\");\n    String first = params.text_docs[0];\n    builder.append(first);\n    builder.append(\"\\\"\");\n    def parameters = \"{\" +\"\\\"inputText\\\":\" + builder + \"}\";\n    return  \"{\" +\"\\\"parameters\\\":\" + parameters + \"}\";",
-                    "post_process_function": "\n      def name = \"sentence_embedding\";\n      def dataType = \"FLOAT32\";\n      if (params.embedding == null || params.embedding.length == 0) {\n        return params.message;\n      }\n      def shape = [params.embedding.length];\n      def json = \"{\" +\n                 \"\\\"name\\\":\\\"\" + name + \"\\\",\" +\n                 \"\\\"data_type\\\":\\\"\" + dataType + \"\\\",\" +\n                 \"\\\"shape\\\":\" + shape + \",\" +\n                 \"\\\"data\\\":\" + params.embedding +\n                 \"}\";\n      return json;\n    "
-                }
-            ]
-        }
-
-        # Create connector
-        print("Creating connector...")
-        connector_id = helper.create_connector_with_role(
-            connector_role_inline_policy,
-            connector_role_name,
-            create_connector_role_name,
-            create_connector_input,
-            sleep_time_in_seconds=10
-        )
-
-        if not connector_id:
-            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Register model
-        print("Registering model...")
-        model_name = 'Bedrock embedding model'
-        description = 'Bedrock embedding model for semantic search'
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
-
-        if not model_id:
-            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Save model_id to config
-        self.config['embedding_model_id'] = model_id
-        self.save_config(self.config)
-        print(f"{Fore.GREEN}Model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
-
-
-    def register_sagemaker_model(self, helper):
-        """
-        Register a SageMaker embedding model by creating the necessary connector and model in OpenSearch.
-        """
-        # Prompt for necessary inputs
-        sagemaker_endpoint_arn = input("Enter your SageMaker inference endpoint ARN: ")
-        sagemaker_endpoint_url = input("Enter your SageMaker inference endpoint URL: ")
-        sagemaker_region = input(f"Enter your SageMaker region [{self.aws_region}]: ") or self.aws_region
-        connector_role_name = "my_test_sagemaker_connector_role"
-        create_connector_role_name = "my_test_create_sagemaker_connector_role"
-
-        # Set up connector role inline policy
-        connector_role_inline_policy = {
-            "Version": "2012-10-17",
-            "Statement": [
-                {
-                    "Action": ["sagemaker:InvokeEndpoint"],
-                    "Effect": "Allow",
-                    "Resource": sagemaker_endpoint_arn
-                }
-            ]
-        }
-
-        # Create connector input
-        create_connector_input = {
-            "name": "SageMaker embedding model connector",
-            "description": "Connector for my SageMaker embedding model",
-            "version": "1.0",
-            "protocol": "aws_sigv4",
-            "parameters": {
-                "region": sagemaker_region,
-                "service_name": "sagemaker"
-            },
-            "actions": [
-                {
-                    "action_type": "predict",
-                    "method": "POST",
-                    "headers": {
-                        "content-type": "application/json"
-                    },
-                    "url": sagemaker_endpoint_url,
-                    "request_body": "${parameters.input}",
-                    "pre_process_function": "connector.pre_process.default.embedding",
-                    "post_process_function": "connector.post_process.default.embedding"
-                }
-            ]
-        }
-
-        # Create connector
-        connector_id = helper.create_connector_with_role(
-            connector_role_inline_policy,
-            connector_role_name,
-            create_connector_role_name,
-            create_connector_input,
-            sleep_time_in_seconds=10
-        )
-
-        if not connector_id:
-            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Register model
-        model_name = 'SageMaker embedding model'
-        description = 'SageMaker embedding model for semantic search'
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
-
-        if not model_id:
-            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Save model_id to config
-        self.config['embedding_model_id'] = model_id
-        self.save_config(self.config)
-        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")
-
-
-    def register_cohere_model(self, helper):
-        """
-        Register a Cohere embedding model by creating the necessary connector and model in OpenSearch.
-        """
-        # Prompt for necessary inputs
-        secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
-        secret_key = 'cohere_api_key'
-        cohere_api_key = input("Enter your Cohere API key: ")
-        secret_value = {secret_key: cohere_api_key}
-
-        connector_role_name = "my_test_cohere_connector_role"
-        create_connector_role_name = "my_test_create_cohere_connector_role"
-
-        # Create connector input
-        create_connector_input = {
-            "name": "Cohere Embedding Model Connector",
-            "description": "Connector for Cohere embedding model",
-            "version": "1.0",
-            "protocol": "http",
-            "parameters": {
-                "model": "embed-english-v3.0",
-                "input_type": "search_document",
-                "truncate": "END"
-            },
-            "actions": [
-                {
-                    "action_type": "predict",
-                    "method": "POST",
-                    "url": "https://api.cohere.ai/v1/embed",
-                    "headers": {
-                        "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
-                        "Request-Source": "unspecified:opensearch"
-                    },
-                    "request_body": "{ \"texts\": ${parameters.texts}, \"truncate\": \"${parameters.truncate}\", \"model\": \"${parameters.model}\", \"input_type\": \"${parameters.input_type}\" }",
-                    "pre_process_function": "connector.pre_process.cohere.embedding",
-                    "post_process_function": "connector.post_process.cohere.embedding"
-                }
-            ]
-        }
-
-        # Create connector
-        connector_id = helper.create_connector_with_secret(
-            secret_name,
-            secret_value,
-            connector_role_name,
-            create_connector_role_name,
-            create_connector_input,
-            sleep_time_in_seconds=10
-        )
-
-        if not connector_id:
-            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Register model
-        model_name = 'Cohere embedding model'
-        description = 'Cohere embedding model for semantic search'
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
-
-        if not model_id:
-            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Save model_id to config
-        self.config['embedding_model_id'] = model_id
-        self.save_config(self.config)
-        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")
-
-
-    def register_openai_model(self, helper):
-        """
-        Register an OpenAI embedding model by creating the necessary connector and model in OpenSearch.
-        """
-        # Prompt for necessary inputs
-        secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
-        secret_key = 'openai_api_key'
-        openai_api_key = input("Enter your OpenAI API key: ")
-        secret_value = {secret_key: openai_api_key}
-
-        connector_role_name = "my_test_openai_connector_role"
-        create_connector_role_name = "my_test_create_openai_connector_role"
-
-        # Create connector input
-        create_connector_input = {
-            "name": "OpenAI Embedding Model Connector",
-            "description": "Connector for OpenAI embedding model",
-            "version": "1.0",
-            "protocol": "http",
-            "parameters": {
-                "model": "text-embedding-ada-002"
-            },
-            "actions": [
-                {
-                    "action_type": "predict",
-                    "method": "POST",
-                    "url": "https://api.openai.com/v1/embeddings",
-                    "headers": {
-                        "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
-                    },
-                    "request_body": "{ \"input\": ${parameters.input}, \"model\": \"${parameters.model}\" }",
-                    "pre_process_function": "connector.pre_process.openai.embedding",
-                    "post_process_function": "connector.post_process.openai.embedding"
-                }
-            ]
-        }
-
-        # Create connector
-        connector_id = helper.create_connector_with_secret(
-            secret_name,
-            secret_value,
-            connector_role_name,
-            create_connector_role_name,
-            create_connector_input,
-            sleep_time_in_seconds=10
-        )
-
-        if not connector_id:
-            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Register model
-        model_name = 'OpenAI embedding model'
-        description = 'OpenAI embedding model for semantic search'
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
-
-        if not model_id:
-            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Save model_id to config
-        self.config['embedding_model_id'] = model_id
-        self.save_config(self.config)
-        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")
+            print(f"{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}")
\ No newline at end of file

From fc2ace8b0bda2d0e6fa308773a7fb91caf7d82ee Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Thu, 28 Nov 2024 22:54:22 -0800
Subject: [PATCH 11/42] Remove requirements.txt and setup.py from Git tracking

- Remove requirements.txt and setup.py from Git repository
- Add these files to .gitignore to prevent future tracking
- Keep local copies of these files for development purposes

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../rag_pipeline/rag/requirements.txt         |  9 ----
 .../ml_commons/rag_pipeline/rag/setup.py      | 47 -------------------
 2 files changed, 56 deletions(-)
 delete mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/requirements.txt
 delete mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/requirements.txt b/opensearch_py_ml/ml_commons/rag_pipeline/rag/requirements.txt
deleted file mode 100644
index dc41b248..00000000
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/requirements.txt
+++ /dev/null
@@ -1,9 +0,0 @@
-boto3
-opensearch-py
-pandas
-configparser
-PyPDF2
-tiktoken
-tqdm
-colorama
-requests_aws4auth
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py
deleted file mode 100644
index 1c806760..00000000
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/setup.py
+++ /dev/null
@@ -1,47 +0,0 @@
-# SPDX-License-Identifier: Apache-2.0
-# The OpenSearch Contributors require contributions made to
-# this file be licensed under the Apache-2.0 license or a
-# compatible open source license.
-# Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
-
-
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
-from setuptools import setup, find_packages, find_namespace_packages
-
-setup(
-    # Name of the package
-    name="rag_pipeline",
-    
-    # Version of the package
-    version="0.1.0",
-    
-    # Automatically find and include all packages in the project
-    # This specifically looks for packages within 'opensearch_py_ml' and its subpackages
-    packages=find_namespace_packages(include=['opensearch_py_ml', 'opensearch_py_ml.*']),
-    
-    # Define console script entry points
-    # This creates a command-line executable named 'rag' that runs the main() function
-    # from the opensearch_py_ml.ml_commons.rag_pipeline.rag module
-    entry_points={
-        'console_scripts': [
-            'rag=opensearch_py_ml.ml_commons.rag_pipeline.rag:main',
-        ],
-    },
-)

From fe83b25fc17e457b24ba8e805caf40dbc60b2062 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Thu, 28 Nov 2024 23:25:32 -0800
Subject: [PATCH 12/42] Update setup.py file

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 setup.py | 19 ++++++++++---------
 1 file changed, 10 insertions(+), 9 deletions(-)

diff --git a/setup.py b/setup.py
index b1ecb39b..09a00558 100644
--- a/setup.py
+++ b/setup.py
@@ -25,10 +25,11 @@
 
 # flake8: noqa
 
-from setuptools import setup, find_packages, find_namespace_packages
 from codecs import open
 from os import path
 
+from setuptools import find_packages, setup
+
 here = path.abspath(path.dirname(__file__))
 about = {}
 with open(path.join(here, "opensearch_py_ml", "_version.py"), "r", "utf-8") as f:
@@ -70,30 +71,30 @@
     long_description_content_type="text/markdown",
     url=about["__url__"],
     author=about["__author__"],
-    author_email=about["__author_email"],
+    author_email=about["__author_email__"],
     maintainer=about["__maintainer__"],
-    maintainer_email=about["__maintainer_email"],
+    maintainer_email=about["__maintainer_email__"],
     license="Apache-2.0",
     classifiers=CLASSIFIERS,
     keywords="Opensearch opensearch_py_ml pandas python",
-    packages=find_namespace_packages(include=["opensearch_py_ml", "opensearch_py_ml.*"]),
+    packages=find_packages(include=["opensearch_py_ml", "opensearch_py_ml.*"]),
     project_urls={
         "Source Code": "https://github.com/opensearch-project/opensearch-py-ml",
         "Issue Tracker": "https://github.com/opensearch-project/opensearch-py-ml/issues",
     },
     install_requires=[
-        "opensearch-py>=2.2.0",
-        "pandas>=1.5.2,<3",
-        "matplotlib>=3.6.2,<4",
+        "opensearch-py>=2",
+        "pandas>=1.5,<3",
+        "matplotlib>=3.6.0,<4",
         "numpy>=1.24.0,<2",
+        "deprecated>=1.2.14,<2",
+        # Additional dependencies for the RAG pipeline
         "torch>=2.0.1,<2.1.0",
         "onnx>=1.15.0",
         "accelerate>=0.27",
         "sentence_transformers>=2.5.0,<2.6",
         "tqdm>=4.66.0,<5",
         "transformers>=4.36.0,<5",
-        "deprecated>=1.2.14,<2",
-        # Additional dependencies for the RAG pipeline
         "boto3>=1.26.0",
         "botocore>=1.29.0",
         "requests>=2.28.0",

From bea75e0c9b5cadd9be991cce328e243cbb1b6d49 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 29 Nov 2024 01:15:24 -0800
Subject: [PATCH 13/42] Remove .gitignore file from rag pipeline directory

- Delete opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
- Consolidate gitignore rules in the root .gitignore file

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/.gitignore    | 72 -------------------
 1 file changed, 72 deletions(-)
 delete mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore b/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
deleted file mode 100644
index f6c330e7..00000000
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/.gitignore
+++ /dev/null
@@ -1,72 +0,0 @@
-# Ignore data and ingestion directories
-ml_commons/rag_pipeline/data/
-ml_commons/rag_pipeline/ingestion/
-ml_commons/rag_pipeline/rag/config.ini
-# Compiled python modules.
-*.pyc
-__pycache__/
-
-# Setuptools distribution folder.
-dist/
-
-# Build folder
-build/
-
-# docs build folder
-docs/build/
-
-# pytest results
-tests/dataframe/results/*csv
-result_images/
-
-
-# Python egg metadata, regenerated from source files by setuptools.
-/*.egg-info
-opensearch_py_ml.egg-info/
-
-# PyCharm files
-.idea/
-
-# vscode files
-.vscode/
-
-# pytest files
-.pytest_cache/
-
-# Ignore MacOSX files
-.DS_Store
-
-# Jupyter Notebook
-.ipynb_checkpoints
-
-# IPython
-profile_default/
-ipython_config.py
-
-# pyenv
-.python-version
-
-# Environments
-.env
-.venv
-.nox
-env/
-venv/
-ENV/
-env.bak/
-venv.bak/
-.mypy_cache
-
-# Coverage
-.coverage
-.coverage.*
-*-junit.xml
-*-codecov.xml
-
-#model file
-all-MiniLM-L6-v2_torchscript_sentence-transformer.zip
-# torch generated files
-tests/test_SentenceTransformerModel
-tests/ml_commons/test_model_files
-tests/ml_models/tests
-docs/source/examples/synthetic_queries
\ No newline at end of file

From f5b74ed174310d80778fcedbfbd2ca17828ee705 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 29 Nov 2024 05:13:19 -0800
Subject: [PATCH 14/42] Organized Model registration into classes

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../rag_pipeline/rag/AIConnectorHelper.py     |  80 +-
 .../rag_pipeline/rag/IAMRoleHelper.py         |  12 +-
 .../rag/ml_models/BedrockModel.py             | 152 +++
 .../rag_pipeline/rag/ml_models/CohereModel.py | 318 ++++++
 .../rag/ml_models/CustomPyTorchModel.py       | 181 ++++
 .../rag/ml_models/HuggingFaceModel.py         | 152 +++
 .../rag_pipeline/rag/ml_models/OpenAIModel.py | 315 ++++++
 .../rag/ml_models/SageMakerModel.py           | 101 ++
 .../rag_pipeline/rag/ml_models/base_model.py  |  12 +
 .../rag_pipeline/rag/model_register.py        | 960 ++----------------
 .../ml_commons/rag_pipeline/rag/rag_setup.py  | 200 ++--
 11 files changed, 1459 insertions(+), 1024 deletions(-)
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CustomPyTorchModel.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/base_model.py

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
index 1218a589..e7babe39 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
@@ -32,6 +32,7 @@
 
 from IAMRoleHelper import IAMRoleHelper
 from SecretsHelper import SecretHelper
+from opensearch_py_ml.ml_commons.model_access_control import ModelAccessControl
 
 class AIConnectorHelper:
     def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
@@ -70,6 +71,9 @@ def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
             connection_class=RequestsHttpConnection
         )
 
+        # Initialize ModelAccessControl
+        self.model_access_control = ModelAccessControl(self.opensearch_client)
+
         # Initialize IAMRoleHelper and SecretHelper
         self.iam_helper = IAMRoleHelper(
             region=self.region,
@@ -139,61 +143,31 @@ def create_connector(self, create_connector_role_name, payload):
         return connector_id
 
     def search_model_group(self, model_group_name, create_connector_role_name):
-        payload = {
-            "query": {
-                "term": {
-                    "name.keyword": {
-                        "value": model_group_name
-                    }
-                }
-            }
-        }
-        headers = {"Content-Type": "application/json"}
-
-        # Obtain temporary credentials
-        awsauth = self.get_ml_auth(create_connector_role_name)
-
-        r = requests.post(
-            f'{self.opensearch_domain_url}/_plugins/_ml/model_groups/_search',
-            auth=awsauth,
-            json=payload,
-            headers=headers
-        )
-
-        response = json.loads(r.text)
+        """
+        Utilize ModelAccessControl to search for a model group by name.
+        """
+        response = self.model_access_control.search_model_group_by_name(model_group_name, size=1)
         return response
 
     def create_model_group(self, model_group_name, description, create_connector_role_name):
-        search_model_group_response = self.search_model_group(model_group_name, create_connector_role_name)
-        print("Search Model Group Response:", search_model_group_response)
-
-        if 'hits' in search_model_group_response and search_model_group_response['hits']['total']['value'] > 0:
-            return search_model_group_response['hits']['hits'][0]['_id']
-
-        payload = {
-            "name": model_group_name,
-            "description": description
-        }
-        headers = {"Content-Type": "application/json"}
-
-        # Obtain temporary credentials using the provided role name
-        awsauth = self.get_ml_auth(create_connector_role_name)
-
-        r = requests.post(
-            f'{self.opensearch_domain_url}/_plugins/_ml/model_groups/_register',
-            auth=awsauth,
-            json=payload,
-            headers=headers
-        )
-
-        print(r.text)
-        response = json.loads(r.text)
-
-        if 'model_group_id' in response:
-            return response['model_group_id']
+        """
+        Utilize ModelAccessControl to create or retrieve an existing model group.
+        """
+        model_group_id = self.model_access_control.get_model_group_id_by_name(model_group_name)
+        print("Search Model Group Response:", model_group_id)
+
+        if model_group_id:
+            return model_group_id
+
+        # Use ModelAccessControl to register model group
+        self.model_access_control.register_model_group(name=model_group_name, description=description)
+        
+        # Retrieve the newly created model group id
+        model_group_id = self.model_access_control.get_model_group_id_by_name(model_group_name)
+        if model_group_id:
+            return model_group_id
         else:
-            # Handle error gracefully
-            raise KeyError("The response does not contain 'model_group_id'. Response content: {}".format(response))
+            raise Exception("Failed to create model group.")
 
     def get_task(self, task_id, create_connector_role_name):
         try:
@@ -378,7 +352,7 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
         self.iam_helper.map_iam_role_to_backend_role(create_connector_role_arn)
         print('----------')
 
-        # 4. Create connector
+        # Step 4: Create connector
         print('Step 4: Create connector in OpenSearch')
         # When you create an IAM role, it can take some time for the changes to propagate across AWS systems.
         # During this time, some services might not immediately recognize the new role or its permissions.
@@ -479,7 +453,7 @@ def create_connector_with_role(self, connector_role_inline_policy, connector_rol
         self.iam_helper.map_iam_role_to_backend_role(create_connector_role_arn)
         print('----------')
 
-        # 3. Create connector
+        # Step 3: Create connector
         print('Step 3: Create connector in OpenSearch')
         # When you create an IAM role, it can take some time for the changes to propagate across AWS systems.
         # During this time, some services might not immediately recognize the new role or its permissions.
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
index 9f0d85f6..e39968b0 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
@@ -187,4 +187,14 @@ def map_iam_role_to_backend_role(self, iam_role_arn):
             print(f"Successfully mapped IAM role to OpenSearch role '{os_security_role}'.")
         else:
             print(f"Failed to map IAM role to OpenSearch role '{os_security_role}'. Status code: {response.status_code}")
-            print(f"Response: {response.text}")
\ No newline at end of file
+            print(f"Response: {response.text}")
+
+    def get_iam_user_name_from_arn(self, iam_principal_arn):
+        """
+        Extract the IAM user name from the IAM principal ARN.
+        """
+        # IAM user ARN format: arn:aws:iam::123456789012:user/user-name
+        if iam_principal_arn and ':user/' in iam_principal_arn:
+            return iam_principal_arn.split(':user/')[-1]
+        else:
+            return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
new file mode 100644
index 00000000..0b63787e
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
@@ -0,0 +1,152 @@
+# BedrockModel.py
+
+import json
+from colorama import Fore, Style
+
+class BedrockModel:
+    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+        """
+        Initializes the BedrockModel with necessary configurations.
+        
+        Args:
+            aws_region (str): AWS region.
+            opensearch_domain_name (str): OpenSearch domain name.
+            opensearch_username (str): OpenSearch username.
+            opensearch_password (str): OpenSearch password.
+            iam_role_helper (IAMRoleHelper): Instance of IAMRoleHelper.
+        """
+        self.aws_region = aws_region
+        self.opensearch_domain_name = opensearch_domain_name
+        self.opensearch_username = opensearch_username
+        self.opensearch_password = opensearch_password
+        self.iam_role_helper = iam_role_helper
+
+    def register_bedrock_model(self, helper, config, save_config_method):
+        """
+        Register a Managed Bedrock embedding model by creating the necessary connector and model in OpenSearch.
+
+        Args:
+            helper (AIConnectorHelper): Instance of AIConnectorHelper.
+            config (dict): Configuration dictionary.
+            save_config_method (function): Method to save the configuration.
+        """
+        # Prompt for necessary inputs
+        bedrock_region = input(f"Enter your Bedrock region [{self.aws_region}]: ") or self.aws_region
+        connector_role_name = "my_test_bedrock_connector_role"
+        create_connector_role_name = "my_test_create_bedrock_connector_role"
+
+        # Set up connector role inline policy
+        connector_role_inline_policy = {
+            "Version": "2012-10-17",
+            "Statement": [
+                {
+                    "Action": ["bedrock:InvokeModel"],
+                    "Effect": "Allow",
+                    "Resource": "arn:aws:bedrock:*::foundation-model/amazon.titan-embed-text-v1"
+                }
+            ]
+        }
+
+        # Default connector input
+        default_connector_input = {
+            "name": "Amazon Bedrock Connector: titan embedding v1",
+            "description": "The connector to Bedrock Titan embedding model",
+            "version": 1,
+            "protocol": "aws_sigv4",
+            "parameters": {
+                "region": bedrock_region,
+                "service_name": "bedrock"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "url": f"https://bedrock-runtime.{bedrock_region}.amazonaws.com/model/amazon.titan-embed-text-v1/invoke",
+                    "headers": {
+                        "content-type": "application/json",
+                        "x-amz-content-sha256": "required"
+                    },
+                    "request_body": "{ \"inputText\": \"${parameters.inputText}\" }",
+                    "pre_process_function": "\n    StringBuilder builder = new StringBuilder();\n    builder.append(\"\\\"\");\n    String first = params.text_docs[0];\n    builder.append(first);\n    builder.append(\"\\\"\");\n    def parameters = \"{\" +\"\\\"inputText\\\":\" + builder + \"}\";\n    return  \"{\" +\"\\\"parameters\\\":\" + parameters + \"}\";",
+                    "post_process_function": "\n      def name = \"sentence_embedding\";\n      def dataType = \"FLOAT32\";\n      if (params.embedding == null || params.embedding.length == 0) {\n        return params.message;\n      }\n      def shape = [params.embedding.length];\n      def json = \"{\" +\n                 \"\\\"name\\\":\\\"\" + name + \"\\\",\" +\n                 \"\\\"data_type\\\":\\\"\" + dataType + \"\\\",\" +\n                 \"\\\"shape\\\":\" + shape + \",\" +\n                 \"\\\"data\\\":\" + params.embedding +\n                 \"}\";\n      return json;\n    "
+                }
+            ]
+        }
+
+        # Get model details from user
+        create_connector_input = self.get_custom_model_details(default_connector_input)
+        if not create_connector_input:
+            return  # Abort if no valid input
+
+        # Create connector
+        print("Creating Bedrock connector...")
+        connector_id = helper.create_connector_with_role(
+            connector_role_inline_policy,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print(f"{Fore.RED}Failed to create Bedrock connector. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Register model
+        print("Registering Bedrock model...")
+        model_name = create_connector_input.get('name', 'Bedrock embedding model')
+        description = create_connector_input.get('description', 'Bedrock embedding model for semantic search')
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print(f"{Fore.RED}Failed to create Bedrock model. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Save model_id to config
+        self.save_model_id(config, save_config_method, model_id)
+        print(f"{Fore.GREEN}Bedrock model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
+
+    def save_model_id(self, config, save_config_method, model_id):
+        """
+        Save the model ID to the configuration.
+
+        Args:
+            config (dict): Configuration dictionary.
+            save_config_method (function): Method to save the configuration.
+            model_id (str): The model ID to save.
+        """
+        config['embedding_model_id'] = model_id
+        save_config_method(config)
+
+    def get_custom_model_details(self, default_input):
+        """
+        Prompt the user to enter custom model details or use default.
+        Returns a dictionary with the model details.
+
+        Args:
+            default_input (dict): Default model configuration.
+
+        Returns:
+            dict or None: Custom or default model configuration, or None if invalid input.
+        """
+        print("\nDo you want to use the default configuration or provide custom model settings?")
+        print("1. Use default configuration")
+        print("2. Provide custom model settings")
+        choice = input("Enter your choice (1-2): ").strip()
+
+        if choice == '1':
+            return default_input
+        elif choice == '2':
+            print("Please enter your model details as a JSON object.")
+            print("Example:")
+            print(json.dumps(default_input, indent=2))
+            json_input = input("Enter your JSON object: ").strip()
+            try:
+                custom_details = json.loads(json_input)
+                return custom_details
+            except json.JSONDecodeError as e:
+                print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
+                return None
+        else:
+            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
new file mode 100644
index 00000000..ef84362d
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
@@ -0,0 +1,318 @@
+# CohereModel.py
+import json
+from colorama import Fore, Style
+import time
+class CohereModel:
+    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+        """
+        Initializes the CohereModel with necessary configurations.
+        
+        Args:
+            aws_region (str): AWS region.
+            opensearch_domain_name (str): OpenSearch domain name.
+            opensearch_username (str): OpenSearch username.
+            opensearch_password (str): OpenSearch password.
+            iam_role_helper (IAMRoleHelper): Instance of IAMRoleHelper.
+        """
+        self.aws_region = aws_region
+        self.opensearch_domain_name = opensearch_domain_name
+        self.opensearch_username = opensearch_username
+        self.opensearch_password = opensearch_password
+        self.iam_role_helper = iam_role_helper
+
+    def register_cohere_model(self, helper, config, save_config_method):
+        """
+        Register a Managed Cohere embedding model by creating the necessary connector and model in OpenSearch.
+
+        Args:
+            helper (AIConnectorHelper): Instance of AIConnectorHelper.
+            config (dict): Configuration dictionary.
+            save_config_method (function): Method to save the configuration.
+        """
+        # Prompt for necessary inputs
+        secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
+        secret_key = 'cohere_api_key'
+        cohere_api_key = input("Enter your Cohere API key: ")
+        secret_value = {secret_key: cohere_api_key}
+
+        connector_role_name = "my_test_cohere_connector_role"
+        create_connector_role_name = "my_test_create_cohere_connector_role"
+
+        # Default connector input
+        default_connector_input = {
+            "name": "Cohere Embedding Model Connector",
+            "description": "Connector for Cohere embedding model",
+            "version": "1.0",
+            "protocol": "http",
+            "parameters": {
+                "model": "embed-english-v3.0",
+                "input_type": "search_document",
+                "truncate": "END"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "url": "https://api.cohere.ai/v1/embed",
+                    "headers": {
+                        "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
+                        "Request-Source": "unspecified:opensearch"
+                    },
+                    "request_body": "{ \"texts\": ${parameters.texts}, \"truncate\": \"${parameters.truncate}\", \"model\": \"${parameters.model}\", \"input_type\": \"${parameters.input_type}\" }",
+                    "pre_process_function": "connector.pre_process.cohere.embedding",
+                    "post_process_function": "connector.post_process.cohere.embedding"
+                }
+            ]
+        }
+
+        # Get model details from user
+        create_connector_input = self.get_custom_model_details(default_connector_input)
+        if not create_connector_input:
+            return  # Abort if no valid input
+
+        # Create connector
+        connector_id = helper.create_connector_with_secret(
+            secret_name,
+            secret_value,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Register model
+        model_name = create_connector_input.get('name', 'Cohere embedding model')
+        description = create_connector_input.get('description', 'Cohere embedding model for semantic search')
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Save model_id to config
+        config['embedding_model_id'] = model_id
+        save_config_method(config)
+        print(f"{Fore.GREEN}Cohere model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
+
+    def register_cohere_model_opensource(self, opensearch_client, config, save_config_method):
+        """
+        Register a Cohere embedding model in open-source OpenSearch.
+
+        Args:
+            opensearch_client: OpenSearch client instance.
+            config (dict): Configuration dictionary.
+            save_config_method (function): Method to save the configuration.
+        """
+        cohere_api_key = input("Enter your Cohere API key: ").strip()
+        if not cohere_api_key:
+            print(f"{Fore.RED}API key is required. Aborting.{Style.RESET_ALL}")
+            return
+
+        print("\nDo you want to use the default configuration or provide custom settings?")
+        print("1. Use default configuration")
+        print("2. Provide custom settings")
+        config_choice = input("Enter your choice (1-2): ").strip()
+
+        if config_choice == '1':
+            # Use default configurations
+            connector_payload = {
+                "name": "Cohere Embedding Connector",
+                "description": "Connector for Cohere embedding model",
+                "version": "1.0",
+                "protocol": "http",
+                "parameters": {
+                    "model": "embed-english-v3.0",
+                    "input_type": "search_document",
+                    "truncate": "END"
+                },
+                "credential": {
+                    "cohere_key": cohere_api_key
+                },
+                "actions": [
+                    {
+                        "action_type": "predict",
+                        "method": "POST",
+                        "url": "https://api.cohere.ai/v1/embed",
+                        "headers": {
+                            "Authorization": "Bearer ${credential.cohere_key}",
+                            "Request-Source": "unspecified:opensearch"
+                        },
+                        "request_body": "{ \"texts\": ${parameters.texts}, \"truncate\": \"${parameters.truncate}\", \"model\": \"${parameters.model}\", \"input_type\": \"${parameters.input_type}\" }",
+                        "pre_process_function": "connector.pre_process.cohere.embedding",
+                        "post_process_function": "connector.post_process.cohere.embedding"
+                    }
+                ]
+            }
+            model_group_payload = {
+                "name": f"cohere_model_group_{int(time.time())}",
+                "description": "Model group for Cohere models"
+            }
+        elif config_choice == '2':
+            # Get custom configurations
+            print("\nPlease enter your connector details as a JSON object.")
+            connector_payload = self.get_custom_json_input()
+            if not connector_payload:
+                return
+
+            print("\nPlease enter your model group details as a JSON object.")
+            model_group_payload = self.get_custom_json_input()
+            if not model_group_payload:
+                return
+        else:
+            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            return
+
+        # Register the connector
+        try:
+            connector_response = opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/connectors/_create",
+                body=connector_payload
+            )
+            connector_id = connector_response.get('connector_id')
+            if not connector_id:
+                print(f"{Fore.RED}Failed to register connector. Response: {connector_response}{Style.RESET_ALL}")
+                return
+            print(f"{Fore.GREEN}Connector registered successfully. Connector ID: {connector_id}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error registering connector: {ex}{Style.RESET_ALL}")
+            return
+
+        # Create model group
+        try:
+            model_group_response = opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/model_groups/_register",
+                body=model_group_payload
+            )
+            model_group_id = model_group_response.get('model_group_id')
+            if not model_group_id:
+                print(f"{Fore.RED}Failed to create model group. Response: {model_group_response}{Style.RESET_ALL}")
+                return
+            print(f"{Fore.GREEN}Model group created successfully. Model Group ID: {model_group_id}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error creating model group: {ex}{Style.RESET_ALL}")
+            if 'illegal_argument_exception' in str(ex) and 'already being used' in str(ex):
+                print(f"{Fore.YELLOW}A model group with this name already exists. Using the existing group.{Style.RESET_ALL}")
+                model_group_id = str(ex).split('ID: ')[-1].strip("'.")
+            else:
+                return
+
+        # Create model payload
+        model_payload = {
+            "name": connector_payload.get('name', 'Cohere embedding model'),
+            "function_name": "REMOTE",
+            "model_group_id": model_group_id,
+            "description": connector_payload.get('description', 'Cohere embedding model for semantic search'),
+            "connector_id": connector_id
+        }
+
+        # Register the model
+        try:
+            response = opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/models/_register",
+                body=model_payload
+            )
+            task_id = response.get('task_id')
+            if task_id:
+                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+                # Wait for the task to complete and retrieve the model_id
+                model_id = self.wait_for_model_registration(opensearch_client, task_id)
+                if model_id:
+                    # Deploy the model
+                    deploy_response = opensearch_client.transport.perform_request(
+                        method="POST",
+                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    )
+                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
+                    config['embedding_model_id'] = model_id
+                    save_config_method(config)
+                else:
+                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+            else:
+                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
+
+    def get_custom_model_details(self, default_input):
+        """
+        Prompt the user to enter custom model details or use default.
+        Returns a dictionary with the model details.
+
+        Args:
+            default_input (dict): Default model configuration.
+
+        Returns:
+            dict or None: Custom or default model configuration, or None if invalid input.
+        """
+        print("\nDo you want to use the default configuration or provide custom model settings?")
+        print("1. Use default configuration")
+        print("2. Provide custom model settings")
+        choice = input("Enter your choice (1-2): ").strip()
+
+        if choice == '1':
+            return default_input
+        elif choice == '2':
+            print("Please enter your model details as a JSON object.")
+            print("Example:")
+            print(json.dumps(default_input, indent=2))
+            json_input = input("Enter your JSON object: ").strip()
+            try:
+                custom_details = json.loads(json_input)
+                return custom_details
+            except json.JSONDecodeError as e:
+                print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
+                return None
+        else:
+            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            return None
+
+    def get_custom_json_input(self):
+        """Helper method to get custom JSON input from the user."""
+        json_input = input("Enter your JSON object: ").strip()
+        try:
+            return json.loads(json_input)
+        except json.JSONDecodeError as e:
+            print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
+            return None
+
+    def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, interval=10):
+        """
+        Wait for the model registration task to complete and return the model_id.
+
+        Args:
+            opensearch_client: OpenSearch client instance.
+            task_id (str): Task ID to monitor.
+            timeout (int): Maximum time to wait in seconds.
+            interval (int): Time between status checks in seconds.
+
+        Returns:
+            str or None: The model ID if successful, else None.
+        """
+        end_time = time.time() + timeout
+        while time.time() < end_time:
+            try:
+                response = opensearch_client.transport.perform_request(
+                    method="GET",
+                    url=f"/_plugins/_ml/tasks/{task_id}"
+                )
+                state = response.get('state')
+                if state == 'COMPLETED':
+                    model_id = response.get('model_id')
+                    return model_id
+                elif state in ['FAILED', 'STOPPED']:
+                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
+                    return None
+                else:
+                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
+                    time.sleep(interval)
+            except Exception as ex:
+                print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
+                time.sleep(interval)
+        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
+        return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CustomPyTorchModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CustomPyTorchModel.py
new file mode 100644
index 00000000..6c6379f6
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CustomPyTorchModel.py
@@ -0,0 +1,181 @@
+# CustomPyTorchModel.py
+import json
+from colorama import Fore, Style
+import os
+import time
+
+class CustomPyTorchModel:
+    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+        """
+        Initializes the CustomPyTorchModel with necessary configurations.
+        
+        Args:
+            aws_region (str): AWS region.
+            opensearch_domain_name (str): OpenSearch domain name.
+            opensearch_username (str): OpenSearch username.
+            opensearch_password (str): OpenSearch password.
+            iam_role_helper (IAMRoleHelper): Instance of IAMRoleHelper.
+        """
+        self.aws_region = aws_region
+        self.opensearch_domain_name = opensearch_domain_name
+        self.opensearch_username = opensearch_username
+        self.opensearch_password = opensearch_password
+        self.iam_role_helper = iam_role_helper
+
+    def register_custom_pytorch_model(self, opensearch_client, config, save_config_method):
+        """
+        Register a custom PyTorch embedding model in open-source OpenSearch.
+
+        Args:
+            opensearch_client: OpenSearch client instance.
+            config (dict): Configuration dictionary.
+            save_config_method (function): Method to save the configuration.
+        """
+        print("\nDo you want to use the default configuration or provide custom settings?")
+        print("1. Use default configuration")
+        print("2. Provide custom settings")
+        config_choice = input("Enter your choice (1-2): ").strip()
+
+        if config_choice == '1':
+            # Use default configurations
+            model_path = input("Enter the path to your PyTorch model file (.pt or .pth): ").strip()
+            if not os.path.isfile(model_path):
+                print(f"{Fore.RED}Model file not found at '{model_path}'. Aborting.{Style.RESET_ALL}")
+                return
+
+            model_name = os.path.basename(model_path).split('.')[0]
+            model_payload = {
+                "name": f"custom_pytorch_{model_name}",
+                "model_format": "TORCH_SCRIPT",
+                "model_config": {
+                    "embedding_dimension": config.get('embedding_dimension', 768),
+                    "framework_type": "CUSTOM",
+                    "model_type": "bert"
+                },
+                "description": f"Custom PyTorch model: {model_name}"
+            }
+        elif config_choice == '2':
+            # Get custom configurations
+            model_path = input("Enter the path to your PyTorch model file (.pt or .pth): ").strip()
+            if not os.path.isfile(model_path):
+                print(f"{Fore.RED}Model file not found at '{model_path}'. Aborting.{Style.RESET_ALL}")
+                return
+
+            print("\nPlease enter your model details as a JSON object.")
+            print("Example:")
+            example_payload = {
+                "name": "custom_pytorch_model",
+                "model_format": "TORCH_SCRIPT",
+                "model_config": {
+                    "embedding_dimension": config.get('embedding_dimension', 768),
+                    "framework_type": "CUSTOM",
+                    "model_type": "bert"
+                },
+                "description": "Custom PyTorch model for semantic search"
+            }
+            print(json.dumps(example_payload, indent=2))
+            
+            model_payload = self.get_custom_json_input()
+            if not model_payload:
+                return
+        else:
+            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            return
+
+        # Upload the model file to OpenSearch
+        try:
+            with open(model_path, 'rb') as f:
+                model_content = f.read()
+
+            # Use the ML plugin's model upload API
+            upload_response = opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/models/_upload",
+                params={"model_name": model_payload['name']},
+                body=model_content,
+                headers={'Content-Type': 'application/octet-stream'}
+            )
+            if 'model_id' not in upload_response:
+                print(f"{Fore.RED}Failed to upload model. Response: {upload_response}{Style.RESET_ALL}")
+                return
+            model_id = upload_response['model_id']
+            print(f"{Fore.GREEN}Model uploaded successfully. Model ID: {model_id}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error uploading model: {ex}{Style.RESET_ALL}")
+            return
+
+        # Add the model_id to the payload
+        model_payload['model_id'] = model_id
+
+        # Register the model
+        try:
+            response = opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/models/_register",
+                body=model_payload
+            )
+            task_id = response.get('task_id')
+            if task_id:
+                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+                # Wait for the task to complete and retrieve the model_id
+                registered_model_id = self.wait_for_model_registration(opensearch_client, task_id)
+                if registered_model_id:
+                    # Deploy the model
+                    deploy_response = opensearch_client.transport.perform_request(
+                        method="POST",
+                        url=f"/_plugins/_ml/models/{registered_model_id}/_deploy"
+                    )
+                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {registered_model_id}{Style.RESET_ALL}")
+                    config['embedding_model_id'] = registered_model_id
+                    save_config_method(config)
+                else:
+                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+            else:
+                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
+
+    def get_custom_json_input(self):
+        """Helper method to get custom JSON input from the user."""
+        json_input = input("Enter your JSON object: ").strip()
+        try:
+            return json.loads(json_input)
+        except json.JSONDecodeError as e:
+            print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
+            return None
+
+    def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, interval=10):
+        """
+        Wait for the model registration task to complete and return the model_id.
+
+        Args:
+            opensearch_client: OpenSearch client instance.
+            task_id (str): Task ID to monitor.
+            timeout (int): Maximum time to wait in seconds.
+            interval (int): Time between status checks in seconds.
+
+        Returns:
+            str or None: The model ID if successful, else None.
+        """
+        end_time = time.time() + timeout
+        while time.time() < end_time:
+            try:
+                response = opensearch_client.transport.perform_request(
+                    method="GET",
+                    url=f"/_plugins/_ml/tasks/{task_id}"
+                )
+                state = response.get('state')
+                if state == 'COMPLETED':
+                    model_id = response.get('model_id')
+                    return model_id
+                elif state in ['FAILED', 'STOPPED']:
+                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
+                    return None
+                else:
+                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
+                    time.sleep(interval)
+            except Exception as ex:
+                print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
+                time.sleep(interval)
+        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
+        return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
new file mode 100644
index 00000000..77765845
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
@@ -0,0 +1,152 @@
+# HuggingFaceModel.py
+import json
+from colorama import Fore, Style
+import time
+
+class HuggingFaceModel:
+    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+        """
+        Initializes the HuggingFaceModel with necessary configurations.
+        
+        Args:
+            aws_region (str): AWS region.
+            opensearch_domain_name (str): OpenSearch domain name.
+            opensearch_username (str): OpenSearch username.
+            opensearch_password (str): OpenSearch password.
+            iam_role_helper (IAMRoleHelper): Instance of IAMRoleHelper.
+        """
+        self.aws_region = aws_region
+        self.opensearch_domain_name = opensearch_domain_name
+        self.opensearch_username = opensearch_username
+        self.opensearch_password = opensearch_password
+        self.iam_role_helper = iam_role_helper
+
+    def register_huggingface_model(self, opensearch_client, config, save_config_method):
+        """
+        Register a Hugging Face Transformers embedding model in open-source OpenSearch.
+
+        Args:
+            opensearch_client: OpenSearch client instance.
+            config (dict): Configuration dictionary.
+            save_config_method (function): Method to save the configuration.
+        """
+        print("\nDo you want to use the default configuration or provide custom settings?")
+        print("1. Use default configuration")
+        print("2. Provide custom settings")
+        config_choice = input("Enter your choice (1-2): ").strip()
+
+        if config_choice == '1':
+            # Use default configurations
+            model_name = "sentence-transformers/all-MiniLM-L6-v2"
+            model_payload = {
+                "name": f"huggingface_{model_name.split('/')[-1]}",
+                "model_format": "TORCH_SCRIPT",
+                "model_config": {
+                    "embedding_dimension": config.get('embedding_dimension', 768),
+                    "framework_type": "SENTENCE_TRANSFORMERS",
+                    "model_type": "bert",
+                    "embedding_model": model_name
+                },
+                "description": f"Hugging Face Transformers model: {model_name}"
+            }
+        elif config_choice == '2':
+            # Get custom configurations
+            model_name = input("Enter the Hugging Face model ID (e.g., 'sentence-transformers/all-MiniLM-L6-v2'): ").strip()
+            if not model_name:
+                print(f"{Fore.RED}Model ID is required. Aborting.{Style.RESET_ALL}")
+                return
+
+            print("\nPlease enter your model details as a JSON object.")
+            print("Example:")
+            example_payload = {
+                "name": f"huggingface_{model_name.split('/')[-1]}",
+                "model_format": "TORCH_SCRIPT",
+                "model_config": {
+                    "embedding_dimension": config.get('embedding_dimension', 768),
+                    "framework_type": "SENTENCE_TRANSFORMERS",
+                    "model_type": "bert",
+                    "embedding_model": model_name
+                },
+                "description": f"Hugging Face Transformers model: {model_name}"
+            }
+            print(json.dumps(example_payload, indent=2))
+            
+            model_payload = self.get_custom_json_input()
+            if not model_payload:
+                return
+        else:
+            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            return
+
+        # Register the model
+        try:
+            response = opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/models/_register",
+                body=model_payload
+            )
+            task_id = response.get('task_id')
+            if task_id:
+                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+                # Wait for the task to complete and retrieve the model_id
+                model_id = self.wait_for_model_registration(opensearch_client, task_id)
+                if model_id:
+                    # Deploy the model
+                    deploy_response = opensearch_client.transport.perform_request(
+                        method="POST",
+                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    )
+                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
+                    config['embedding_model_id'] = model_id
+                    save_config_method(config)
+                else:
+                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+            else:
+                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
+
+    def get_custom_json_input(self):
+        """Helper method to get custom JSON input from the user."""
+        json_input = input("Enter your JSON object: ").strip()
+        try:
+            return json.loads(json_input)
+        except json.JSONDecodeError as e:
+            print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
+            return None
+
+    def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, interval=10):
+        """
+        Wait for the model registration task to complete and return the model_id.
+
+        Args:
+            opensearch_client: OpenSearch client instance.
+            task_id (str): Task ID to monitor.
+            timeout (int): Maximum time to wait in seconds.
+            interval (int): Time between status checks in seconds.
+
+        Returns:
+            str or None: The model ID if successful, else None.
+        """
+        end_time = time.time() + timeout
+        while time.time() < end_time:
+            try:
+                response = opensearch_client.transport.perform_request(
+                    method="GET",
+                    url=f"/_plugins/_ml/tasks/{task_id}"
+                )
+                state = response.get('state')
+                if state == 'COMPLETED':
+                    model_id = response.get('model_id')
+                    return model_id
+                elif state in ['FAILED', 'STOPPED']:
+                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
+                    return None
+                else:
+                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
+                    time.sleep(interval)
+            except Exception as ex:
+                print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
+                time.sleep(interval)
+        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
+        return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
new file mode 100644
index 00000000..1fc8a937
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
@@ -0,0 +1,315 @@
+# OpenAIModel.py
+import json
+from colorama import Fore, Style
+import time
+
+class OpenAIModel:
+    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+        """
+        Initializes the OpenAIModel with necessary configurations.
+        
+        Args:
+            aws_region (str): AWS region.
+            opensearch_domain_name (str): OpenSearch domain name.
+            opensearch_username (str): OpenSearch username.
+            opensearch_password (str): OpenSearch password.
+            iam_role_helper (IAMRoleHelper): Instance of IAMRoleHelper.
+        """
+        self.aws_region = aws_region
+        self.opensearch_domain_name = opensearch_domain_name
+        self.opensearch_username = opensearch_username
+        self.opensearch_password = opensearch_password
+        self.iam_role_helper = iam_role_helper
+
+    def register_openai_model(self, helper, config, save_config_method):
+        """
+        Register a Managed OpenAI embedding model by creating the necessary connector and model in OpenSearch.
+
+        Args:
+            helper (AIConnectorHelper): Instance of AIConnectorHelper.
+            config (dict): Configuration dictionary.
+            save_config_method (function): Method to save the configuration.
+        """
+        # Prompt for necessary inputs
+        secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
+        secret_key = 'openai_api_key'
+        openai_api_key = input("Enter your OpenAI API key: ")
+        secret_value = {secret_key: openai_api_key}
+
+        connector_role_name = "my_test_openai_connector_role"
+        create_connector_role_name = "my_test_create_openai_connector_role"
+
+        # Default connector input
+        default_connector_input = {
+            "name": "OpenAI Embedding Model Connector",
+            "description": "Connector for OpenAI embedding model",
+            "version": "1.0",
+            "protocol": "http",
+            "parameters": {
+                "model": "text-embedding-ada-002"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "url": "https://api.openai.com/v1/embeddings",
+                    "headers": {
+                        "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
+                        "Content-Type": "application/json"
+                    },
+                    "request_body": "{ \"input\": ${parameters.input}, \"model\": \"${parameters.model}\" }",
+                    "pre_process_function": "connector.pre_process.openai.embedding",
+                    "post_process_function": "connector.post_process.openai.embedding"
+                }
+            ]
+        }
+
+        # Get model details from user
+        create_connector_input = self.get_custom_model_details(default_connector_input)
+        if not create_connector_input:
+            return  # Abort if no valid input
+
+        # Create connector
+        connector_id = helper.create_connector_with_secret(
+            secret_name,
+            secret_value,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Register model
+        model_name = create_connector_input.get('name', 'OpenAI embedding model')
+        description = create_connector_input.get('description', 'OpenAI embedding model for semantic search')
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Save model_id to config
+        config['embedding_model_id'] = model_id
+        save_config_method(config)
+        print(f"{Fore.GREEN}OpenAI model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
+
+    def register_openai_model_opensource(self, opensearch_client, config, save_config_method):
+        """
+        Register an OpenAI embedding model in open-source OpenSearch.
+
+        Args:
+            opensearch_client: OpenSearch client instance.
+            config (dict): Configuration dictionary.
+            save_config_method (function): Method to save the configuration.
+        """
+        openai_api_key = input("Enter your OpenAI API key: ").strip()
+        if not openai_api_key:
+            print(f"{Fore.RED}API key is required. Aborting.{Style.RESET_ALL}")
+            return
+
+        print("\nDo you want to use the default configuration or provide custom settings?")
+        print("1. Use default configuration")
+        print("2. Provide custom settings")
+        config_choice = input("Enter your choice (1-2): ").strip()
+
+        if config_choice == '1':
+            # Use default configurations
+            connector_payload = {
+                "name": "OpenAI Embedding Connector",
+                "description": "Connector for OpenAI embedding model",
+                "version": "1",
+                "protocol": "http",
+                "parameters": {
+                    "model": "text-embedding-ada-002"
+                },
+                "credential": {
+                    "openAI_key": openai_api_key
+                },
+                "actions": [
+                    {
+                        "action_type": "predict",
+                        "method": "POST",
+                        "url": "https://api.openai.com/v1/embeddings",
+                        "headers": {
+                            "Authorization": "Bearer ${credential.openAI_key}",
+                            "Content-Type": "application/json"
+                        },
+                        "request_body": "{ \"input\": ${parameters.input}, \"model\": \"${parameters.model}\" }",
+                        "pre_process_function": "connector.pre_process.openai.embedding",
+                        "post_process_function": "connector.post_process.openai.embedding"
+                    }
+                ]
+            }
+            model_group_payload = {
+                "name": f"openai_model_group_{int(time.time())}",
+                "description": "Model group for OpenAI models"
+            }
+        elif config_choice == '2':
+            # Get custom configurations
+            print("\nPlease enter your connector details as a JSON object.")
+            connector_payload = self.get_custom_json_input()
+            if not connector_payload:
+                return
+
+            print("\nPlease enter your model group details as a JSON object.")
+            model_group_payload = self.get_custom_json_input()
+            if not model_group_payload:
+                return
+        else:
+            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            return
+
+        # Register the connector
+        try:
+            connector_response = opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/connectors/_create",
+                body=connector_payload
+            )
+            connector_id = connector_response.get('connector_id')
+            if not connector_id:
+                print(f"{Fore.RED}Failed to register connector. Response: {connector_response}{Style.RESET_ALL}")
+                return
+            print(f"{Fore.GREEN}Connector registered successfully. Connector ID: {connector_id}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error registering connector: {ex}{Style.RESET_ALL}")
+            return
+
+        # Create model group
+        try:
+            model_group_response = opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/model_groups/_register",
+                body=model_group_payload
+            )
+            model_group_id = model_group_response.get('model_group_id')
+            if not model_group_id:
+                print(f"{Fore.RED}Failed to create model group. Response: {model_group_response}{Style.RESET_ALL}")
+                return
+            print(f"{Fore.GREEN}Model group created successfully. Model Group ID: {model_group_id}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error creating model group: {ex}{Style.RESET_ALL}")
+            if 'illegal_argument_exception' in str(ex) and 'already being used' in str(ex):
+                print(f"{Fore.YELLOW}A model group with this name already exists. Using the existing group.{Style.RESET_ALL}")
+                model_group_id = str(ex).split('ID: ')[-1].strip("'.")
+            else:
+                return
+
+        # Create model payload
+        model_payload = {
+            "name": connector_payload.get('name', 'OpenAI embedding model'),
+            "function_name": "REMOTE",
+            "model_group_id": model_group_id,
+            "description": connector_payload.get('description', 'OpenAI embedding model for semantic search'),
+            "connector_id": connector_id
+        }
+
+        # Register the model
+        try:
+            response = opensearch_client.transport.perform_request(
+                method="POST",
+                url="/_plugins/_ml/models/_register",
+                body=model_payload
+            )
+            task_id = response.get('task_id')
+            if task_id:
+                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+                # Wait for the task to complete and retrieve the model_id
+                model_id = self.wait_for_model_registration(opensearch_client, task_id)
+                if model_id:
+                    # Deploy the model
+                    deploy_response = opensearch_client.transport.perform_request(
+                        method="POST",
+                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    )
+                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
+                    config['embedding_model_id'] = model_id
+                    save_config_method(config)
+                else:
+                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+            else:
+                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
+
+    def get_custom_model_details(self, default_input):
+        """
+        Prompt the user to enter custom model details or use default.
+        Returns a dictionary with the model details.
+
+        Args:
+            default_input (dict): Default model configuration.
+
+        Returns:
+            dict or None: Custom or default model configuration, or None if invalid input.
+        """
+        print("\nDo you want to use the default configuration or provide custom model settings?")
+        print("1. Use default configuration")
+        print("2. Provide custom model settings")
+        choice = input("Enter your choice (1-2): ").strip()
+
+        if choice == '1':
+            return default_input
+        elif choice == '2':
+            print("Please enter your model details as a JSON object.")
+            print("Example:")
+            print(json.dumps(default_input, indent=2))
+            json_input = input("Enter your JSON object: ").strip()
+            try:
+                custom_details = json.loads(json_input)
+                return custom_details
+            except json.JSONDecodeError as e:
+                print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
+                return None
+        else:
+            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            return None
+
+    def get_custom_json_input(self):
+        """Helper method to get custom JSON input from the user."""
+        json_input = input("Enter your JSON object: ").strip()
+        try:
+            return json.loads(json_input)
+        except json.JSONDecodeError as e:
+            print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
+            return None
+
+    def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, interval=10):
+        """
+        Wait for the model registration task to complete and return the model_id.
+
+        Args:
+            opensearch_client: OpenSearch client instance.
+            task_id (str): Task ID to monitor.
+            timeout (int): Maximum time to wait in seconds.
+            interval (int): Time between status checks in seconds.
+
+        Returns:
+            str or None: The model ID if successful, else None.
+        """
+        end_time = time.time() + timeout
+        while time.time() < end_time:
+            try:
+                response = opensearch_client.transport.perform_request(
+                    method="GET",
+                    url=f"/_plugins/_ml/tasks/{task_id}"
+                )
+                state = response.get('state')
+                if state == 'COMPLETED':
+                    model_id = response.get('model_id')
+                    return model_id
+                elif state in ['FAILED', 'STOPPED']:
+                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
+                    return None
+                else:
+                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
+                    time.sleep(interval)
+            except Exception as ex:
+                print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
+                time.sleep(interval)
+        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
+        return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
new file mode 100644
index 00000000..3288a8a2
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
@@ -0,0 +1,101 @@
+# SageMakerModel.py
+import json
+from colorama import Fore, Style
+
+class SageMakerModel:
+    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+        """
+        Initializes the SageMakerModel with necessary configurations.
+        
+        Args:
+            aws_region (str): AWS region.
+            opensearch_domain_name (str): OpenSearch domain name.
+            opensearch_username (str): OpenSearch username.
+            opensearch_password (str): OpenSearch password.
+            iam_role_helper (IAMRoleHelper): Instance of IAMRoleHelper.
+        """
+        self.aws_region = aws_region
+        self.opensearch_domain_name = opensearch_domain_name
+        self.opensearch_username = opensearch_username
+        self.opensearch_password = opensearch_password
+        self.iam_role_helper = iam_role_helper
+
+    def register_sagemaker_model(self, helper, config, save_config_method):
+        """
+        Register a SageMaker embedding model by creating the necessary connector and model in OpenSearch.
+
+        Args:
+            helper (AIConnectorHelper): Instance of AIConnectorHelper.
+            config (dict): Configuration dictionary.
+            save_config_method (function): Method to save the configuration.
+        """
+        # Prompt for necessary inputs
+        sagemaker_endpoint_arn = input("Enter your SageMaker inference endpoint ARN: ").strip()
+        sagemaker_endpoint_url = input("Enter your SageMaker inference endpoint URL: ").strip()
+        sagemaker_region = input(f"Enter your SageMaker region [{self.aws_region}]: ").strip() or self.aws_region
+        connector_role_name = "my_test_sagemaker_connector_role"
+        create_connector_role_name = "my_test_create_sagemaker_connector_role"
+
+        # Set up connector role inline policy
+        connector_role_inline_policy = {
+            "Version": "2012-10-17",
+            "Statement": [
+                {
+                    "Action": ["sagemaker:InvokeEndpoint"],
+                    "Effect": "Allow",
+                    "Resource": sagemaker_endpoint_arn
+                }
+            ]
+        }
+
+        # Create connector input
+        create_connector_input = {
+            "name": "SageMaker Embedding Model Connector",
+            "description": "Connector for SageMaker embedding model",
+            "version": "1.0",
+            "protocol": "aws_sigv4",
+            "parameters": {
+                "region": sagemaker_region,
+                "service_name": "sagemaker"
+            },
+            "actions": [
+                {
+                    "action_type": "predict",
+                    "method": "POST",
+                    "headers": {
+                        "Content-Type": "application/json"
+                    },
+                    "url": sagemaker_endpoint_url,
+                    "request_body": "${parameters.input}",
+                    "pre_process_function": "connector.pre_process.default.embedding",
+                    "post_process_function": "connector.post_process.default.embedding"
+                }
+            ]
+        }
+
+        # Create connector
+        connector_id = helper.create_connector_with_role(
+            connector_role_inline_policy,
+            connector_role_name,
+            create_connector_role_name,
+            create_connector_input,
+            sleep_time_in_seconds=10
+        )
+
+        if not connector_id:
+            print(f"{Fore.RED}Failed to create SageMaker connector. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Register model
+        model_name = "SageMaker Embedding Model"
+        description = "SageMaker embedding model for semantic search"
+        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+
+        if not model_id:
+            print(f"{Fore.RED}Failed to create SageMaker model. Aborting.{Style.RESET_ALL}")
+            return
+
+        # Save model_id to config
+        config['embedding_model_id'] = model_id
+        save_config_method(config)
+        print(f"{Fore.GREEN}SageMaker model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/base_model.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/base_model.py
new file mode 100644
index 00000000..7ca846a1
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/base_model.py
@@ -0,0 +1,12 @@
+# models/base_model.py
+
+from abc import ABC, abstractmethod
+
+class BaseModelRegister(ABC):
+    def __init__(self, config, helper):
+        self.config = config
+        self.helper = helper
+
+    @abstractmethod
+    def register_model(self):
+        pass
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
index 876c22d4..bd42276b 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
@@ -1,3 +1,4 @@
+# ModelRegister.py
 # SPDX-License-Identifier: Apache-2.0
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
@@ -24,14 +25,19 @@
 #  under the License.
 
 
-
 import os
 import json
 import time
 import boto3
 from urllib.parse import urlparse
 from colorama import Fore, Style, init
-from AIConnectorHelper import AIConnectorHelper  # Ensure this module is accessible
+from AIConnectorHelper import AIConnectorHelper
+from IAMRoleHelper import IAMRoleHelper
+from ml_models.BedrockModel import BedrockModel
+from ml_models.OpenAIModel import OpenAIModel
+from ml_models.CohereModel import CohereModel
+from ml_models.HuggingFaceModel import HuggingFaceModel
+from ml_models.CustomPyTorchModel import CustomPyTorchModel
 import sys
 
 init(autoreset=True)
@@ -48,9 +54,50 @@ def __init__(self, config, opensearch_client, opensearch_domain_name):
         self.iam_principal = config.get('iam_principal')
         self.embedding_dimension = int(config.get('embedding_dimension', 768))
         self.service_type = config.get('service_type', 'managed')
-        self.bedrock_client = None
+        self.iam_role_helper = IAMRoleHelper(
+            self.aws_region,
+            self.opensearch_domain_name,
+            self.opensearch_username,
+            self.opensearch_password,
+            self.iam_principal
+        )
         if self.service_type != 'open-source':
             self.initialize_clients()
+        self.bedrock_model = BedrockModel(
+            aws_region=self.aws_region,
+            opensearch_domain_name=self.opensearch_domain_name,
+            opensearch_username=self.opensearch_username,
+            opensearch_password=self.opensearch_password,
+            iam_role_helper=self.iam_role_helper
+        )
+        self.openai_model = OpenAIModel(
+            aws_region=self.aws_region,
+            opensearch_domain_name=self.opensearch_domain_name,
+            opensearch_username=self.opensearch_username,
+            opensearch_password=self.opensearch_password,
+            iam_role_helper=self.iam_role_helper
+        )
+        self.cohere_model = CohereModel(
+            aws_region=self.aws_region,
+            opensearch_domain_name=self.opensearch_domain_name,
+            opensearch_username=self.opensearch_username,
+            opensearch_password=self.opensearch_password,
+            iam_role_helper=self.iam_role_helper
+        )
+        self.huggingface_model = HuggingFaceModel(
+            aws_region=self.aws_region,
+            opensearch_domain_name=self.opensearch_domain_name,
+            opensearch_username=self.opensearch_username,
+            opensearch_password=self.opensearch_password,
+            iam_role_helper=self.iam_role_helper
+        )
+        self.custom_pytorch_model = CustomPyTorchModel(
+            aws_region=self.aws_region,
+            opensearch_domain_name=self.opensearch_domain_name,
+            opensearch_username=self.opensearch_username,
+            opensearch_password=self.opensearch_password,
+            iam_role_helper=self.iam_role_helper
+        )
 
     def initialize_clients(self):
         # Initialize AWS clients only if necessary
@@ -91,33 +138,7 @@ def prompt_model_registration(self):
         else:
             print(f"{Fore.RED}Invalid choice. Please run setup again and select a valid option.{Style.RESET_ALL}")
             sys.exit(1)  # Exit the setup as we cannot proceed without a valid choice
-    def get_custom_model_details(self, default_input):
-        """
-        Prompt the user to enter custom model details or use default.
-        Returns a dictionary with the model details.
-        """
-        print("\nDo you want to use the default configuration or provide custom model settings?")
-        print("1. Use default configuration")
-        print("2. Provide custom model settings")
-        choice = input("Enter your choice (1-2): ").strip()
 
-        if choice == '1':
-            return default_input
-        elif choice == '2':
-            print("Please enter your model details as a JSON object.")
-            print("Example:")
-            print(json.dumps(default_input, indent=2))
-            json_input = input("Enter your JSON object: ").strip()
-            try:
-                custom_details = json.loads(json_input)
-                return custom_details
-            except json.JSONDecodeError as e:
-                print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
-                return None
-        else:
-            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
-            return None
-        
     def save_config(self, config):
         # Save configuration to the config file
         import configparser
@@ -141,7 +162,7 @@ def register_model_interactive(self):
             return
 
         # Extract the IAM user name from the IAM principal ARN
-        aws_user_name = self.get_iam_user_name_from_arn(self.iam_principal)
+        aws_user_name = self.iam_role_helper.get_iam_user_name_from_arn(self.iam_principal)
 
         if not aws_user_name:
             print("Could not extract IAM user name from IAM principal ARN.")
@@ -159,335 +180,40 @@ def register_model_interactive(self):
 
         # Prompt user to select a model
         print("Please select an embedding model to register:")
-        print("1. Bedrock Titan Embedding Model")
-        print("2. SageMaker Embedding Model")
+        print("1. Bedrock Embedding Model")
+        print("2. OpenAI Embedding Model")
         print("3. Cohere Embedding Model")
-        print("4. OpenAI Embedding Model")
-        model_choice = input("Enter your choice (1-4): ")
+        print("4. Hugging Face Transformers Model")
+        print("5. Custom PyTorch Model")
+        model_choice = input("Enter your choice (1-5): ")
 
         # Call the appropriate method based on the user's choice
         if model_choice == '1':
-            self.register_bedrock_model(helper)
+            self.bedrock_model.register_bedrock_model(helper, self.config, self.save_config)
         elif model_choice == '2':
-            self.register_sagemaker_model(helper)
+            if self.service_type != 'open-source':
+                self.openai_model.register_openai_model(helper, self.config, self.save_config)
+            else:
+                self.openai_model.register_openai_model_opensource(self.opensearch_client, self.config, self.save_config)
         elif model_choice == '3':
-            self.register_cohere_model(helper)
+            if self.service_type != 'open-source':
+                self.cohere_model.register_cohere_model(helper, self.config, self.save_config)
+            else:
+                self.cohere_model.register_cohere_model_opensource(self.opensearch_client, self.config, self.save_config)
         elif model_choice == '4':
-            self.register_openai_model(helper)
+            if self.service_type != 'open-source':
+                print(f"{Fore.RED}Hugging Face Transformers models are only supported in open-source OpenSearch.{Style.RESET_ALL}")
+            else:
+                self.huggingface_model.register_huggingface_model(self.opensearch_client, self.config, self.save_config)
+        elif model_choice == '5':
+            if self.service_type != 'open-source':
+                print(f"{Fore.RED}Custom PyTorch models are only supported in open-source OpenSearch.{Style.RESET_ALL}")
+            else:
+                self.custom_pytorch_model.register_custom_pytorch_model(self.opensearch_client, self.config, self.save_config)
         else:
             print(f"{Fore.RED}Invalid choice. Exiting model registration.{Style.RESET_ALL}")
             return
 
-    def get_iam_user_name_from_arn(self, iam_principal_arn):
-        """
-        Extract the IAM user name from the IAM principal ARN.
-        """
-        # IAM user ARN format: arn:aws:iam::123456789012:user/user-name
-        if iam_principal_arn and ':user/' in iam_principal_arn:
-            return iam_principal_arn.split(':user/')[-1]
-        else:
-            return None
-
-    def register_bedrock_model(self, helper):
-        """
-        Register a Bedrock embedding model by creating the necessary connector and model in OpenSearch.
-        """
-        # Prompt for necessary inputs
-        bedrock_region = input(f"Enter your Bedrock region [{self.aws_region}]: ") or self.aws_region
-        connector_role_name = "my_test_bedrock_connector_role"
-        create_connector_role_name = "my_test_create_bedrock_connector_role"
-
-        # Set up connector role inline policy
-        connector_role_inline_policy = {
-            "Version": "2012-10-17",
-            "Statement": [
-                {
-                    "Action": ["bedrock:InvokeModel"],
-                    "Effect": "Allow",
-                    "Resource": "arn:aws:bedrock:*::foundation-model/amazon.titan-embed-text-v1"
-                }
-            ]
-        }
-
-        # Default connector input
-        default_connector_input = {
-            "name": "Amazon Bedrock Connector: titan embedding v1",
-            "description": "The connector to Bedrock Titan embedding model",
-            "version": 1,
-            "protocol": "aws_sigv4",
-            "parameters": {
-                "region": bedrock_region,
-                "service_name": "bedrock"
-            },
-            "actions": [
-                {
-                    "action_type": "predict",
-                    "method": "POST",
-                    "url": f"https://bedrock-runtime.{bedrock_region}.amazonaws.com/model/amazon.titan-embed-text-v1/invoke",
-                    "headers": {
-                        "content-type": "application/json",
-                        "x-amz-content-sha256": "required"
-                    },
-                    "request_body": "{ \"inputText\": \"${parameters.inputText}\" }",
-                    "pre_process_function": "\n    StringBuilder builder = new StringBuilder();\n    builder.append(\"\\\"\");\n    String first = params.text_docs[0];\n    builder.append(first);\n    builder.append(\"\\\"\");\n    def parameters = \"{\" +\"\\\"inputText\\\":\" + builder + \"}\";\n    return  \"{\" +\"\\\"parameters\\\":\" + parameters + \"}\";",
-                    "post_process_function": "\n      def name = \"sentence_embedding\";\n      def dataType = \"FLOAT32\";\n      if (params.embedding == null || params.embedding.length == 0) {\n        return params.message;\n      }\n      def shape = [params.embedding.length];\n      def json = \"{\" +\n                 \"\\\"name\\\":\\\"\" + name + \"\\\",\" +\n                 \"\\\"data_type\\\":\\\"\" + dataType + \"\\\",\" +\n                 \"\\\"shape\\\":\" + shape + \",\" +\n                 \"\\\"data\\\":\" + params.embedding +\n                 \"}\";\n      return json;\n    "
-                }
-            ]
-        }
-
-        # Get model details from user
-        create_connector_input = self.get_custom_model_details(default_connector_input)
-        if not create_connector_input:
-            return  # Abort if no valid input
-
-        # Create connector
-        print("Creating connector...")
-        connector_id = helper.create_connector_with_role(
-            connector_role_inline_policy,
-            connector_role_name,
-            create_connector_role_name,
-            create_connector_input,
-            sleep_time_in_seconds=10
-        )
-
-        if not connector_id:
-            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Register model
-        print("Registering model...")
-        model_name = create_connector_input.get('name', 'Bedrock embedding model')
-        description = create_connector_input.get('description', 'Bedrock embedding model for semantic search')
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
-
-        if not model_id:
-            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Save model_id to config
-        self.config['embedding_model_id'] = model_id
-        self.save_config(self.config)
-        print(f"{Fore.GREEN}Model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
-        
-    def register_sagemaker_model(self, helper):
-        """
-        Register a SageMaker embedding model by creating the necessary connector and model in OpenSearch.
-        """
-        # Prompt for necessary inputs
-        sagemaker_endpoint_arn = input("Enter your SageMaker inference endpoint ARN: ")
-        sagemaker_endpoint_url = input("Enter your SageMaker inference endpoint URL: ")
-        sagemaker_region = input(f"Enter your SageMaker region [{self.aws_region}]: ") or self.aws_region
-        connector_role_name = "my_test_sagemaker_connector_role"
-        create_connector_role_name = "my_test_create_sagemaker_connector_role"
-
-        # Set up connector role inline policy
-        connector_role_inline_policy = {
-            "Version": "2012-10-17",
-            "Statement": [
-                {
-                    "Action": ["sagemaker:InvokeEndpoint"],
-                    "Effect": "Allow",
-                    "Resource": sagemaker_endpoint_arn
-                }
-            ]
-        }
-
-        # Create connector input
-        create_connector_input = {
-            "name": "SageMaker embedding model connector",
-            "description": "Connector for my SageMaker embedding model",
-            "version": "1.0",
-            "protocol": "aws_sigv4",
-            "parameters": {
-                "region": sagemaker_region,
-                "service_name": "sagemaker"
-            },
-            "actions": [
-                {
-                    "action_type": "predict",
-                    "method": "POST",
-                    "headers": {
-                        "content-type": "application/json"
-                    },
-                    "url": sagemaker_endpoint_url,
-                    "request_body": "${parameters.input}",
-                    "pre_process_function": "connector.pre_process.default.embedding",
-                    "post_process_function": "connector.post_process.default.embedding"
-                }
-            ]
-        }
-
-        # Create connector
-        connector_id = helper.create_connector_with_role(
-            connector_role_inline_policy,
-            connector_role_name,
-            create_connector_role_name,
-            create_connector_input,
-            sleep_time_in_seconds=10
-        )
-
-        if not connector_id:
-            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Register model
-        model_name = 'SageMaker embedding model'
-        description = 'SageMaker embedding model for semantic search'
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
-
-        if not model_id:
-            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Save model_id to config
-        self.config['embedding_model_id'] = model_id
-        self.save_config(self.config)
-        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")
-
-    def register_cohere_model(self, helper):
-        """
-        Register a Cohere embedding model by creating the necessary connector and model in OpenSearch.
-        """
-        # Prompt for necessary inputs
-        secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
-        secret_key = 'cohere_api_key'
-        cohere_api_key = input("Enter your Cohere API key: ")
-        secret_value = {secret_key: cohere_api_key}
-
-        connector_role_name = "my_test_cohere_connector_role"
-        create_connector_role_name = "my_test_create_cohere_connector_role"
-
-        # Default connector input
-        default_connector_input = {
-            "name": "Cohere Embedding Model Connector",
-            "description": "Connector for Cohere embedding model",
-            "version": "1.0",
-            "protocol": "http",
-            "parameters": {
-                "model": "embed-english-v3.0",
-                "input_type": "search_document",
-                "truncate": "END"
-            },
-            "actions": [
-                {
-                    "action_type": "predict",
-                    "method": "POST",
-                    "url": "https://api.cohere.ai/v1/embed",
-                    "headers": {
-                        "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
-                        "Request-Source": "unspecified:opensearch"
-                    },
-                    "request_body": "{ \"texts\": ${parameters.texts}, \"truncate\": \"${parameters.truncate}\", \"model\": \"${parameters.model}\", \"input_type\": \"${parameters.input_type}\" }",
-                    "pre_process_function": "connector.pre_process.cohere.embedding",
-                    "post_process_function": "connector.post_process.cohere.embedding"
-                }
-            ]
-        }
-
-        # Get model details from user
-        create_connector_input = self.get_custom_model_details(default_connector_input)
-        if not create_connector_input:
-            return  # Abort if no valid input
-
-        # Create connector
-        connector_id = helper.create_connector_with_secret(
-            secret_name,
-            secret_value,
-            connector_role_name,
-            create_connector_role_name,
-            create_connector_input,
-            sleep_time_in_seconds=10
-        )
-
-        if not connector_id:
-            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Register model
-        model_name = create_connector_input.get('name', 'Cohere embedding model')
-        description = create_connector_input.get('description', 'Cohere embedding model for semantic search')
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
-
-        if not model_id:
-            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Save model_id to config
-        self.config['embedding_model_id'] = model_id
-        self.save_config(self.config)
-        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")
-
-    def register_openai_model(self, helper):
-        """
-        Register an OpenAI embedding model by creating the necessary connector and model in OpenSearch.
-        """
-        # Prompt for necessary inputs
-        secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
-        secret_key = 'openai_api_key'
-        openai_api_key = input("Enter your OpenAI API key: ")
-        secret_value = {secret_key: openai_api_key}
-
-        connector_role_name = "my_test_openai_connector_role"
-        create_connector_role_name = "my_test_create_openai_connector_role"
-
-        # Default connector input
-        default_connector_input = {
-            "name": "OpenAI Embedding Model Connector",
-            "description": "Connector for OpenAI embedding model",
-            "version": "1.0",
-            "protocol": "http",
-            "parameters": {
-                "model": "text-embedding-ada-002"
-            },
-            "actions": [
-                {
-                    "action_type": "predict",
-                    "method": "POST",
-                    "url": "https://api.openai.com/v1/embeddings",
-                    "headers": {
-                        "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
-                        "Content-Type": "application/json"
-                    },
-                    "request_body": "{ \"input\": ${parameters.input}, \"model\": \"${parameters.model}\" }",
-                    "pre_process_function": "connector.pre_process.openai.embedding",
-                    "post_process_function": "connector.post_process.openai.embedding"
-                }
-            ]
-        }
-
-        # Get model details from user
-        create_connector_input = self.get_custom_model_details(default_connector_input)
-        if not create_connector_input:
-            return  # Abort if no valid input
-
-        # Create connector
-        connector_id = helper.create_connector_with_secret(
-            secret_name,
-            secret_value,
-            connector_role_name,
-            create_connector_role_name,
-            create_connector_input,
-            sleep_time_in_seconds=10
-        )
-
-        if not connector_id:
-            print(f"{Fore.RED}Failed to create connector. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Register model
-        model_name = create_connector_input.get('name', 'OpenAI embedding model')
-        description = create_connector_input.get('description', 'OpenAI embedding model for semantic search')
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
-
-        if not model_id:
-            print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
-            return
-
-        # Save model_id to config
-        self.config['embedding_model_id'] = model_id
-        self.save_config(self.config)
-        print(f"{Fore.GREEN}Model registered successfully. Model ID: {model_id}{Style.RESET_ALL}")
-
     def prompt_opensource_model_registration(self):
         """
         Handle model registration for open-source OpenSearch.
@@ -515,544 +241,20 @@ def register_model_opensource_interactive(self):
 
         # Prompt user to select a model
         print("\nPlease select an embedding model to register:")
-        print("1. Cohere Embedding Model")
-        print("2. OpenAI Embedding Model")
+        print("1. OpenAI Embedding Model")
+        print("2. Cohere Embedding Model")
         print("3. Hugging Face Transformers Model")
         print("4. Custom PyTorch Model")
         model_choice = input("Enter your choice (1-4): ")
 
         if model_choice == '1':
-            self.register_cohere_model_opensource()
+            self.openai_model.register_openai_model_opensource(self.opensearch_client, self.config, self.save_config)
         elif model_choice == '2':
-            self.register_openai_model_opensource()
+            self.cohere_model.register_cohere_model_opensource(self.opensearch_client, self.config, self.save_config)
         elif model_choice == '3':
-            self.register_huggingface_model()
+            self.huggingface_model.register_huggingface_model(self.opensearch_client, self.config, self.save_config)
         elif model_choice == '4':
-            self.register_custom_pytorch_model()
+            self.custom_pytorch_model.register_custom_pytorch_model(self.opensearch_client, self.config, self.save_config)
         else:
             print(f"{Fore.RED}Invalid choice. Exiting model registration.{Style.RESET_ALL}")
-            return
-
-    def register_cohere_model_opensource(self):
-        """
-        Register a Cohere embedding model in open-source OpenSearch.
-        """
-        cohere_api_key = input("Enter your Cohere API key: ").strip()
-        if not cohere_api_key:
-            print(f"{Fore.RED}API key is required. Aborting.{Style.RESET_ALL}")
-            return
-
-        print("\nDo you want to use the default configuration or provide custom settings?")
-        print("1. Use default configuration")
-        print("2. Provide custom settings")
-        config_choice = input("Enter your choice (1-2): ").strip()
-
-        if config_choice == '1':
-            # Use default configurations
-            connector_payload = {
-                "name": "Cohere Embedding Connector",
-                "description": "Connector for Cohere embedding model",
-                "version": "1.0",
-                "protocol": "http",
-                "parameters": {
-                    "model": "embed-english-v3.0",
-                    "input_type": "search_document",
-                    "truncate": "END"
-                },
-                "credential": {
-                    "cohere_key": cohere_api_key
-                },
-                "actions": [
-                    {
-                        "action_type": "predict",
-                        "method": "POST",
-                        "url": "https://api.cohere.ai/v1/embed",
-                        "headers": {
-                            "Authorization": "Bearer ${credential.cohere_key}",
-                            "Request-Source": "unspecified:opensearch"
-                        },
-                        "request_body": "{ \"texts\": ${parameters.texts}, \"truncate\": \"${parameters.truncate}\", \"model\": \"${parameters.model}\", \"input_type\": \"${parameters.input_type}\" }",
-                        "pre_process_function": "connector.pre_process.cohere.embedding",
-                        "post_process_function": "connector.post_process.cohere.embedding"
-                    }
-                ]
-            }
-            model_group_payload = {
-                "name": f"cohere_model_group_{int(time.time())}",
-                "description": "Model group for Cohere models"
-            }
-        elif config_choice == '2':
-            # Get custom configurations
-            print("\nPlease enter your connector details as a JSON object.")
-            connector_payload = self.get_custom_json_input()
-            if not connector_payload:
-                return
-
-            print("\nPlease enter your model group details as a JSON object.")
-            model_group_payload = self.get_custom_json_input()
-            if not model_group_payload:
-                return
-        else:
-            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
-            return
-
-        # Register the connector
-        try:
-            connector_response = self.opensearch_client.transport.perform_request(
-                method="POST",
-                url="/_plugins/_ml/connectors/_create",
-                body=connector_payload
-            )
-            connector_id = connector_response.get('connector_id')
-            if not connector_id:
-                print(f"{Fore.RED}Failed to register connector. Response: {connector_response}{Style.RESET_ALL}")
-                return
-            print(f"{Fore.GREEN}Connector registered successfully. Connector ID: {connector_id}{Style.RESET_ALL}")
-        except Exception as ex:
-            print(f"{Fore.RED}Error registering connector: {ex}{Style.RESET_ALL}")
-            return
-
-        # Create model group
-        try:
-            model_group_response = self.opensearch_client.transport.perform_request(
-                method="POST",
-                url="/_plugins/_ml/model_groups/_register",
-                body=model_group_payload
-            )
-            model_group_id = model_group_response.get('model_group_id')
-            if not model_group_id:
-                print(f"{Fore.RED}Failed to create model group. Response: {model_group_response}{Style.RESET_ALL}")
-                return
-            print(f"{Fore.GREEN}Model group created successfully. Model Group ID: {model_group_id}{Style.RESET_ALL}")
-        except Exception as ex:
-            print(f"{Fore.RED}Error creating model group: {ex}{Style.RESET_ALL}")
-            if 'illegal_argument_exception' in str(ex) and 'already being used' in str(ex):
-                print(f"{Fore.YELLOW}A model group with this name already exists. Using the existing group.{Style.RESET_ALL}")
-                model_group_id = str(ex).split('ID: ')[-1].strip("'.")
-            else:
-                return
-
-        # Create model payload
-        model_payload = {
-            "name": connector_payload.get('name', 'Cohere embedding model'),
-            "function_name": "REMOTE",
-            "model_group_id": model_group_id,
-            "description": connector_payload.get('description', 'Cohere embedding model for semantic search'),
-            "connector_id": connector_id
-        }
-
-        # Register the model
-        try:
-            response = self.opensearch_client.transport.perform_request(
-                method="POST",
-                url="/_plugins/_ml/models/_register",
-                body=model_payload
-            )
-            task_id = response.get('task_id')
-            if task_id:
-                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
-                # Wait for the task to complete and retrieve the model_id
-                model_id = self.wait_for_model_registration(task_id)
-                if model_id:
-                    # Deploy the model
-                    deploy_response = self.opensearch_client.transport.perform_request(
-                        method="POST",
-                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
-                    )
-                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
-                    self.config['embedding_model_id'] = model_id
-                    self.save_config(self.config)
-                else:
-                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
-            else:
-                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
-        except Exception as ex:
-            print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
-
-    def register_openai_model_opensource(self):
-        """
-        Register an OpenAI embedding model in open-source OpenSearch.
-        """
-        openai_api_key = input("Enter your OpenAI API key: ").strip()
-        if not openai_api_key:
-            print(f"{Fore.RED}API key is required. Aborting.{Style.RESET_ALL}")
-            return
-
-        print("\nDo you want to use the default configuration or provide custom settings?")
-        print("1. Use default configuration")
-        print("2. Provide custom settings")
-        config_choice = input("Enter your choice (1-2): ").strip()
-
-        if config_choice == '1':
-            # Use default configurations
-            connector_payload = {
-                "name": "OpenAI Embedding Connector",
-                "description": "Connector for OpenAI embedding model",
-                "version": "1",
-                "protocol": "http",
-                "parameters": {
-                    "model": "text-embedding-ada-002"
-                },
-                "credential": {
-                    "openAI_key": openai_api_key
-                },
-                "actions": [
-                    {
-                        "action_type": "predict",
-                        "method": "POST",
-                        "url": "https://api.openai.com/v1/embeddings",
-                        "headers": {
-                            "Authorization": "Bearer ${credential.openAI_key}",
-                            "Content-Type": "application/json"
-                        },
-                        "request_body": "{ \"input\": ${parameters.input}, \"model\": \"${parameters.model}\" }",
-                        "pre_process_function": "connector.pre_process.openai.embedding",
-                        "post_process_function": "connector.post_process.openai.embedding"
-                    }
-                ]
-            }
-            model_group_payload = {
-                "name": f"openai_model_group_{int(time.time())}",
-                "description": "Model group for OpenAI models"
-            }
-        elif config_choice == '2':
-            # Get custom configurations
-            print("\nPlease enter your connector details as a JSON object.")
-            connector_payload = self.get_custom_json_input()
-            if not connector_payload:
-                return
-
-            print("\nPlease enter your model group details as a JSON object.")
-            model_group_payload = self.get_custom_json_input()
-            if not model_group_payload:
-                return
-        else:
-            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
-            return
-
-        # Register the connector
-        try:
-            connector_response = self.opensearch_client.transport.perform_request(
-                method="POST",
-                url="/_plugins/_ml/connectors/_create",
-                body=connector_payload
-            )
-            connector_id = connector_response.get('connector_id')
-            if not connector_id:
-                print(f"{Fore.RED}Failed to register connector. Response: {connector_response}{Style.RESET_ALL}")
-                return
-            print(f"{Fore.GREEN}Connector registered successfully. Connector ID: {connector_id}{Style.RESET_ALL}")
-        except Exception as ex:
-            print(f"{Fore.RED}Error registering connector: {ex}{Style.RESET_ALL}")
-            return
-
-        # Create model group
-        try:
-            model_group_response = self.opensearch_client.transport.perform_request(
-                method="POST",
-                url="/_plugins/_ml/model_groups/_register",
-                body=model_group_payload
-            )
-            model_group_id = model_group_response.get('model_group_id')
-            if not model_group_id:
-                print(f"{Fore.RED}Failed to create model group. Response: {model_group_response}{Style.RESET_ALL}")
-                return
-            print(f"{Fore.GREEN}Model group created successfully. Model Group ID: {model_group_id}{Style.RESET_ALL}")
-        except Exception as ex:
-            print(f"{Fore.RED}Error creating model group: {ex}{Style.RESET_ALL}")
-            if 'illegal_argument_exception' in str(ex) and 'already being used' in str(ex):
-                print(f"{Fore.YELLOW}A model group with this name already exists. Using the existing group.{Style.RESET_ALL}")
-                model_group_id = str(ex).split('ID: ')[-1].strip("'.")
-            else:
-                return
-
-        # Create model payload
-        model_payload = {
-            "name": connector_payload.get('name', 'OpenAI embedding model'),
-            "function_name": "REMOTE",
-            "model_group_id": model_group_id,
-            "description": connector_payload.get('description', 'OpenAI embedding model for semantic search'),
-            "connector_id": connector_id
-        }
-
-        # Register the model
-        try:
-            response = self.opensearch_client.transport.perform_request(
-                method="POST",
-                url="/_plugins/_ml/models/_register",
-                body=model_payload
-            )
-            task_id = response.get('task_id')
-            if task_id:
-                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
-                # Wait for the task to complete and retrieve the model_id
-                model_id = self.wait_for_model_registration(task_id)
-                if model_id:
-                    # Deploy the model
-                    deploy_response = self.opensearch_client.transport.perform_request(
-                        method="POST",
-                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
-                    )
-                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
-                    self.config['embedding_model_id'] = model_id
-                    self.save_config(self.config)
-                else:
-                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
-            else:
-                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
-        except Exception as ex:
-            print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
-
-    def get_custom_json_input(self):
-        """Helper method to get custom JSON input from the user."""
-        json_input = input("Enter your JSON object: ").strip()
-        try:
-            return json.loads(json_input)
-        except json.JSONDecodeError as e:
-            print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
-            return None
-
-
-    def get_model_id_from_task(self, task_id, timeout=600, interval=10):
-        """
-        Wait for the model registration task to complete and return the model_id.
-        """
-        import time
-        end_time = time.time() + timeout
-        while time.time() < end_time:
-            try:
-                response = self.opensearch_client.transport.perform_request(
-                    method="GET",
-                    url=f"/_plugins/_ml/tasks/{task_id}"
-                )
-                state = response.get('state')
-                if state == 'COMPLETED':
-                    model_id = response.get('model_id')
-                    return model_id
-                elif state in ['FAILED', 'STOPPED']:
-                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
-                    return None
-                else:
-                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
-                    time.sleep(interval)
-            except Exception as ex:
-                print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
-                time.sleep(interval)
-        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
-        return None
-
-    def register_huggingface_model(self):
-        """
-        Register a Hugging Face Transformers model in open-source OpenSearch.
-        """
-        print("\nDo you want to use the default configuration or provide custom settings?")
-        print("1. Use default configuration")
-        print("2. Provide custom settings")
-        config_choice = input("Enter your choice (1-2): ").strip()
-
-        if config_choice == '1':
-            # Use default configurations
-            model_name = "sentence-transformers/all-MiniLM-L6-v2"
-            model_payload = {
-                "name": f"huggingface_{model_name.split('/')[-1]}",
-                "model_format": "TORCH_SCRIPT",
-                "model_config": {
-                    "embedding_dimension": self.embedding_dimension,
-                    "framework_type": "SENTENCE_TRANSFORMERS",
-                    "model_type": "bert",
-                    "embedding_model": model_name
-                },
-                "description": f"Hugging Face Transformers model: {model_name}"
-            }
-        elif config_choice == '2':
-            # Get custom configurations
-            model_name = input("Enter the Hugging Face model ID (e.g., 'sentence-transformers/all-MiniLM-L6-v2'): ").strip()
-            if not model_name:
-                print(f"{Fore.RED}Model ID is required. Aborting.{Style.RESET_ALL}")
-                return
-
-            print("\nPlease enter your model details as a JSON object.")
-            print("Example:")
-            example_payload = {
-                "name": f"huggingface_{model_name.split('/')[-1]}",
-                "model_format": "TORCH_SCRIPT",
-                "model_config": {
-                    "embedding_dimension": self.embedding_dimension,
-                    "framework_type": "SENTENCE_TRANSFORMERS",
-                    "model_type": "bert",
-                    "embedding_model": model_name
-                },
-                "description": f"Hugging Face Transformers model: {model_name}"
-            }
-            print(json.dumps(example_payload, indent=2))
-            
-            model_payload = self.get_custom_json_input()
-            if not model_payload:
-                return
-        else:
-            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
-            return
-
-        # Register the model
-        try:
-            response = self.opensearch_client.transport.perform_request(
-                method="POST",
-                url="/_plugins/_ml/models/_register",
-                body=model_payload
-            )
-            task_id = response.get('task_id')
-            if task_id:
-                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
-                # Wait for the task to complete and retrieve the model_id
-                model_id = self.wait_for_model_registration(task_id)
-                if model_id:
-                    # Deploy the model
-                    deploy_response = self.opensearch_client.transport.perform_request(
-                        method="POST",
-                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
-                    )
-                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
-                    self.config['embedding_model_id'] = model_id
-                    self.save_config(self.config)
-                else:
-                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
-            else:
-                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
-        except Exception as ex:
-            print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
-
-    def wait_for_model_registration(self, task_id, timeout=600, interval=10):
-        """
-        Wait for the model registration task to complete and return the model_id.
-        """
-        import time
-        end_time = time.time() + timeout
-        while time.time() < end_time:
-            try:
-                response = self.opensearch_client.transport.perform_request(
-                    method="GET",
-                    url=f"/_plugins/_ml/tasks/{task_id}"
-                )
-                state = response.get('state')
-                if state == 'COMPLETED':
-                    model_id = response.get('model_id')
-                    return model_id
-                elif state in ['FAILED', 'STOPPED']:
-                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
-                    return None
-                else:
-                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
-                    time.sleep(interval)
-            except Exception as ex:
-                print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
-                time.sleep(interval)
-        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
-        return None
-
-def register_custom_pytorch_model(self):
-    """
-    Register a custom PyTorch model in open-source OpenSearch.
-    """
-    print("\nDo you want to use the default configuration or provide custom settings?")
-    print("1. Use default configuration")
-    print("2. Provide custom settings")
-    config_choice = input("Enter your choice (1-2): ").strip()
-
-    if config_choice == '1':
-        # Use default configurations
-        model_path = input("Enter the path to your PyTorch model file (.pt or .pth): ").strip()
-        if not os.path.isfile(model_path):
-            print(f"{Fore.RED}Model file not found at '{model_path}'. Aborting.{Style.RESET_ALL}")
-            return
-
-        model_name = os.path.basename(model_path).split('.')[0]
-        model_payload = {
-            "name": f"custom_pytorch_{model_name}",
-            "model_format": "TORCH_SCRIPT",
-            "model_config": {
-                "embedding_dimension": self.embedding_dimension,
-                "framework_type": "CUSTOM",
-                "model_type": "bert"
-            },
-            "description": f"Custom PyTorch model: {model_name}"
-        }
-    elif config_choice == '2':
-        # Get custom configurations
-        model_path = input("Enter the path to your PyTorch model file (.pt or .pth): ").strip()
-        if not os.path.isfile(model_path):
-            print(f"{Fore.RED}Model file not found at '{model_path}'. Aborting.{Style.RESET_ALL}")
-            return
-
-        print("\nPlease enter your model details as a JSON object.")
-        print("Example:")
-        example_payload = {
-            "name": "custom_pytorch_model",
-            "model_format": "TORCH_SCRIPT",
-            "model_config": {
-                "embedding_dimension": self.embedding_dimension,
-                "framework_type": "CUSTOM",
-                "model_type": "bert"
-            },
-            "description": "Custom PyTorch model for semantic search"
-        }
-        print(json.dumps(example_payload, indent=2))
-        
-        model_payload = self.get_custom_json_input()
-        if not model_payload:
-            return
-    else:
-        print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
-        return
-
-    # Upload the model file to OpenSearch
-    try:
-        with open(model_path, 'rb') as f:
-            model_content = f.read()
-
-        # Use the ML plugin's model upload API
-        upload_response = self.opensearch_client.transport.perform_request(
-            method="POST",
-            url="/_plugins/_ml/models/_upload",
-            params={"model_name": model_payload['name']},
-            body=model_content,
-            headers={'Content-Type': 'application/octet-stream'}
-        )
-        if 'model_id' not in upload_response:
-            print(f"{Fore.RED}Failed to upload model. Response: {upload_response}{Style.RESET_ALL}")
-            return
-        model_id = upload_response['model_id']
-        print(f"{Fore.GREEN}Model uploaded successfully. Model ID: {model_id}{Style.RESET_ALL}")
-    except Exception as ex:
-        print(f"{Fore.RED}Error uploading model: {ex}{Style.RESET_ALL}")
-        return
-
-    # Add the model_id to the payload
-    model_payload['model_id'] = model_id
-
-    # Register the model
-    try:
-        response = self.opensearch_client.transport.perform_request(
-            method="POST",
-            url="/_plugins/_ml/models/_register",
-            body=model_payload
-        )
-        task_id = response.get('task_id')
-        if task_id:
-            print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
-            # Wait for the task to complete and retrieve the model_id
-            registered_model_id = self.wait_for_model_registration(task_id)
-            if registered_model_id:
-                # Deploy the model
-                deploy_response = self.opensearch_client.transport.perform_request(
-                    method="POST",
-                    url=f"/_plugins/_ml/models/{registered_model_id}/_deploy"
-                )
-                print(f"{Fore.GREEN}Model deployed successfully. Model ID: {registered_model_id}{Style.RESET_ALL}")
-                self.config['embedding_model_id'] = registered_model_id
-                self.save_config(self.config)
-            else:
-                print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
-        else:
-            print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
-    except Exception as ex:
-        print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
+            return
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index ee8aa66f..03577be0 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -2,25 +2,22 @@
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
-# Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
-
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
+# Any modifications Copyright OpenSearch Contributors.
+# See GitHub history for details.
+# Licensed to Elasticsearch B.V. under one or more contributor
+# license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright
+# ownership. Elasticsearch B.V. licenses this file to you under
+# the Apache License, Version 2.0 (the "License"); you may
+# not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+# http://www.apache.org/licenses/LICENSE-2.0
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
 
 import boto3
 import botocore
@@ -41,6 +38,7 @@
 import ssl
 
 init(autoreset=True)
+
 class Setup:
     CONFIG_FILE = 'config.ini'
     SERVICE_AOSS = 'opensearchserverless'
@@ -172,13 +170,12 @@ def get_password_with_asterisks(self, prompt="Enter password: "):
                         sys.stdout.flush()
             finally:
                 termios.tcsetattr(fd, termios.TCSADRAIN, old_settings)
+
     def setup_configuration(self):
         # Set up the configuration by prompting the user for various settings
         config = self.load_config()
 
-        self.aws_region = input(f"Enter your AWS Region [{config.get('region', 'us-west-2')}]: ") or config.get('region', 'us-west-2')
-        self.iam_principal = input(f"Enter your IAM Principal ARN [{config.get('iam_principal', '')}]: ") or config.get('iam_principal', '')
-
+        # First, prompt for service type
         print("Choose OpenSearch service type:")
         print("1. Serverless")
         print("2. Managed")
@@ -195,20 +192,29 @@ def setup_configuration(self):
             print("Invalid choice. Defaulting to 'managed'")
             self.service_type = 'managed'
 
-        if self.service_type == 'serverless':
-            self.collection_name = input("Enter the name for your OpenSearch collection: ")
-            self.opensearch_endpoint = None
-            self.opensearch_username = None
-            self.opensearch_password = None
-        elif self.service_type == 'managed':
-            self.opensearch_endpoint = input("Enter your OpenSearch domain endpoint: ")
-            self.opensearch_username = input("Enter your OpenSearch username: ")
-            self.opensearch_password = self.get_password_with_asterisks("Enter your OpenSearch password: ")
-            self.collection_name = ''
+        # Based on service type, prompt for different configurations
+        if self.service_type in ['serverless', 'managed']:
+            # For 'serverless' and 'managed', prompt for AWS credentials and related info
+            self.check_and_configure_aws()
+
+            self.aws_region = input(f"Enter your AWS Region [{config.get('region', 'us-west-2')}]: ") or config.get('region', 'us-west-2')
+            self.iam_principal = input(f"Enter your IAM Principal ARN [{config.get('iam_principal', '')}]: ") or config.get('iam_principal', '')
+
+            if self.service_type == 'serverless':
+                self.collection_name = input("Enter the name for your OpenSearch collection: ")
+                self.opensearch_endpoint = None
+                self.opensearch_username = None
+                self.opensearch_password = None
+            elif self.service_type == 'managed':
+                self.opensearch_endpoint = input("Enter your OpenSearch domain endpoint: ")
+                self.opensearch_username = input("Enter your OpenSearch username: ")
+                self.opensearch_password = self.get_password_with_asterisks("Enter your OpenSearch password: ")
+                self.collection_name = ''
         elif self.service_type == 'open-source':
-            # For open-source, allow default endpoint
+            # For 'open-source', skip AWS configurations
+            print("\n--- Open-source OpenSearch Setup ---")
             default_endpoint = 'https://localhost:9200'
-            self.opensearch_endpoint = input(f"Press Enter to use the default endpoint(or type your custom endpoint) [{default_endpoint}]: ").strip() or default_endpoint
+            self.opensearch_endpoint = input(f"Press Enter to use the default endpoint (or type your custom endpoint) [{default_endpoint}]: ").strip() or default_endpoint
             auth_required = input("Does your OpenSearch instance require authentication? (yes/no): ").strip().lower()
             if auth_required == 'yes':
                 self.opensearch_username = input("Enter your OpenSearch username: ")
@@ -217,25 +223,28 @@ def setup_configuration(self):
                 self.opensearch_username = None
                 self.opensearch_password = None
             self.collection_name = ''
-            # For open-source, we may not need AWS region and IAM principal
+            # For open-source, AWS region and IAM principal are not needed
             self.aws_region = ''
             self.iam_principal = ''
 
-        # Remove index_name from configuration at this point
+        # Update configuration dictionary
         self.config = {
+            'service_type': self.service_type,
             'region': self.aws_region,
             'iam_principal': self.iam_principal,
             'collection_name': self.collection_name if self.collection_name else '',
-            'service_type': self.service_type,
             'opensearch_endpoint': self.opensearch_endpoint if self.opensearch_endpoint else '',
             'opensearch_username': self.opensearch_username if self.opensearch_username else '',
             'opensearch_password': self.opensearch_password if self.opensearch_password else ''
         }
         self.save_config(self.config)
-        print("Configuration saved successfully.")
+        print("Configuration saved successfully.\n")
 
     def initialize_clients(self):
-        # Initialize AWS clients (AOSS and Bedrock)
+        # Initialize AWS clients (AOSS and Bedrock) only if not open-source
+        if self.service_type == 'open-source':
+            return True  # No AWS clients needed
+
         try:
             boto_config = Config(
                 region_name=self.aws_region,
@@ -247,7 +256,7 @@ def initialize_clients(self):
             self.bedrock_client = boto3.client(self.SERVICE_BEDROCK, region_name=self.aws_region)
             
             time.sleep(7)
-            print("AWS clients initialized successfully.")
+            print("AWS clients initialized successfully.\n")
             return True
         except Exception as e:
             print(f"Failed to initialize AWS clients: {e}")
@@ -256,7 +265,7 @@ def initialize_clients(self):
     def create_security_policies(self):
         # Create security policies for serverless OpenSearch
         if not self.is_serverless:
-            print("Security policies are not applicable for managed OpenSearch domains.")
+            print("Security policies are not applicable for managed OpenSearch domains.\n")
             return
         
         encryption_policy = json.dumps({
@@ -302,11 +311,11 @@ def create_access_policy(self, name, description, policy_body):
         # Create a data access policy
         try:
             self.aoss_client.create_access_policy(description=description, name=name, policy=policy_body, type="data")
-            print(f"Data Access Policy '{name}' created successfully.")
+            print(f"Data Access Policy '{name}' created successfully.\n")
         except self.aoss_client.exceptions.ConflictException:
-            print(f"Data Access Policy '{name}' already exists.")
+            print(f"Data Access Policy '{name}' already exists.\n")
         except Exception as ex:
-            print(f"Error creating data access policy '{name}': {ex}")
+            print(f"Error creating data access policy '{name}': {ex}\n")
 
     def create_collection(self, collection_name, max_retries=3):
         # Create an OpenSearch serverless collection
@@ -339,6 +348,7 @@ def get_collection_id(self, collection_name):
         except Exception as ex:
             print(f"Error getting collection ID: {ex}")
         return None
+
     def get_opensearch_domain_name(self):
         """
         Extract the domain name from the OpenSearch endpoint URL.
@@ -355,9 +365,11 @@ def get_opensearch_domain_name(self):
                     domain_part = domain_part[len('search-'):]
                 # Remove the unique ID suffix after the domain name
                 domain_name = domain_part.rsplit('-', 1)[0]
-                print(f"Extracted domain name: {domain_name}")
+                print(f"Extracted domain name: {domain_name}\n")
                 return domain_name
         return None
+
+    @staticmethod
     def get_opensearch_domain_info(region, domain_name):
         """
         Retrieve the OpenSearch domain endpoint and ARN based on the domain name and region.
@@ -382,10 +394,10 @@ def wait_for_collection_active(self, collection_id, max_wait_minutes=30):
                 response = self.aoss_client.batch_get_collection(ids=[collection_id])
                 status = response['collectionDetails'][0]['status']
                 if status == 'ACTIVE':
-                    print(f"Collection '{self.collection_name}' is now active.")
+                    print(f"Collection '{self.collection_name}' is now active.\n")
                     return True
                 elif status in ['FAILED', 'DELETED']:
-                    print(f"Collection creation failed or was deleted. Status: {status}")
+                    print(f"Collection creation failed or was deleted. Status: {status}\n")
                     return False
                 else:
                     print(f"Collection status: {status}. Waiting...")
@@ -393,7 +405,7 @@ def wait_for_collection_active(self, collection_id, max_wait_minutes=30):
             except Exception as ex:
                 print(f"Error checking collection status: {ex}")
                 time.sleep(30)
-        print(f"Timed out waiting for collection to become active after {max_wait_minutes} minutes.")
+        print(f"Timed out waiting for collection to become active after {max_wait_minutes} minutes.\n")
         return False
 
     def get_collection_endpoint(self):
@@ -404,26 +416,27 @@ def get_collection_endpoint(self):
         try:
             collection_id = self.get_collection_id(self.collection_name)
             if not collection_id:
-                print(f"Collection '{self.collection_name}' not found.")
+                print(f"Collection '{self.collection_name}' not found.\n")
                 return None
             
             batch_get_response = self.aoss_client.batch_get_collection(ids=[collection_id])
             collection_details = batch_get_response.get('collectionDetails', [])
             
             if not collection_details:
-                print(f"No details found for collection ID '{collection_id}'.")
+                print(f"No details found for collection ID '{collection_id}'.\n")
                 return None
             
             self.opensearch_endpoint = collection_details[0].get('collectionEndpoint')
             if self.opensearch_endpoint:
-                print(f"Collection '{self.collection_name}' has endpoint URL: {self.opensearch_endpoint}")
+                print(f"Collection '{self.collection_name}' has endpoint URL: {self.opensearch_endpoint}\n")
                 return self.opensearch_endpoint
             else:
-                print(f"No endpoint URL found in collection '{self.collection_name}'.")
+                print(f"No endpoint URL found in collection '{self.collection_name}'.\n")
                 return None
         except Exception as ex:
-            print(f"Error retrieving collection endpoint: {ex}")
+            print(f"Error retrieving collection endpoint: {ex}\n")
             return None
+
     def get_iam_user_name_from_arn(self, iam_principal_arn):
         """
         Extract the IAM user name from the IAM principal ARN.
@@ -433,23 +446,23 @@ def get_iam_user_name_from_arn(self, iam_principal_arn):
             return iam_principal_arn.split(':user/')[-1]
         else:
             return None
-        
+
     def initialize_opensearch_client(self):
         # Initialize the OpenSearch client
         if not self.opensearch_endpoint:
-            print("OpenSearch endpoint not set. Please run setup first.")
+            print("OpenSearch endpoint not set. Please run setup first.\n")
             return False
 
         parsed_url = urlparse(self.opensearch_endpoint)
         host = parsed_url.hostname
         port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)  # Default ports
 
-        if self.is_serverless:
+        if self.service_type in ['managed', 'serverless']:
             credentials = boto3.Session().get_credentials()
-            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
+            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss') if self.is_serverless else AWSV4SignerAuth(credentials, self.aws_region, 'es')
         else:
             if not self.opensearch_username or not self.opensearch_password:
-                print("OpenSearch username or password not set. Please run setup first.")
+                print("OpenSearch username or password not set. Please run setup first.\n")
                 return False
             auth = (self.opensearch_username, self.opensearch_password)
 
@@ -475,10 +488,10 @@ def initialize_opensearch_client(self):
                 connection_class=RequestsHttpConnection,
                 pool_maxsize=20
             )
-            print(f"Initialized OpenSearch client with host: {host} and port: {port}")
+            print(f"Initialized OpenSearch client with host: {host} and port: {port}\n")
             return True
         except Exception as ex:
-            print(f"Error initializing OpenSearch client: {ex}")
+            print(f"Error initializing OpenSearch client: {ex}\n")
             return False
 
     def get_knn_index_details(self):
@@ -526,11 +539,10 @@ def get_knn_index_details(self):
                 print("Invalid input. Using default ef_construction of 512.")
                 ef_construction = 512
 
-        print(f"ef_construction set to: {ef_construction}")
+        print(f"ef_construction set to: {ef_construction}\n")
 
         return embedding_dimension, space_type, ef_construction
 
-
     def create_index(self, embedding_dimension, space_type, ef_construction):
         # Create the KNN index in OpenSearch
         index_body = {
@@ -559,31 +571,28 @@ def create_index(self, embedding_dimension, space_type, ef_construction):
         }
         try:
             self.opensearch_client.indices.create(index=self.index_name, body=index_body)
-            print(f"KNN index '{self.index_name}' created successfully with dimension {embedding_dimension}, space type {space_type}, and ef_construction {ef_construction}.")
+            print(f"KNN index '{self.index_name}' created successfully with dimension {embedding_dimension}, space type {space_type}, and ef_construction {ef_construction}.\n")
         except Exception as e:
             if 'resource_already_exists_exception' in str(e).lower():
-                print(f"Index '{self.index_name}' already exists.")
+                print(f"Index '{self.index_name}' already exists.\n")
             else:
-                print(f"Error creating index '{self.index_name}': {e}")
-
-
+                print(f"Error creating index '{self.index_name}': {e}\n")
 
     def verify_and_create_index(self, embedding_dimension, space_type, ef_construction):
         try:
             print(f"Attempting to verify index '{self.index_name}'...")
             index_exists = self.opensearch_client.indices.exists(index=self.index_name)
             if index_exists:
-                print(f"KNN index '{self.index_name}' already exists.")
+                print(f"KNN index '{self.index_name}' already exists.\n")
             else:
-                print(f"Index '{self.index_name}' does not exist. Attempting to create...")
+                print(f"Index '{self.index_name}' does not exist. Attempting to create...\n")
                 self.create_index(embedding_dimension, space_type, ef_construction)
             return True
         except Exception as ex:
             print(f"Error verifying or creating index: {ex}")
-            print(f"OpenSearch client config: {self.opensearch_client.transport.hosts}")
+            print(f"OpenSearch client config: {self.opensearch_client.transport.hosts}\n")
             return False
 
-
     def get_truncated_name(self, base_name, max_length=32):
         # Truncate a name to fit within a specified length
         if len(base_name) <= max_length:
@@ -591,11 +600,11 @@ def get_truncated_name(self, base_name, max_length=32):
         return base_name[:max_length-3] + "..."
 
     def setup_command(self):
-        self.check_and_configure_aws()
+        # Main setup command
         self.setup_configuration()
         
         if self.service_type != 'open-source' and not self.initialize_clients():
-            print(f"{Fore.RED}Failed to initialize AWS clients. Setup incomplete.{Style.RESET_ALL}")
+            print(f"{Fore.RED}Failed to initialize AWS clients. Setup incomplete.{Style.RESET_ALL}\n")
             return
         
         if self.service_type == 'serverless':
@@ -609,35 +618,35 @@ def setup_command(self):
                 if self.wait_for_collection_active(collection_id):
                     self.opensearch_endpoint = self.get_collection_endpoint()
                     if not self.opensearch_endpoint:
-                        print(f"{Fore.RED}Failed to retrieve OpenSearch endpoint. Setup incomplete.{Style.RESET_ALL}")
+                        print(f"{Fore.RED}Failed to retrieve OpenSearch endpoint. Setup incomplete.{Style.RESET_ALL}\n")
                         return
                     else:
                         self.config['opensearch_endpoint'] = self.opensearch_endpoint
                         self.save_config(self.config)
                         self.opensearch_domain_name = self.get_opensearch_domain_name()
                 else:
-                    print(f"{Fore.RED}Collection is not active. Setup incomplete.{Style.RESET_ALL}")
+                    print(f"{Fore.RED}Collection is not active. Setup incomplete.{Style.RESET_ALL}\n")
                     return
         elif self.service_type == 'managed':
             if not self.opensearch_endpoint:
-                print(f"{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}")
+                print(f"{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n")
                 return
             else:
                 self.opensearch_domain_name = self.get_opensearch_domain_name()
         elif self.service_type == 'open-source':
             # Open-source setup
             if not self.opensearch_endpoint:
-                print(f"{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}")
+                print(f"{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n")
                 return
             else:
                 self.opensearch_domain_name = None  # Not required for open-source
 
         # Initialize OpenSearch client
         if self.initialize_opensearch_client():
-            print(f"{Fore.GREEN}OpenSearch client initialized successfully.{Style.RESET_ALL}")
+            print(f"{Fore.GREEN}OpenSearch client initialized successfully.{Style.RESET_ALL}\n")
             
             # Prompt user to choose between creating a new index or using an existing one
-            print("\nDo you want to create a new KNN index or use an existing one?")
+            print("Do you want to create a new KNN index or use an existing one?")
             print("1. Create a new KNN index")
             print("2. Use an existing KNN index")
             index_choice = input("Enter your choice (1-2): ").strip()
@@ -650,36 +659,45 @@ def setup_command(self):
                 self.config['index_name'] = self.index_name
                 self.save_config(self.config)
         
-                print("Proceeding with index creation...")
+                print("Proceeding with index creation...\n")
                 embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
                 
                 if self.verify_and_create_index(embedding_dimension, space_type, ef_construction):
-                    print(f"{Fore.GREEN}KNN index '{self.index_name}' created successfully.{Style.RESET_ALL}")
+                    print(f"{Fore.GREEN}KNN index '{self.index_name}' created successfully.{Style.RESET_ALL}\n")
                     # Save index details to config
                     self.config['embedding_dimension'] = str(embedding_dimension)
                     self.config['space_type'] = space_type
                     self.config['ef_construction'] = str(ef_construction)
                     self.save_config(self.config)
                 else:
-                    print(f"{Fore.RED}Index creation failed. Please check your permissions and try again.{Style.RESET_ALL}")
+                    print(f"{Fore.RED}Index creation failed. Please check your permissions and try again.{Style.RESET_ALL}\n")
                     return
             elif index_choice == '2':
                 # Use existing index
                 existing_index_name = input("Enter the name of your existing KNN index: ").strip()
                 if not existing_index_name:
-                    print(f"{Fore.RED}Index name cannot be empty. Aborting.{Style.RESET_ALL}")
+                    print(f"{Fore.RED}Index name cannot be empty. Aborting.{Style.RESET_ALL}\n")
                     return
                 self.index_name = existing_index_name
                 self.config['index_name'] = self.index_name
                 self.save_config(self.config)
                 # Load index details from config or prompt for them
                 if 'embedding_dimension' in self.config and 'space_type' in self.config and 'ef_construction' in self.config:
-                    embedding_dimension = int(self.config['embedding_dimension'])
-                    space_type = self.config['space_type']
-                    ef_construction = int(self.config['ef_construction'])
-                    print(f"Using existing index '{self.index_name}' with embedding dimension {embedding_dimension}, space type '{space_type}', and ef_construction {ef_construction}.")
+                    try:
+                        embedding_dimension = int(self.config['embedding_dimension'])
+                        space_type = self.config['space_type']
+                        ef_construction = int(self.config['ef_construction'])
+                        print(f"Using existing index '{self.index_name}' with embedding dimension {embedding_dimension}, space type '{space_type}', and ef_construction {ef_construction}.\n")
+                    except ValueError:
+                        print("Invalid index details in configuration. Prompting for details again.\n")
+                        embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
+                        # Save index details to config
+                        self.config['embedding_dimension'] = str(embedding_dimension)
+                        self.config['space_type'] = space_type
+                        self.config['ef_construction'] = str(ef_construction)
+                        self.save_config(self.config)
                 else:
-                    print("Index details not found in configuration.")
+                    print("Index details not found in configuration. Prompting for details.\n")
                     embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
                     # Save index details to config
                     self.config['embedding_dimension'] = str(embedding_dimension)
@@ -688,10 +706,10 @@ def setup_command(self):
                     self.save_config(self.config)
                 # Verify that the index exists
                 if not self.opensearch_client.indices.exists(index=self.index_name):
-                    print(f"{Fore.RED}Index '{self.index_name}' does not exist in OpenSearch. Aborting.{Style.RESET_ALL}")
+                    print(f"{Fore.RED}Index '{self.index_name}' does not exist in OpenSearch. Aborting.{Style.RESET_ALL}\n")
                     return
             else:
-                print(f"{Fore.RED}Invalid choice. Please run setup again and select a valid option.{Style.RESET_ALL}")
+                print(f"{Fore.RED}Invalid choice. Please run setup again and select a valid option.{Style.RESET_ALL}\n")
                 return
 
             # Proceed with model registration
@@ -710,4 +728,4 @@ def setup_command(self):
                 # Open-source OpenSearch: Provide instructions or automate model registration
                 self.model_register.prompt_opensource_model_registration()
         else:
-            print(f"{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}")
\ No newline at end of file
+            print(f"{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}\n")
\ No newline at end of file

From da834d2da1d5eb8967da1502a186bb2c464c888d Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 29 Nov 2024 05:14:56 -0800
Subject: [PATCH 15/42] Remove base_model.py from rag pipeline

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../rag_pipeline/rag/ml_models/base_model.py         | 12 ------------
 1 file changed, 12 deletions(-)
 delete mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/base_model.py

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/base_model.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/base_model.py
deleted file mode 100644
index 7ca846a1..00000000
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/base_model.py
+++ /dev/null
@@ -1,12 +0,0 @@
-# models/base_model.py
-
-from abc import ABC, abstractmethod
-
-class BaseModelRegister(ABC):
-    def __init__(self, config, helper):
-        self.config = config
-        self.helper = helper
-
-    @abstractmethod
-    def register_model(self):
-        pass
\ No newline at end of file

From 9c45e432728ee2840dd5d3f2db37c11377f38cda Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 29 Nov 2024 06:34:33 -0800
Subject: [PATCH 16/42] Licence header

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../rag/ml_models/BedrockModel.py             | 24 ++++++++++++++++++-
 .../rag_pipeline/rag/ml_models/CohereModel.py | 24 ++++++++++++++++++-
 .../rag/ml_models/CustomPyTorchModel.py       | 24 ++++++++++++++++++-
 .../rag/ml_models/HuggingFaceModel.py         | 24 ++++++++++++++++++-
 .../rag_pipeline/rag/ml_models/OpenAIModel.py | 24 ++++++++++++++++++-
 .../rag/ml_models/SageMakerModel.py           | 24 ++++++++++++++++++-
 6 files changed, 138 insertions(+), 6 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
index 0b63787e..60bd55f3 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
@@ -1,4 +1,26 @@
-# BedrockModel.py
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
 
 import json
 from colorama import Fore, Style
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
index ef84362d..01c2d1dd 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
@@ -1,4 +1,26 @@
-# CohereModel.py
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
 import json
 from colorama import Fore, Style
 import time
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CustomPyTorchModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CustomPyTorchModel.py
index 6c6379f6..f5163629 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CustomPyTorchModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CustomPyTorchModel.py
@@ -1,4 +1,26 @@
-# CustomPyTorchModel.py
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
 import json
 from colorama import Fore, Style
 import os
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
index 77765845..b1bda520 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
@@ -1,4 +1,26 @@
-# HuggingFaceModel.py
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
 import json
 from colorama import Fore, Style
 import time
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
index 1fc8a937..ed72eaa2 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
@@ -1,4 +1,26 @@
-# OpenAIModel.py
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
 import json
 from colorama import Fore, Style
 import time
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
index 3288a8a2..2f7975ed 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
@@ -1,4 +1,26 @@
-# SageMakerModel.py
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
 import json
 from colorama import Fore, Style
 

From a61a84036b6baef7a4c069c6385a08f6913ec24b Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Mon, 2 Dec 2024 13:48:52 -0800
Subject: [PATCH 17/42] Updated user setup, Added Semantic search for Managed
 service using ML Models, Added Neural search for non managed service., Added
 UT, Update to Changelog to reflect recent changes and to past tests. Modified
 setup.py to pass integration tests.

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 CHANGELOG.md                                  |   1 +
 .../rag_pipeline/rag/IAMRoleHelper.py         |  96 ++--
 .../rag_pipeline/rag/SecretsHelper.py         |  54 +-
 .../ml_commons/rag_pipeline/rag/ingest.py     | 253 ++++-----
 .../rag/ml_models/BedrockModel.py             |  16 +-
 ...{CustomPyTorchModel.py => PyTorchModel.py} |   0
 .../rag_pipeline/rag/model_register.py        |   3 +-
 .../rag_pipeline/rag/opensearch_connector.py  |  25 +-
 .../ml_commons/rag_pipeline/rag/query.py      | 304 ++++++++--
 .../ml_commons/rag_pipeline/rag/rag_setup.py  | 532 +++++++++---------
 .../ml_commons/rag_pipeline/rag/serverless.py | 240 ++++++++
 setup.py                                      |   1 -
 tests/rag/test_AiConnectorClass.py            | 518 +++++++++++++++++
 tests/rag/test_IAMRoleHelper.py               | 320 +++++++++++
 tests/rag/test_Model_Register.py              | 201 +++++++
 tests/rag/test_SecretsHelper                  | 137 +++++
 tests/rag/test_ingest.py                      | 223 ++++++++
 tests/rag/test_ml_models/test_BedrockModel.py | 116 ++++
 tests/rag/test_ml_models/test_CohereModel.py  | 158 ++++++
 tests/rag/test_ml_models/test_OpenAIModel.py  | 157 ++++++
 tests/rag/test_ml_models/test_PyTorchModel.py | 162 ++++++
 .../rag/test_ml_models/test_SageMakerModel.py | 137 +++++
 tests/rag/test_opensearch_connector.py        | 249 ++++++++
 tests/rag/test_query.py                       | 278 +++++++++
 tests/rag/test_rag.py                         | 166 ++++++
 tests/rag/test_rag_setup.py                   | 209 +++++++
 tests/rag/test_serverless.py                  | 232 ++++++++
 27 files changed, 4254 insertions(+), 534 deletions(-)
 rename opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/{CustomPyTorchModel.py => PyTorchModel.py} (100%)
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py
 create mode 100644 tests/rag/test_AiConnectorClass.py
 create mode 100644 tests/rag/test_IAMRoleHelper.py
 create mode 100644 tests/rag/test_Model_Register.py
 create mode 100644 tests/rag/test_SecretsHelper
 create mode 100644 tests/rag/test_ingest.py
 create mode 100644 tests/rag/test_ml_models/test_BedrockModel.py
 create mode 100644 tests/rag/test_ml_models/test_CohereModel.py
 create mode 100644 tests/rag/test_ml_models/test_OpenAIModel.py
 create mode 100644 tests/rag/test_ml_models/test_PyTorchModel.py
 create mode 100644 tests/rag/test_ml_models/test_SageMakerModel.py
 create mode 100644 tests/rag/test_opensearch_connector.py
 create mode 100644 tests/rag/test_query.py
 create mode 100644 tests/rag/test_rag.py
 create mode 100644 tests/rag/test_rag_setup.py
 create mode 100644 tests/rag/test_serverless.py

diff --git a/CHANGELOG.md b/CHANGELOG.md
index c239c208..c5c375db 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -46,6 +46,7 @@ Inspired from [Keep a Changelog](https://keepachangelog.com/en/1.0.0/)
 - updating listing file with three v2 sparse model - by @dhrubo-os ([#412](https://github.com/opensearch-project/opensearch-py-ml/pull/412))
 - Update model upload history -  opensearch-project/opensearch-neural-sparse-encoding-doc-v2-mini (v.1.0.0)(TORCH_SCRIPT) by @dhrubo-os ([#417](https://github.com/opensearch-project/opensearch-py-ml/pull/417))
 - Update model upload history -  opensearch-project/opensearch-neural-sparse-encoding-v2-distill (v.1.0.0)(TORCH_SCRIPT) by @dhrubo-os ([#419](https://github.com/opensearch-project/opensearch-py-ml/pull/419))
+- Added RAG functionality into `opensearch-py-ml` by @hmumtazz in ([#427](https://github.com/opensearch-project/opensearch-py-ml/pull/427))
 
 ### Fixed
 - Fix the wrong final zip file name in model_uploader workflow, now will name it by the upload_prefix alse.([#413](https://github.com/opensearch-project/opensearch-py-ml/pull/413/files))
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
index e39968b0..bbb62f1c 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
@@ -24,7 +24,7 @@
 
 import boto3
 import json
-from botocore.exceptions import BotoCoreError
+from botocore.exceptions import ClientError
 import requests
 
 class IAMRoleHelper:
@@ -44,8 +44,12 @@ def role_exists(self, role_name):
         try:
             iam_client.get_role(RoleName=role_name)
             return True
-        except iam_client.exceptions.NoSuchEntityException:
-            return False
+        except ClientError as e:
+            if e.response['Error']['Code'] == 'NoSuchEntity':
+                return False
+            else:
+                print(f"An error occurred: {e}")
+                return False
 
     def delete_role(self, role_name):
         iam_client = boto3.client('iam')
@@ -67,8 +71,11 @@ def delete_role(self, role_name):
             iam_client.delete_role(RoleName=role_name)
             print(f'Role {role_name} deleted.')
 
-        except iam_client.exceptions.NoSuchEntityException:
-            print(f'Role {role_name} does not exist.')
+        except ClientError as e:
+            if e.response['Error']['Code'] == 'NoSuchEntity':
+                print(f'Role {role_name} does not exist.')
+            else:
+                print(f"An error occurred: {e}")
 
     def create_iam_role(self, role_name, trust_policy_json, inline_policy_json):
         iam_client = boto3.client('iam')
@@ -94,7 +101,7 @@ def create_iam_role(self, role_name, trust_policy_json, inline_policy_json):
             print(f'Created role: {role_name}')
             return role_arn
 
-        except Exception as e:
+        except ClientError as e:
             print(f"Error creating the role: {e}")
             return None
 
@@ -106,12 +113,13 @@ def get_role_arn(self, role_name):
             response = iam_client.get_role(RoleName=role_name)
             # Return ARN of the role
             return response['Role']['Arn']
-        except iam_client.exceptions.NoSuchEntityException:
-            print(f"The requested role {role_name} does not exist")
-            return None
-        except Exception as e:
-            print(f"An error occurred: {e}")
-            return None
+        except ClientError as e:
+            if e.response['Error']['Code'] == 'NoSuchEntity':
+                print(f"The requested role {role_name} does not exist")
+                return None
+            else:
+                print(f"An error occurred: {e}")
+                return None
 
     def get_role_details(self, role_name):
         iam = boto3.client('iam')
@@ -135,36 +143,45 @@ def get_role_details(self, role_name):
                 print("Role Policy Document:")
                 print(json.dumps(get_role_policy_response['PolicyDocument'], indent=4, sort_keys=True))
 
-        except iam.exceptions.NoSuchEntityException:
-            print(f'Role {role_name} does not exist.')
+        except ClientError as e:
+            if e.response['Error']['Code'] == 'NoSuchEntity':
+                print(f'Role {role_name} does not exist.')
+            else:
+                print(f"An error occurred: {e}")
 
     def get_user_arn(self, username):
         if not username:
             return None
-        # Create a boto3 client for IAM
         iam_client = boto3.client('iam')
 
         try:
-            # Get information about the IAM user
             response = iam_client.get_user(UserName=username)
             user_arn = response['User']['Arn']
             return user_arn
-        except iam_client.exceptions.NoSuchEntityException:
-            print(f"IAM user '{username}' not found.")
-            return None
+        except ClientError as e:
+            if e.response['Error']['Code'] == 'NoSuchEntity':
+                print(f"IAM user '{username}' not found.")
+                return None
+            else:
+                print(f"An error occurred: {e}")
+                return None
 
     def assume_role(self, role_arn, role_session_name="your_session_name"):
         sts_client = boto3.client('sts')
 
-        assumed_role_object = sts_client.assume_role(
-            RoleArn=role_arn,
-            RoleSessionName=role_session_name,
-        )
+        try:
+            assumed_role_object = sts_client.assume_role(
+                RoleArn=role_arn,
+                RoleSessionName=role_session_name,
+            )
 
-        # Obtain the temporary credentials from the assumed role 
-        temp_credentials = assumed_role_object["Credentials"]
+            # Obtain the temporary credentials from the assumed role 
+            temp_credentials = assumed_role_object["Credentials"]
 
-        return temp_credentials
+            return temp_credentials
+        except ClientError as e:
+            print(f"Error assuming role: {e}")
+            return None
 
     def map_iam_role_to_backend_role(self, iam_role_arn):
         os_security_role = 'ml_full_access'  # Changed from 'all_access' to 'ml_full_access'
@@ -175,19 +192,22 @@ def map_iam_role_to_backend_role(self, iam_role_arn):
         }
         headers = {'Content-Type': 'application/json'}
 
-        response = requests.put(
-            url,
-            auth=(self.opensearch_domain_username, self.opensearch_domain_password),
-            json=payload,
-            headers=headers,
-            verify=True
-        )
+        try:
+            response = requests.put(
+                url,
+                auth=(self.opensearch_domain_username, self.opensearch_domain_password),
+                json=payload,
+                headers=headers,
+                verify=True
+            )
 
-        if response.status_code == 200:
-            print(f"Successfully mapped IAM role to OpenSearch role '{os_security_role}'.")
-        else:
-            print(f"Failed to map IAM role to OpenSearch role '{os_security_role}'. Status code: {response.status_code}")
-            print(f"Response: {response.text}")
+            if response.status_code == 200:
+                print(f"Successfully mapped IAM role to OpenSearch role '{os_security_role}'.")
+            else:
+                print(f"Failed to map IAM role to OpenSearch role '{os_security_role}'. Status code: {response.status_code}")
+                print(f"Response: {response.text}")
+        except requests.exceptions.RequestException as e:
+            print(f"HTTP request failed: {e}")
 
     def get_iam_user_name_from_arn(self, iam_principal_arn):
         """
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py
index 03825eeb..7c454f57 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py
@@ -21,9 +21,13 @@
 #  KIND, either express or implied.  See the License for the
 #  specific language governing permissions and limitations
 #  under the License.
+
+import logging
 import boto3
 import json
-from botocore.exceptions import BotoCoreError
+from botocore.exceptions import ClientError
+
+logger = logging.getLogger(__name__)
 
 class SecretHelper:
     def __init__(self, region):
@@ -32,50 +36,50 @@ def __init__(self, region):
     def secret_exists(self, secret_name):
         secretsmanager = boto3.client('secretsmanager', region_name=self.region)
         try:
-            # Try to get the secret
             secretsmanager.get_secret_value(SecretId=secret_name)
-            # If no exception was raised by get_secret_value, the secret exists
             return True
-        except secretsmanager.exceptions.ResourceNotFoundException:
-            # If a ResourceNotFoundException was raised, the secret does not exist
-            return False
+        except ClientError as e:
+            if e.response['Error']['Code'] == 'ResourceNotFoundException':
+                return False
+            else:
+                logger.error(f"An error occurred: {e}")
+                return False
 
     def get_secret_arn(self, secret_name):
         secretsmanager = boto3.client('secretsmanager', region_name=self.region)
         try:
             response = secretsmanager.describe_secret(SecretId=secret_name)
-            # Return ARN of the secret 
             return response['ARN']
-        except secretsmanager.exceptions.ResourceNotFoundException:
-            print(f"The requested secret {secret_name} was not found")
-            return None
-        except Exception as e:
-            print(f"An error occurred: {e}")
-            return None
+        except ClientError as e:
+            if e.response['Error']['Code'] == 'ResourceNotFoundException':
+                logger.warning(f"The requested secret {secret_name} was not found")
+                return None
+            else:
+                logger.error(f"An error occurred: {e}")
+                return None
 
     def get_secret(self, secret_name):
         secretsmanager = boto3.client('secretsmanager', region_name=self.region)
         try:
             response = secretsmanager.get_secret_value(SecretId=secret_name)
-        except secretsmanager.exceptions.NoSuchEntityException:
-            print("The requested secret was not found")
-            return None
-        except Exception as e:
-            print(f"An error occurred: {e}")
-            return None
-        else:
             return response.get('SecretString')
+        except ClientError as e:
+            if e.response['Error']['Code'] == 'ResourceNotFoundException':
+                logger.warning("The requested secret was not found")
+                return None
+            else:
+                logger.error(f"An error occurred: {e}")
+                return None
 
     def create_secret(self, secret_name, secret_value):
         secretsmanager = boto3.client('secretsmanager', region_name=self.region)
-
         try:
             response = secretsmanager.create_secret(
                 Name=secret_name,
                 SecretString=json.dumps(secret_value),
             )
-            print(f'Secret {secret_name} created successfully.')
-            return response['ARN']  # Return the ARN of the created secret
-        except BotoCoreError as e:
-            print(f'Error creating secret: {e}')
+            logger.info(f'Secret {secret_name} created successfully.')
+            return response['ARN']
+        except ClientError as e:
+            logger.error(f'Error creating secret: {e}')
             return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
index 2be1ed06..0ec4ea2c 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -5,7 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-
 #  Licensed to Elasticsearch B.V. under one or more contributor
 #  license agreements. See the NOTICE file distributed with
 #  this work for additional information regarding copyright
@@ -36,15 +35,13 @@
 import botocore
 import time
 import random
-from opensearchpy import exceptions as opensearch_exceptions 
-
+from opensearchpy import exceptions as opensearch_exceptions
 
 from opensearch_connector import OpenSearchConnector
 
 init(autoreset=True)  # Initialize colorama
 
 class Ingest:
-
     def __init__(self, config):
         # Initialize the Ingest class with configuration
         self.config = config
@@ -53,6 +50,7 @@ def __init__(self, config):
         self.bedrock_client = None
         self.opensearch = OpenSearchConnector(config)
         self.embedding_model_id = config.get('embedding_model_id')
+        self.pipeline_name = config.get('ingest_pipeline_name', 'text-chunking-ingest-pipeline')
 
         if not self.embedding_model_id:
             print("Embedding model ID is not set. Please run setup first.")
@@ -67,13 +65,131 @@ def initialize_clients(self):
             print("Failed to initialize OpenSearch client.")
             return False
 
+    def ingest_command(self, paths: List[str]):
+        # Main ingestion command
+        # Processes all valid files in the given paths and initiates ingestion
+
+        all_files = []
+        for path in paths:
+            if os.path.isfile(path):
+                all_files.append(path)
+            elif os.path.isdir(path):
+                for root, dirs, files in os.walk(path):
+                    for file in files:
+                        all_files.append(os.path.join(root, file))
+            else:
+                print(f"{Fore.YELLOW}Invalid path: {path}{Style.RESET_ALL}")
+
+        supported_extensions = ['.csv', '.txt', '.pdf']
+        valid_files = [f for f in all_files if any(f.lower().endswith(ext) for ext in supported_extensions)]
+
+        if not valid_files:
+            print(f"{Fore.RED}No valid files found for ingestion.{Style.RESET_ALL}")
+            return
+
+        print(f"{Fore.GREEN}Found {len(valid_files)} valid files for ingestion.{Style.RESET_ALL}")
+
+        self.process_and_ingest_data(valid_files)
+
+    def process_and_ingest_data(self, file_paths: List[str]):
+        if not self.initialize_clients():
+            print("Failed to initialize clients. Aborting ingestion.")
+            return
+
+        # Create the ingest pipeline
+        self.create_ingest_pipeline(self.pipeline_name)
+
+        all_documents = []
+        for file_path in file_paths:
+            print(f"\nProcessing file: {file_path}")
+            documents = self.process_file(file_path)
+            all_documents.extend(documents)
+
+        total_documents = len(all_documents)
+        print(f"\nTotal documents to process: {total_documents}")
+
+        print("\nGenerating embeddings for the documents...")
+        success_count = 0
+        error_count = 0
+        with tqdm(total=total_documents, bar_format='{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}]') as pbar:
+            for doc in all_documents:
+                try:
+                    embedding = self.text_embedding(doc['text'])
+                    if embedding is not None:
+                        doc['embedding'] = embedding
+                        success_count += 1
+                    else:
+                        error_count += 1
+                        print(f"{Fore.RED}Error generating embedding for document: {doc['text'][:50]}...{Style.RESET_ALL}")
+                except Exception as e:
+                    error_count += 1
+                    print(f"{Fore.RED}Error processing document: {str(e)}{Style.RESET_ALL}")
+                pbar.update(1)
+                pbar.set_postfix({'Success': success_count, 'Errors': error_count})
+
+        print(f"\n{Fore.GREEN}Documents with successful embeddings: {success_count}{Style.RESET_ALL}")
+        print(f"{Fore.RED}Documents with failed embeddings: {error_count}{Style.RESET_ALL}")
+
+        if success_count == 0:
+            print(f"{Fore.RED}No documents to ingest. Aborting ingestion.{Style.RESET_ALL}")
+            return
+
+        print(f"\n{Fore.YELLOW}Ingesting data into OpenSearch...{Style.RESET_ALL}")
+        actions = []
+        for doc in all_documents:
+            if 'embedding' in doc and doc['embedding'] is not None:
+                action = {
+                    "_op_type": "index",
+                    "_index": self.index_name,
+                    "_source": {
+                        "nominee_text": doc['text'],
+                        "nominee_vector": doc['embedding']
+                    },
+                    "pipeline": self.pipeline_name  # Use the pipeline name specified in the config
+                }
+                actions.append(action)
+
+        success, failed = self.opensearch.bulk_index(actions)
+        print(f"\n{Fore.GREEN}Successfully ingested {success} documents.{Style.RESET_ALL}")
+        print(f"{Fore.RED}Failed to ingest {failed} documents.{Style.RESET_ALL}")
+
+    def create_ingest_pipeline(self, pipeline_id):
+        # Check if pipeline exists
+        try:
+            response = self.opensearch.opensearch_client.ingest.get_pipeline(id=pipeline_id)
+            print(f"\nIngest pipeline '{pipeline_id}' already exists.")
+        except opensearch_exceptions.NotFoundError:
+            # Pipeline does not exist, create it
+            pipeline_body = {
+                "description": "A text chunking ingest pipeline",
+                "processors": [
+                    {
+                        "text_chunking": {
+                            "algorithm": {
+                                "fixed_token_length": {
+                                    "token_limit": 384,
+                                    "overlap_rate": 0.2,
+                                    "tokenizer": "standard"
+                                }
+                            },
+                            "field_map": {
+                                "nominee_text": "passage_chunk"
+                            }
+                        }
+                    }
+                ]
+            }
+            self.opensearch.opensearch_client.ingest.put_pipeline(id=pipeline_id, body=pipeline_body)
+            print(f"\nIngest pipeline '{pipeline_id}' created successfully.")
+        except Exception as e:
+            print(f"\nError checking or creating ingest pipeline: {e}")
 
     def process_file(self, file_path: str) -> List[Dict[str, str]]:
         # Process a file based on its extension
         # Supports CSV, TXT, and PDF files
         # Returns a list of dictionaries containing extracted text
         _, file_extension = os.path.splitext(file_path)
-        
+
         if file_extension.lower() == '.csv':
             return self.process_csv(file_path)
         elif file_extension.lower() == '.txt':
@@ -95,7 +211,6 @@ def process_csv(self, file_path: str) -> List[Dict[str, str]]:
                 documents.append({"text": json.dumps(row)})
         return documents
 
-
     def process_txt(self, file_path: str) -> List[Dict[str, str]]:
         # Process a TXT file
         # Reads the entire content of the file
@@ -139,10 +254,6 @@ def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2)
                     return None
                 output = inference_results[0].get('output')
 
-                # Remove or comment out the debugging print statements
-                # print(f"Output type: {type(output)}")
-                # print(f"Output content: {output}")
-
                 # Adjust the extraction of embedding data
                 if isinstance(output, list) and len(output) > 0:
                     embedding_dict = output[0]
@@ -157,8 +268,6 @@ def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2)
                     print(f"Unexpected embedding output format: {output}")
                     return None
 
-                # Optionally, you can also remove this print statement if you prefer
-                # print(f"Extracted embedding of length {len(embedding)}")
                 return embedding
             except Exception as ex:
                 print(f"Error on attempt {attempt + 1}: {ex}")
@@ -166,122 +275,4 @@ def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2)
                     raise
                 time.sleep(delay)
                 delay *= backoff_factor
-        return None
-    def create_ingest_pipeline(self):
-        pipeline_id = 'text-chunking-ingest-pipeline'
-        # Check if pipeline exists
-        try:
-            response = self.opensearch.opensearch_client.ingest.get_pipeline(id=pipeline_id)
-            print(f"Ingest pipeline '{pipeline_id}' already exists.")
-        except opensearch_exceptions.NotFoundError:
-            # Pipeline does not exist, create it
-            pipeline_body = {
-                "description": "A text chunking ingest pipeline",
-                "processors": [
-                    {
-                        "text_chunking": {
-                            "algorithm": {
-                                "fixed_token_length": {
-                                    "token_limit": 384,
-                                    "overlap_rate": 0.2,
-                                    "tokenizer": "standard"
-                                }
-                            },
-                            "field_map": {
-                                "nominee_text": "passage_chunk"
-                            }
-                        }
-                    }
-                ]
-            }
-            self.opensearch.opensearch_client.ingest.put_pipeline(id=pipeline_id, body=pipeline_body)
-            print(f"Ingest pipeline '{pipeline_id}' created successfully.")
-        except Exception as e:
-            print(f"Error checking or creating ingest pipeline: {e}")
-
-
-    def process_and_ingest_data(self, file_paths: List[str]):
-        if not self.initialize_clients():
-            print("Failed to initialize clients. Aborting ingestion.")
-            return
-
-        # Create the ingest pipeline
-        self.create_ingest_pipeline()
-
-        all_documents = []
-        for file_path in file_paths:
-            print(f"Processing file: {file_path}")
-            documents = self.process_file(file_path)
-            all_documents.extend(documents)
-        
-        total_documents = len(all_documents)
-        print(f"Total documents to process: {total_documents}")
-        
-        print("Generating embeddings for the documents...")
-        success_count = 0
-        error_count = 0
-        with tqdm(total=total_documents, bar_format='{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}]') as pbar:
-            for doc in all_documents:
-                try:
-                    embedding = self.text_embedding(doc['text'])
-                    if embedding is not None:
-                        doc['embedding'] = embedding
-                        success_count += 1
-                    else:
-                        error_count += 1
-                        print(f"{Fore.RED}Error generating embedding for document: {doc['text'][:50]}...{Style.RESET_ALL}")
-                except Exception as e:
-                    error_count += 1
-                    print(f"{Fore.RED}Error processing document: {str(e)}{Style.RESET_ALL}")
-                pbar.update(1)
-                pbar.set_postfix({'Success': success_count, 'Errors': error_count})
-        
-        print(f"\n{Fore.GREEN}Documents with successful embeddings: {success_count}{Style.RESET_ALL}")
-        print(f"{Fore.RED}Documents with failed embeddings: {error_count}{Style.RESET_ALL}")
-        
-        if success_count == 0:
-            print(f"{Fore.RED}No documents to ingest. Aborting ingestion.{Style.RESET_ALL}")
-            return
-        
-        print(f"{Fore.YELLOW}Ingesting data into OpenSearch...{Style.RESET_ALL}")
-        actions = []
-        for doc in all_documents:
-            if 'embedding' in doc and doc['embedding'] is not None:
-                action = {
-                    "_op_type": "index",
-                    "_index": self.index_name,
-                    "_source": {
-                        "nominee_text": doc['text'],
-                        "nominee_vector": doc['embedding']
-                    },
-                    "pipeline": 'text-chunking-ingest-pipeline'  # Use "pipeline" instead of "_pipeline"
-                }
-                actions.append(action)
-        
-        success, failed = self.opensearch.bulk_index(actions)
-        print(f"{Fore.GREEN}Successfully ingested {success} documents.{Style.RESET_ALL}")
-        print(f"{Fore.RED}Failed to ingest {failed} documents.{Style.RESET_ALL}")
-    def ingest_command(self, paths: List[str]):
-        # Main ingestion command
-        # Processes all valid files in the given paths and initiates ingestion
-        all_files = []
-        for path in paths:
-            if os.path.isfile(path):
-                all_files.append(path)
-            elif os.path.isdir(path):
-                for root, dirs, files in os.walk(path):
-                    for file in files:
-                        all_files.append(os.path.join(root, file))
-            else:
-                print(f"{Fore.YELLOW}Invalid path: {path}{Style.RESET_ALL}")
-        
-        supported_extensions = ['.csv', '.txt', '.pdf']
-        valid_files = [f for f in all_files if any(f.lower().endswith(ext) for ext in supported_extensions)]
-        
-        if not valid_files:
-            print(f"{Fore.RED}No valid files found for ingestion.{Style.RESET_ALL}")
-            return
-        
-        print(f"{Fore.GREEN}Found {len(valid_files)} valid files for ingestion.{Style.RESET_ALL}")
-        
-        self.process_and_ingest_data(valid_files)
\ No newline at end of file
+        return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
index 60bd55f3..3215273c 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
@@ -141,16 +141,6 @@ def save_model_id(self, config, save_config_method, model_id):
         save_config_method(config)
 
     def get_custom_model_details(self, default_input):
-        """
-        Prompt the user to enter custom model details or use default.
-        Returns a dictionary with the model details.
-
-        Args:
-            default_input (dict): Default model configuration.
-
-        Returns:
-            dict or None: Custom or default model configuration, or None if invalid input.
-        """
         print("\nDo you want to use the default configuration or provide custom model settings?")
         print("1. Use default configuration")
         print("2. Provide custom model settings")
@@ -167,8 +157,8 @@ def get_custom_model_details(self, default_input):
                 custom_details = json.loads(json_input)
                 return custom_details
             except json.JSONDecodeError as e:
-                print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
+                print(f"Invalid JSON input: {e}")
                 return None
         else:
-            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
-            return None
\ No newline at end of file
+            print("Invalid choice. Aborting model registration.")
+            return None
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CustomPyTorchModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/PyTorchModel.py
similarity index 100%
rename from opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CustomPyTorchModel.py
rename to opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/PyTorchModel.py
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
index bd42276b..ea6600fc 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
@@ -1,4 +1,3 @@
-# ModelRegister.py
 # SPDX-License-Identifier: Apache-2.0
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
@@ -37,7 +36,7 @@
 from ml_models.OpenAIModel import OpenAIModel
 from ml_models.CohereModel import CohereModel
 from ml_models.HuggingFaceModel import HuggingFaceModel
-from ml_models.CustomPyTorchModel import CustomPyTorchModel
+from ml_models.PyTorchModel import CustomPyTorchModel
 import sys
 
 init(autoreset=True)
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
index 3e3ec1d8..59433193 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
@@ -172,4 +172,27 @@ def check_connection(self):
             return True
         except Exception as e:
             print(f"Error connecting to OpenSearch: {e}")
-            return False
\ No newline at end of file
+            return False
+        
+
+    def search_by_vector(self, vector, k=5):
+        try:
+            response = self.opensearch_client.search(
+                index=self.index_name,
+                body={
+                    "size": k,
+                    "_source": ["nominee_text", "passage_chunk"],
+                    "query": {
+                        "knn": {
+                            "nominee_vector": {
+                                "vector": vector,
+                                "k": k
+                            }
+                        }
+                    }
+                }
+            )
+            return response['hits']['hits']
+        except Exception as e:
+            print(f"Error during search: {e}")
+            return []
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
index d1092203..45f5e175 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
@@ -29,6 +29,9 @@
 import requests
 import os
 import urllib3
+import boto3
+import time
+import tiktoken
 
 urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
 
@@ -41,6 +44,20 @@ def __init__(self, config):
         self.index_name = config.get('index_name')
         self.opensearch = OpenSearchConnector(config)
         self.embedding_model_id = config.get('embedding_model_id')
+        self.llm_model_id = config.get('llm_model_id')  # Get the LLM model ID from config
+        self.aws_region = config.get('region')
+        self.bedrock_client = None
+
+        # Initialize the default search method from config
+        self.default_search_method = self.config.get('default_search_method', 'neural')
+
+        # Load LLM configurations from config
+        self.llm_config = {
+            "maxTokenCount": int(config.get('llm_max_token_count', '1000')),
+            "temperature": float(config.get('llm_temperature', '0.7')),
+            "topP": float(config.get('llm_top_p', '0.9')),
+            "stopSequences": [s.strip() for s in config.get('llm_stop_sequences', '').split(',') if s.strip()]
+        }
 
         # Initialize OpenSearch client
         if not self.initialize_clients():
@@ -53,17 +70,52 @@ def __init__(self, config):
             return
 
     def initialize_clients(self):
-        # Initialize OpenSearch client only
+        # Initialize OpenSearch client and Bedrock client if needed
         if self.opensearch.initialize_opensearch_client():
             print("OpenSearch client initialized successfully.")
+            # Initialize Bedrock client only if needed
+            if self.llm_model_id:
+                try:
+                    self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
+                    print("Bedrock client initialized successfully.")
+                except Exception as e:
+                    print(f"Failed to initialize Bedrock client: {e}")
+                    return False
             return True
         else:
             print("Failed to initialize OpenSearch client.")
             return False
 
-    def bulk_query(self, queries, k=5):
-        print("Performing bulk semantic search...")
+    def extract_relevant_sentences(self, query, text):
+        # Lowercase and remove punctuation from query
+        query_processed = ''.join(c.lower() if c.isalnum() or c.isspace() else ' ' for c in query)
+        query_words = set(query_processed.split())
+
+        # Split text into sentences based on punctuation and newlines
+        import re
+        sentences = re.split(r'[\n.!?]+', text)
+
+        sentence_scores = []
+        for sentence in sentences:
+            sentence = sentence.strip()
+            if not sentence:
+                continue
+            # Lowercase and remove punctuation from sentence
+            sentence_processed = ''.join(c.lower() if c.isalnum() or c.isspace() else ' ' for c in sentence)
+            sentence_words = set(sentence_processed.split())
+            common_words = query_words.intersection(sentence_words)
+            score = len(common_words) / (len(query_words) + 1e-6)  # Normalized score
+            if score > 0:
+                sentence_scores.append((score, sentence))
+
+        # Sort sentences by score in descending order
+        sentence_scores.sort(reverse=True)
+
+        # Return the sentences with highest scores
+        top_sentences = [sentence for score, sentence in sentence_scores]
+        return top_sentences
 
+    def bulk_query_neural(self, queries, k=5):
         results = []
         for query_text in queries:
             try:
@@ -99,56 +151,210 @@ def bulk_query(self, queries, k=5):
 
         return results
 
+    def bulk_query_semantic(self, queries, k=5):
+        # Generate embeddings for queries and search OpenSearch index
+        # Returns a list of results containing query, context, and number of results
+        query_vectors = []
+        for query in queries:
+            embedding = self.text_embedding(query)
+            if embedding:
+                query_vectors.append(embedding)
+            else:
+                print(f"{Fore.RED}Failed to generate embedding for query: {query}{Style.RESET_ALL}")
+                query_vectors.append(None)
 
-    def extract_relevant_sentences(self, query, text):
-        # Lowercase and remove punctuation from query
-        query_processed = ''.join(c.lower() if c.isalnum() or c.isspace() else ' ' for c in query)
-        query_words = set(query_processed.split())
+        results = []
+        for i, vector in enumerate(query_vectors):
+            if vector is None:
+                results.append({
+                    'query': queries[i],
+                    'context': "",
+                    'num_results': 0
+                })
+                continue
+            try:
+                hits = self.opensearch.search_by_vector(vector, k)
+                context = '\n'.join([hit['_source']['nominee_text'] for hit in hits])
+                results.append({
+                    'query': queries[i],
+                    'context': context,
+                    'num_results': len(hits)
+                })
+            except Exception as ex:
+                print(f"{Fore.RED}Error performing search for query '{queries[i]}': {ex}{Style.RESET_ALL}")
+                results.append({
+                    'query': queries[i],
+                    'context': "",
+                    'num_results': 0
+                })
+        return results
 
-        # Split text into sentences based on punctuation and newlines
-        import re
-        sentences = re.split(r'[\n.!?]+', text)
+    def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
+        if self.opensearch.opensearch_client is None:
+            print("OpenSearch client is not initialized. Please run setup first.")
+            return None
 
-        sentence_scores = []
-        for sentence in sentences:
-            sentence = sentence.strip()
-            if not sentence:
-                continue
-            # Lowercase and remove punctuation from sentence
-            sentence_processed = ''.join(c.lower() if c.isalnum() or c.isspace() else ' ' for c in sentence)
-            sentence_words = set(sentence_processed.split())
-            common_words = query_words.intersection(sentence_words)
-            score = len(common_words) / (len(query_words) + 1e-6)  # Normalized score
-            if score > 0:
-                sentence_scores.append((score, sentence))
+        delay = initial_delay
+        for attempt in range(max_retries):
+            try:
+                payload = {
+                    "text_docs": [text]
+                }
+                response = self.opensearch.opensearch_client.transport.perform_request(
+                    method="POST",
+                    url=f"/_plugins/_ml/_predict/text_embedding/{self.embedding_model_id}",
+                    body=payload
+                )
+                inference_results = response.get('inference_results', [])
+                if not inference_results:
+                    print(f"No inference results returned for text: {text}")
+                    return None
+                output = inference_results[0].get('output')
 
-        # Sort sentences by score in descending order
-        sentence_scores.sort(reverse=True)
+                # Adjust the extraction of embedding data
+                if isinstance(output, list) and len(output) > 0:
+                    embedding_dict = output[0]
+                    if isinstance(embedding_dict, dict) and 'data' in embedding_dict:
+                        embedding = embedding_dict['data']
+                    else:
+                        print(f"Unexpected embedding output format: {output}")
+                        return None
+                elif isinstance(output, dict) and 'data' in output:
+                    embedding = output['data']
+                else:
+                    print(f"Unexpected embedding output format: {output}")
+                    return None
+
+                # Verify that embedding is a list of floats
+                if not isinstance(embedding, list) or not all(isinstance(x, (float, int)) for x in embedding):
+                    print(f"Embedding is not a list of floats: {embedding}")
+                    return None
+
+                return embedding
+            except Exception as ex:
+                print(f"Error on attempt {attempt + 1}: {ex}")
+                if attempt == max_retries - 1:
+                    raise
+                time.sleep(delay)
+                delay *= backoff_factor
+        return None
+
+    def generate_answer(self, prompt, llm_config):
+        # Generate an answer using the LLM model
+        # Handles token limit and configures LLM parameters
+        # Returns the generated answer or None if an error occurs
+        try:
+            max_input_tokens = 8192  # Max tokens for the model
+            expected_output_tokens = llm_config.get('maxTokenCount', 1000)
+            # Adjust the encoding based on the model
+            encoding = tiktoken.get_encoding("cl100k_base")  # Use appropriate encoding
+
+            prompt_tokens = encoding.encode(prompt)
+            allowable_input_tokens = max_input_tokens - expected_output_tokens
+
+            if len(prompt_tokens) > allowable_input_tokens:
+                # Truncate the prompt to fit within the model's token limit
+                prompt_tokens = prompt_tokens[:allowable_input_tokens]
+                prompt = encoding.decode(prompt_tokens)
+                print(f"Prompt truncated to {allowable_input_tokens} tokens.")
+
+            # Simplified LLM config with only supported parameters
+            llm_config = {
+                'maxTokenCount': expected_output_tokens,
+                'temperature': llm_config.get('temperature', 0.7),
+                'topP': llm_config.get('topP', 1.0),
+                'stopSequences': llm_config.get('stopSequences', [])
+            }
+
+            body = json.dumps({
+                'inputText': prompt,
+                'textGenerationConfig': llm_config
+            })
+            response = self.bedrock_client.invoke_model(modelId=self.llm_model_id, body=body)
+            response_body = json.loads(response['body'].read())
+            results = response_body.get('results', [])
+            if not results:
+                print("No results returned from LLM.")
+                return None
+            answer = results[0].get('outputText', '').strip()
+            return answer
+        except Exception as ex:
+            print(f"Error generating answer from LLM: {ex}")
+            return None
 
-        # Return the sentences with highest scores
-        top_sentences = [sentence for score, sentence in sentence_scores]
-        return top_sentences
     def query_command(self, queries: List[str], num_results=5):
-        results = self.bulk_query(queries, k=num_results)
-
-        for result in results:
-            print(f"\nQuery: {result['query']}")
-            if result['documents']:
-                all_relevant_sentences = []
-                for doc in result['documents']:
-                    passage_chunks = doc['source'].get('passage_chunk', [])
-                    if not passage_chunks:
+        search_method = self.default_search_method
+
+        print(f"\nUsing the default search method: {search_method.capitalize()} Search")
+
+        # Keep the session active until the user types 'exit' or presses Enter without input
+        while True:
+            if not queries:
+                query_text = input("\nEnter a query (or type 'exit' to finish): ").strip()
+                if not query_text or query_text.lower() == 'exit':
+                    print("\nExiting query session.")
+                    break
+                queries = [query_text]
+
+            if search_method == 'neural':
+                # Proceed with neural search
+                results = self.bulk_query_neural(queries, k=num_results)
+
+                for result in results:
+                    print(f"\nQuery: {result['query']}")
+                    if result['documents']:
+                        all_relevant_sentences = []
+                        for doc in result['documents']:
+                            passage_chunks = doc['source'].get('passage_chunk', [])
+                            if not passage_chunks:
+                                continue
+                            for passage in passage_chunks:
+                                relevant_sentences = self.extract_relevant_sentences(result['query'], passage)
+                                all_relevant_sentences.extend(relevant_sentences)
+
+                        if all_relevant_sentences:
+                            # Output the top relevant sentences
+                            print("\nAnswer:")
+                            for sentence in all_relevant_sentences[:1]:  # Display the top sentence
+                                print(sentence)
+                        else:
+                            print("\nNo relevant sentences found.")
+                    else:
+                        print("\nNo documents found for this query.")
+            elif search_method == 'semantic':
+                # Proceed with semantic search
+                if not self.bedrock_client or not self.llm_model_id:
+                    print(f"\n{Fore.RED}LLM model is not configured. Please run setup to select an LLM model.{Style.RESET_ALL}")
+                    return
+
+                # Use the LLM configurations from setup
+                llm_config = self.llm_config
+
+                results = self.bulk_query_semantic(queries, k=num_results)
+
+                for result in results:
+                    print(f"\nQuery: {result['query']}")
+                    print(f"Found {result['num_results']} results.")
+
+                    if not result['context']:
+                        print(f"\n{Fore.RED}No context available for this query.{Style.RESET_ALL}")
                         continue
-                    for passage in passage_chunks:
-                        relevant_sentences = self.extract_relevant_sentences(result['query'], passage)
-                        all_relevant_sentences.extend(relevant_sentences)
-
-                if all_relevant_sentences:
-                    # Output the top relevant sentences
-                    print("Answer:")
-                    for sentence in all_relevant_sentences[:1]:  # Display the top sentence
-                        print(sentence)
-                else:
-                    print("No relevant sentences found.")
-            else:
-                print("No documents found for this query.")
\ No newline at end of file
+
+                    augmented_prompt = f"""Context: {result['context']}
+Based on the above context, please provide a detailed and insightful answer to the following question. Feel free to make reasonable inferences or connections if the context doesn't provide all the information:
+
+Question: {result['query']}
+
+Answer:"""
+
+                    print("\nGenerating answer using LLM...")
+                    answer = self.generate_answer(augmented_prompt, llm_config)
+
+                    if answer:
+                        print("\nGenerated Answer:")
+                        print(answer)
+                    else:
+                        print("\nFailed to generate an answer.")
+
+            # After processing, reset queries to allow for the next input
+            queries = []
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index 03577be0..623a4922 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -2,22 +2,25 @@
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
-# Any modifications Copyright OpenSearch Contributors.
-# See GitHub history for details.
-# Licensed to Elasticsearch B.V. under one or more contributor
-# license agreements. See the NOTICE file distributed with
-# this work for additional information regarding copyright
-# ownership. Elasticsearch B.V. licenses this file to you under
-# the Apache License, Version 2.0 (the "License"); you may
-# not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-# http://www.apache.org/licenses/LICENSE-2.0
-# Unless required by applicable law or agreed to in writing,
-# software distributed under the License is distributed on an
-# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-# KIND, either express or implied. See the License for the
-# specific language governing permissions and limitations
-# under the License.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
 
 import boto3
 import botocore
@@ -32,11 +35,13 @@
 import sys
 from urllib.parse import urlparse
 from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth
-from AIConnectorHelper import AIConnectorHelper
-from model_register import ModelRegister
 from colorama import Fore, Style, init
 import ssl
 
+from serverless import Serverless  
+from AIConnectorHelper import AIConnectorHelper 
+from model_register import ModelRegister
+
 init(autoreset=True)
 
 class Setup:
@@ -47,8 +52,8 @@ class Setup:
     def __init__(self):
         # Initialize setup variables
         self.config = self.load_config()
-        self.aws_region = self.config.get('region')
-        self.iam_principal = self.config.get('iam_principal')
+        self.aws_region = self.config.get('region', 'us-west-2')
+        self.iam_principal = self.config.get('iam_principal', '')
         self.collection_name = self.config.get('collection_name', '')
         self.opensearch_endpoint = self.config.get('opensearch_endpoint', '')
         self.service_type = self.config.get('service_type', 'managed')
@@ -60,15 +65,18 @@ def __init__(self):
         self.opensearch_client = None
         self.opensearch_domain_name = self.get_opensearch_domain_name()
         self.model_register = None
+        self.serverless = None  # Will be initialized if service_type is 'serverless'
 
     def check_and_configure_aws(self):
-        # Check if AWS credentials are configured and offer to reconfigure if needed
+        """
+        Check if AWS credentials are configured and offer to reconfigure if needed.
+        """
         try:
             session = boto3.Session()
             credentials = session.get_credentials()
 
             if credentials is None:
-                print("AWS credentials are not configured.")
+                print(f"{Fore.YELLOW}AWS credentials are not configured.{Style.RESET_ALL}")
                 self.configure_aws()
             else:
                 print("AWS credentials are already configured.")
@@ -76,16 +84,18 @@ def check_and_configure_aws(self):
                 if reconfigure == 'yes':
                     self.configure_aws()
         except Exception as e:
-            print(f"An error occurred while checking AWS credentials: {e}")
+            print(f"{Fore.RED}An error occurred while checking AWS credentials: {e}{Style.RESET_ALL}")
             self.configure_aws()
 
     def configure_aws(self):
-        # Configure AWS credentials using user input
+        """
+        Configure AWS credentials using user input.
+        """
         print("Let's configure your AWS credentials.")
 
-        aws_access_key_id = input("Enter your AWS Access Key ID: ")
-        aws_secret_access_key = input("Enter your AWS Secret Access Key: ")
-        aws_region_input = input("Enter your preferred AWS region (e.g., us-west-2): ")
+        aws_access_key_id = input("Enter your AWS Access Key ID: ").strip()
+        aws_secret_access_key = input("Enter your AWS Secret Access Key: ").strip()
+        aws_region_input = input("Enter your preferred AWS region (e.g., us-west-2): ").strip()
 
         try:
             subprocess.run([
@@ -103,30 +113,31 @@ def configure_aws(self):
                 'region', aws_region_input
             ], check=True)
             
-            print("AWS credentials have been successfully configured.")
+            print(f"{Fore.GREEN}AWS credentials have been successfully configured.{Style.RESET_ALL}")
         except subprocess.CalledProcessError as e:
-            print(f"An error occurred while configuring AWS credentials: {e}")
+            print(f"{Fore.RED}An error occurred while configuring AWS credentials: {e}{Style.RESET_ALL}")
         except Exception as e:
-            print(f"An unexpected error occurred: {e}")
+            print(f"{Fore.RED}An unexpected error occurred: {e}{Style.RESET_ALL}")
 
     def load_config(self):
-        # Load configuration from the config file
+        """
+        Load configuration from the config file.
+
+        :return: Dictionary of configuration parameters
+        """
         config = configparser.ConfigParser()
         if os.path.exists(self.CONFIG_FILE):
             config.read(self.CONFIG_FILE)
             return dict(config['DEFAULT'])
         return {}
 
-    def save_config(self, config):
-        # Save configuration to the config file
-        parser = configparser.ConfigParser()
-        parser['DEFAULT'] = config
-        with open(self.CONFIG_FILE, 'w') as f:
-            parser.write(f)
-
     def get_password_with_asterisks(self, prompt="Enter password: "):
-        # Get password input from user, masking it with asterisks
-        import sys
+        """
+        Get password input from user, masking it with asterisks.
+
+        :param prompt: Prompt message
+        :return: Entered password as a string
+        """
         if sys.platform == 'win32':
             import msvcrt
             print(prompt, end='', flush=True)
@@ -172,15 +183,19 @@ def get_password_with_asterisks(self, prompt="Enter password: "):
                 termios.tcsetattr(fd, termios.TCSADRAIN, old_settings)
 
     def setup_configuration(self):
-        # Set up the configuration by prompting the user for various settings
+        """
+        Set up the configuration by prompting the user for various settings.
+        """
         config = self.load_config()
 
+        print("\nStarting setup process...")
+
         # First, prompt for service type
-        print("Choose OpenSearch service type:")
+        print("\nChoose OpenSearch service type:")
         print("1. Serverless")
         print("2. Managed")
         print("3. Open-source")
-        service_choice = input("Enter your choice (1-3): ")
+        service_choice = input("Enter your choice (1-3): ").strip()
 
         if service_choice == '1':
             self.service_type = 'serverless'
@@ -189,7 +204,7 @@ def setup_configuration(self):
         elif service_choice == '3':
             self.service_type = 'open-source'
         else:
-            print("Invalid choice. Defaulting to 'managed'")
+            print(f"\n{Fore.YELLOW}Invalid choice. Defaulting to 'managed'.{Style.RESET_ALL}")
             self.service_type = 'managed'
 
         # Based on service type, prompt for different configurations
@@ -197,27 +212,27 @@ def setup_configuration(self):
             # For 'serverless' and 'managed', prompt for AWS credentials and related info
             self.check_and_configure_aws()
 
-            self.aws_region = input(f"Enter your AWS Region [{config.get('region', 'us-west-2')}]: ") or config.get('region', 'us-west-2')
-            self.iam_principal = input(f"Enter your IAM Principal ARN [{config.get('iam_principal', '')}]: ") or config.get('iam_principal', '')
+            self.aws_region = input(f"\nEnter your AWS Region [{self.aws_region}]: ").strip() or self.aws_region
+            self.iam_principal = input(f"Enter your IAM Principal ARN [{self.iam_principal}]: ").strip() or self.iam_principal
 
             if self.service_type == 'serverless':
-                self.collection_name = input("Enter the name for your OpenSearch collection: ")
+                self.collection_name = input("\nEnter the name for your OpenSearch collection: ").strip()
                 self.opensearch_endpoint = None
                 self.opensearch_username = None
                 self.opensearch_password = None
             elif self.service_type == 'managed':
-                self.opensearch_endpoint = input("Enter your OpenSearch domain endpoint: ")
-                self.opensearch_username = input("Enter your OpenSearch username: ")
+                self.opensearch_endpoint = input("\nEnter your OpenSearch domain endpoint: ").strip()
+                self.opensearch_username = input("Enter your OpenSearch username: ").strip()
                 self.opensearch_password = self.get_password_with_asterisks("Enter your OpenSearch password: ")
                 self.collection_name = ''
         elif self.service_type == 'open-source':
             # For 'open-source', skip AWS configurations
             print("\n--- Open-source OpenSearch Setup ---")
             default_endpoint = 'https://localhost:9200'
-            self.opensearch_endpoint = input(f"Press Enter to use the default endpoint (or type your custom endpoint) [{default_endpoint}]: ").strip() or default_endpoint
+            self.opensearch_endpoint = input(f"\nPress Enter to use the default endpoint (or type your custom endpoint) [{default_endpoint}]: ").strip() or default_endpoint
             auth_required = input("Does your OpenSearch instance require authentication? (yes/no): ").strip().lower()
             if auth_required == 'yes':
-                self.opensearch_username = input("Enter your OpenSearch username: ")
+                self.opensearch_username = input("Enter your OpenSearch username: ").strip()
                 self.opensearch_password = self.get_password_with_asterisks("Enter your OpenSearch password: ")
             else:
                 self.opensearch_username = None
@@ -237,11 +252,96 @@ def setup_configuration(self):
             'opensearch_username': self.opensearch_username if self.opensearch_username else '',
             'opensearch_password': self.opensearch_password if self.opensearch_password else ''
         }
+
+        # Now, prompt for default search method
+        print("\nChoose the default search method:")
+        print("1. Neural Search")
+        print("2. Semantic Search")
+        search_choice = input("Enter your choice (1-2): ").strip()
+
+        if search_choice == '1':
+            default_search_method = 'neural'
+        elif search_choice == '2':
+            default_search_method = 'semantic'
+        else:
+            print(f"\n{Fore.YELLOW}Invalid choice. Defaulting to 'neural'.{Style.RESET_ALL}")
+            default_search_method = 'neural'
+
+        self.config['default_search_method'] = default_search_method
+
+        if default_search_method == 'semantic':
+            # Prompt the user to select an LLM model for semantic search
+            print("\nSelect an LLM model for semantic search:")
+            available_models = [
+                ("amazon.titan-text-lite-v1", "Bedrock Titan Text Lite V1"),
+                ("amazon.titan-text-express-v1", "Bedrock Titan Text Express V1"),
+                ("anthropic.claude-3-5-sonnet-20240620-v1:0", "Anthropic Claude 3.5 Sonnet"),
+                ("anthropic.claude-3-opus-20240229-v1:0", "Anthropic Claude 3 Opus"),
+                ("cohere.command-r-plus-v1:0", "Cohere Command R Plus V1"),
+                ("cohere.command-r-v1:0", "Cohere Command R V1")
+            ]
+            for idx, (model_id, model_name) in enumerate(available_models, start=1):
+                print(f"{idx}. {model_name} ({model_id})")
+            model_choice = input(f"\nEnter the number of your chosen model (1-{len(available_models)}): ").strip()
+            try:
+                model_choice_idx = int(model_choice) - 1
+                if 0 <= model_choice_idx < len(available_models):
+                    selected_model_id = available_models[model_choice_idx][0]
+                    self.config['llm_model_id'] = selected_model_id
+                    print(f"\nSelected LLM Model ID: {selected_model_id}")
+                else:
+                    print(f"\n{Fore.YELLOW}Invalid choice. Defaulting to '{available_models[0][0]}'.{Style.RESET_ALL}")
+                    self.config['llm_model_id'] = available_models[0][0]
+            except ValueError:
+                print(f"\n{Fore.YELLOW}Invalid input. Defaulting to '{available_models[0][0]}'.{Style.RESET_ALL}")
+                self.config['llm_model_id'] = available_models[0][0]
+
+            # Prompt for LLM configurations
+            print("\nConfigure LLM settings:")
+            try:
+                maxTokenCount = int(input("Enter max token count [1000]: ").strip() or "1000")
+            except ValueError:
+                maxTokenCount = 1000
+            try:
+                temperature = float(input("Enter temperature [0.7]: ").strip() or "0.7")
+            except ValueError:
+                temperature = 0.7
+            try:
+                topP = float(input("Enter topP [0.9]: ").strip() or "0.9")
+            except ValueError:
+                topP = 0.9
+            stopSequences_input = input("Enter stop sequences (comma-separated) or press Enter for none: ").strip()
+            if stopSequences_input:
+                stopSequences = [s.strip() for s in stopSequences_input.split(',')]
+            else:
+                stopSequences = []
+
+            # Save LLM configurations to config
+            self.config['llm_max_token_count'] = str(maxTokenCount)
+            self.config['llm_temperature'] = str(temperature)
+            self.config['llm_top_p'] = str(topP)
+            self.config['llm_stop_sequences'] = ','.join(stopSequences)
+
+        # Prompt for ingest pipeline name
+        default_pipeline_name = 'text-chunking-ingest-pipeline'
+        pipeline_name = input(f"\nEnter the name of the ingest pipeline to use [{default_pipeline_name}]: ").strip()
+        if not pipeline_name:
+            pipeline_name = default_pipeline_name
+
+        # Save the pipeline name to config
+        self.config['ingest_pipeline_name'] = pipeline_name
+
+        # Save the configuration
         self.save_config(self.config)
-        print("Configuration saved successfully.\n")
+        print(f"\n{Fore.GREEN}Configuration saved successfully to {os.path.abspath(self.CONFIG_FILE)}.{Style.RESET_ALL}\n")
+
 
     def initialize_clients(self):
-        # Initialize AWS clients (AOSS and Bedrock) only if not open-source
+        """
+        Initialize AWS clients (AOSS and Bedrock) only if not open-source.
+
+        :return: True if clients initialized successfully or open-source, False otherwise
+        """
         if self.service_type == 'open-source':
             return True  # No AWS clients needed
 
@@ -255,103 +355,18 @@ def initialize_clients(self):
                 self.aoss_client = boto3.client(self.SERVICE_AOSS, config=boto_config)
             self.bedrock_client = boto3.client(self.SERVICE_BEDROCK, region_name=self.aws_region)
             
-            time.sleep(7)
-            print("AWS clients initialized successfully.\n")
+            time.sleep(7)  # Wait for clients to initialize
+            print(f"{Fore.GREEN}AWS clients initialized successfully.{Style.RESET_ALL}\n")
             return True
         except Exception as e:
-            print(f"Failed to initialize AWS clients: {e}")
+            print(f"{Fore.RED}Failed to initialize AWS clients: {e}{Style.RESET_ALL}")
             return False
 
-    def create_security_policies(self):
-        # Create security policies for serverless OpenSearch
-        if not self.is_serverless:
-            print("Security policies are not applicable for managed OpenSearch domains.\n")
-            return
-        
-        encryption_policy = json.dumps({
-            "Rules": [{"Resource": [f"collection/{self.collection_name}"], "ResourceType": "collection"}],
-            "AWSOwnedKey": True
-        })
-        
-        network_policy = json.dumps([{
-            "Rules": [{"Resource": [f"collection/{self.collection_name}"], "ResourceType": "collection"}],
-            "AllowFromPublic": True
-        }])
-        
-        data_access_policy = json.dumps([{
-            "Rules": [
-                {"Resource": ["collection/*"], "Permission": ["aoss:*"], "ResourceType": "collection"},
-                {"Resource": ["index/*/*"], "Permission": ["aoss:*"], "ResourceType": "index"}
-            ],
-            "Principal": [self.iam_principal],
-            "Description": f"Data access policy for {self.collection_name}"
-        }])
-        
-        encryption_policy_name = self.get_truncated_name(f"{self.collection_name}-enc-policy")
-        self.create_security_policy("encryption", encryption_policy_name, f"{self.collection_name} encryption security policy", encryption_policy)
-        self.create_security_policy("network", f"{self.collection_name}-net-policy", f"{self.collection_name} network security policy", network_policy)
-        self.create_access_policy(self.get_truncated_name(f"{self.collection_name}-access-policy"), f"{self.collection_name} data access policy", data_access_policy)
-
-    def create_security_policy(self, policy_type, name, description, policy_body):
-        # Create a specific security policy (encryption or network)
-        try:
-            if policy_type.lower() == "encryption":
-                self.aoss_client.create_security_policy(description=description, name=name, policy=policy_body, type="encryption")
-            elif policy_type.lower() == "network":
-                self.aoss_client.create_security_policy(description=description, name=name, policy=policy_body, type="network")
-            else:
-                raise ValueError("Invalid policy type specified.")
-            print(f"{policy_type.capitalize()} Policy '{name}' created successfully.")
-        except self.aoss_client.exceptions.ConflictException:
-            print(f"{policy_type.capitalize()} Policy '{name}' already exists.")
-        except Exception as ex:
-            print(f"Error creating {policy_type} policy '{name}': {ex}")
-
-    def create_access_policy(self, name, description, policy_body):
-        # Create a data access policy
-        try:
-            self.aoss_client.create_access_policy(description=description, name=name, policy=policy_body, type="data")
-            print(f"Data Access Policy '{name}' created successfully.\n")
-        except self.aoss_client.exceptions.ConflictException:
-            print(f"Data Access Policy '{name}' already exists.\n")
-        except Exception as ex:
-            print(f"Error creating data access policy '{name}': {ex}\n")
-
-    def create_collection(self, collection_name, max_retries=3):
-        # Create an OpenSearch serverless collection
-        for attempt in range(max_retries):
-            try:
-                response = self.aoss_client.create_collection(
-                    description=f"{collection_name} collection",
-                    name=collection_name,
-                    type="VECTORSEARCH"
-                )
-                print(f"Collection '{collection_name}' creation initiated.")
-                return response['createCollectionDetail']['id']
-            except self.aoss_client.exceptions.ConflictException:
-                print(f"Collection '{collection_name}' already exists.")
-                return self.get_collection_id(collection_name)
-            except Exception as ex:
-                print(f"Error creating collection '{collection_name}' (Attempt {attempt+1}/{max_retries}): {ex}")
-                if attempt == max_retries - 1:
-                    return None
-                time.sleep(5)
-        return None
-
-    def get_collection_id(self, collection_name):
-        # Retrieve the ID of an existing collection
-        try:
-            response = self.aoss_client.list_collections()
-            for collection in response['collectionSummaries']:
-                if collection['name'] == collection_name:
-                    return collection['id']
-        except Exception as ex:
-            print(f"Error getting collection ID: {ex}")
-        return None
-
     def get_opensearch_domain_name(self):
         """
         Extract the domain name from the OpenSearch endpoint URL.
+
+        :return: Domain name if extraction is successful, None otherwise
         """
         if self.opensearch_endpoint:
             parsed_url = urlparse(self.opensearch_endpoint)
@@ -373,6 +388,10 @@ def get_opensearch_domain_name(self):
     def get_opensearch_domain_info(region, domain_name):
         """
         Retrieve the OpenSearch domain endpoint and ARN based on the domain name and region.
+
+        :param region: AWS region
+        :param domain_name: Name of the OpenSearch domain
+        :return: Tuple of (domain_endpoint, domain_arn) if successful, (None, None) otherwise
         """
         try:
             client = boto3.client('opensearch', region_name=region)
@@ -382,94 +401,39 @@ def get_opensearch_domain_info(region, domain_name):
             domain_arn = domain_status['ARN']
             return domain_endpoint, domain_arn
         except Exception as e:
-            print(f"Error retrieving OpenSearch domain info: {e}")
+            print(f"{Fore.RED}Error retrieving OpenSearch domain info: {e}{Style.RESET_ALL}")
             return None, None
 
-    def wait_for_collection_active(self, collection_id, max_wait_minutes=30):
-        # Wait for the collection to become active
-        print(f"Waiting for collection '{self.collection_name}' to become active...")
-        start_time = time.time()
-        while time.time() - start_time < max_wait_minutes * 60:
-            try:
-                response = self.aoss_client.batch_get_collection(ids=[collection_id])
-                status = response['collectionDetails'][0]['status']
-                if status == 'ACTIVE':
-                    print(f"Collection '{self.collection_name}' is now active.\n")
-                    return True
-                elif status in ['FAILED', 'DELETED']:
-                    print(f"Collection creation failed or was deleted. Status: {status}\n")
-                    return False
-                else:
-                    print(f"Collection status: {status}. Waiting...")
-                    time.sleep(30)
-            except Exception as ex:
-                print(f"Error checking collection status: {ex}")
-                time.sleep(30)
-        print(f"Timed out waiting for collection to become active after {max_wait_minutes} minutes.\n")
-        return False
-
-    def get_collection_endpoint(self):
-        # Retrieve the endpoint URL for the OpenSearch collection
-        if not self.is_serverless:
-            return self.opensearch_endpoint
-        
-        try:
-            collection_id = self.get_collection_id(self.collection_name)
-            if not collection_id:
-                print(f"Collection '{self.collection_name}' not found.\n")
-                return None
-            
-            batch_get_response = self.aoss_client.batch_get_collection(ids=[collection_id])
-            collection_details = batch_get_response.get('collectionDetails', [])
-            
-            if not collection_details:
-                print(f"No details found for collection ID '{collection_id}'.\n")
-                return None
-            
-            self.opensearch_endpoint = collection_details[0].get('collectionEndpoint')
-            if self.opensearch_endpoint:
-                print(f"Collection '{self.collection_name}' has endpoint URL: {self.opensearch_endpoint}\n")
-                return self.opensearch_endpoint
-            else:
-                print(f"No endpoint URL found in collection '{self.collection_name}'.\n")
-                return None
-        except Exception as ex:
-            print(f"Error retrieving collection endpoint: {ex}\n")
-            return None
-
-    def get_iam_user_name_from_arn(self, iam_principal_arn):
-        """
-        Extract the IAM user name from the IAM principal ARN.
-        """
-        # IAM user ARN format: arn:aws:iam::123456789012:user/user-name
-        if iam_principal_arn and ':user/' in iam_principal_arn:
-            return iam_principal_arn.split(':user/')[-1]
-        else:
-            return None
-
     def initialize_opensearch_client(self):
-        # Initialize the OpenSearch client
         if not self.opensearch_endpoint:
-            print("OpenSearch endpoint not set. Please run setup first.\n")
+            print(f"{Fore.RED}OpenSearch endpoint not set. Please run setup first.{Style.RESET_ALL}\n")
             return False
 
         parsed_url = urlparse(self.opensearch_endpoint)
         host = parsed_url.hostname
         port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)  # Default ports
 
-        if self.service_type in ['managed', 'serverless']:
+        if self.service_type == 'serverless':
             credentials = boto3.Session().get_credentials()
-            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss') if self.is_serverless else AWSV4SignerAuth(credentials, self.aws_region, 'es')
-        else:
+            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
+        elif self.service_type == 'managed':
             if not self.opensearch_username or not self.opensearch_password:
-                print("OpenSearch username or password not set. Please run setup first.\n")
+                print(f"{Fore.RED}OpenSearch username or password not set. Please run setup first.{Style.RESET_ALL}\n")
                 return False
             auth = (self.opensearch_username, self.opensearch_password)
+        elif self.service_type == 'open-source':
+            if self.opensearch_username and self.opensearch_password:
+                auth = (self.opensearch_username, self.opensearch_password)
+            else:
+                auth = None  # No authentication
+        else:
+            print("Invalid service type. Please check your configuration.")
+            return False
 
         use_ssl = parsed_url.scheme == 'https'
         verify_certs = False if use_ssl else True
 
-        # Create an SSL context that does not verify certificates
+        # Create an SSL context that does not verify certificates if needed
         if use_ssl and not verify_certs:
             ssl_context = ssl.create_default_context()
             ssl_context.check_hostname = False
@@ -488,17 +452,21 @@ def initialize_opensearch_client(self):
                 connection_class=RequestsHttpConnection,
                 pool_maxsize=20
             )
-            print(f"Initialized OpenSearch client with host: {host} and port: {port}\n")
+            print(f"{Fore.GREEN}Initialized OpenSearch client with host: {host} and port: {port}{Style.RESET_ALL}\n")
             return True
         except Exception as ex:
-            print(f"Error initializing OpenSearch client: {ex}\n")
+            print(f"{Fore.RED}Error initializing OpenSearch client: {ex}{Style.RESET_ALL}\n")
             return False
-
+        
     def get_knn_index_details(self):
-        # Prompt user for KNN index details (embedding dimension, space type, and ef_construction)
-        dimension_input = input("Press Enter to use the default embedding size (768), or type a custom size: ")
+        """
+        Prompt user for KNN index details (embedding dimension, space type, and ef_construction).
+
+        :return: Tuple of (embedding_dimension, space_type, ef_construction)
+        """
+        dimension_input = input("Press Enter to use the default embedding size (768), or type a custom size: ").strip()
         
-        if dimension_input.strip() == "":
+        if dimension_input == "":
             embedding_dimension = 768
         else:
             try:
@@ -513,7 +481,7 @@ def get_knn_index_details(self):
         print("1. L2 (Euclidean distance)")
         print("2. Cosine similarity")
         print("3. Inner product")
-        space_choice = input("Enter your choice (1-3), or press Enter for default (L2): ")
+        space_choice = input("Enter your choice (1-3), or press Enter for default (L2): ").strip()
 
         if space_choice == "" or space_choice == "1":
             space_type = "l2"
@@ -528,9 +496,9 @@ def get_knn_index_details(self):
         print(f"Space type set to: {space_type}")
 
         # New prompt for ef_construction
-        ef_construction_input = input("\nPress Enter to use the default ef_construction value (512), or type a custom value: ")
+        ef_construction_input = input("\nPress Enter to use the default ef_construction value (512), or type a custom value: ").strip()
         
-        if ef_construction_input.strip() == "":
+        if ef_construction_input == "":
             ef_construction = 512
         else:
             try:
@@ -542,9 +510,27 @@ def get_knn_index_details(self):
         print(f"ef_construction set to: {ef_construction}\n")
 
         return embedding_dimension, space_type, ef_construction
+    def save_config(self, config):
+        """
+        Save configuration to the config file.
 
+        :param config: Dictionary of configuration parameters
+        """
+        parser = configparser.ConfigParser()
+        parser['DEFAULT'] = config
+        config_path = os.path.abspath(self.CONFIG_FILE)
+        with open(self.CONFIG_FILE, 'w') as f:
+            parser.write(f)
+        # Removed duplicate message
+        # Only one message is printed where this method is called
     def create_index(self, embedding_dimension, space_type, ef_construction):
-        # Create the KNN index in OpenSearch
+        """
+        Create the KNN index in OpenSearch.
+
+        :param embedding_dimension: Dimension of the embedding vectors
+        :param space_type: Type of space for KNN
+        :param ef_construction: ef_construction parameter for KNN
+        """
         index_body = {
             "mappings": {
                 "properties": {
@@ -571,112 +557,110 @@ def create_index(self, embedding_dimension, space_type, ef_construction):
         }
         try:
             self.opensearch_client.indices.create(index=self.index_name, body=index_body)
-            print(f"KNN index '{self.index_name}' created successfully with dimension {embedding_dimension}, space type {space_type}, and ef_construction {ef_construction}.\n")
+            print(f"\n{Fore.GREEN}KNN index '{self.index_name}' created successfully with dimension {embedding_dimension}, space type {space_type}, and ef_construction {ef_construction}.{Style.RESET_ALL}\n")
         except Exception as e:
             if 'resource_already_exists_exception' in str(e).lower():
-                print(f"Index '{self.index_name}' already exists.\n")
+                print(f"\n{Fore.YELLOW}Index '{self.index_name}' already exists.{Style.RESET_ALL}\n")
             else:
-                print(f"Error creating index '{self.index_name}': {e}\n")
+                print(f"\n{Fore.RED}Error creating index '{self.index_name}': {e}{Style.RESET_ALL}\n")
 
     def verify_and_create_index(self, embedding_dimension, space_type, ef_construction):
+        """
+        Verify if the index exists; if not, create it.
+
+        :param embedding_dimension: Dimension of the embedding vectors
+        :param space_type: Type of space for KNN
+        :param ef_construction: ef_construction parameter for KNN
+        :return: True if index exists or is created successfully, False otherwise
+        """
         try:
             print(f"Attempting to verify index '{self.index_name}'...")
             index_exists = self.opensearch_client.indices.exists(index=self.index_name)
             if index_exists:
-                print(f"KNN index '{self.index_name}' already exists.\n")
+                print(f"{Fore.GREEN}KNN index '{self.index_name}' already exists.{Style.RESET_ALL}\n")
             else:
-                print(f"Index '{self.index_name}' does not exist. Attempting to create...\n")
+                print(f"{Fore.YELLOW}Index '{self.index_name}' does not exist. Attempting to create...{Style.RESET_ALL}\n")
                 self.create_index(embedding_dimension, space_type, ef_construction)
             return True
         except Exception as ex:
-            print(f"Error verifying or creating index: {ex}")
+            print(f"{Fore.RED}Error verifying or creating index: {ex}{Style.RESET_ALL}")
             print(f"OpenSearch client config: {self.opensearch_client.transport.hosts}\n")
             return False
 
     def get_truncated_name(self, base_name, max_length=32):
-        # Truncate a name to fit within a specified length
+        """
+        Truncate a name to fit within a specified length.
+
+        :param base_name: Original name
+        :param max_length: Maximum allowed length
+        :return: Truncated name
+        """
         if len(base_name) <= max_length:
             return base_name
         return base_name[:max_length-3] + "..."
 
     def setup_command(self):
-        # Main setup command
+        """
+        Main setup command that orchestrates the entire setup process.
+        """
         self.setup_configuration()
-        
+
         if self.service_type != 'open-source' and not self.initialize_clients():
-            print(f"{Fore.RED}Failed to initialize AWS clients. Setup incomplete.{Style.RESET_ALL}\n")
+            print(f"\n{Fore.RED}Failed to initialize AWS clients. Setup incomplete.{Style.RESET_ALL}\n")
             return
-        
+
         if self.service_type == 'serverless':
-            self.create_security_policies()
-            collection_id = self.get_collection_id(self.collection_name)
-            if not collection_id:
-                print(f"{Fore.YELLOW}Collection '{self.collection_name}' not found. Attempting to create it...{Style.RESET_ALL}")
-                collection_id = self.create_collection(self.collection_name)
-            
-            if collection_id:
-                if self.wait_for_collection_active(collection_id):
-                    self.opensearch_endpoint = self.get_collection_endpoint()
-                    if not self.opensearch_endpoint:
-                        print(f"{Fore.RED}Failed to retrieve OpenSearch endpoint. Setup incomplete.{Style.RESET_ALL}\n")
-                        return
-                    else:
-                        self.config['opensearch_endpoint'] = self.opensearch_endpoint
-                        self.save_config(self.config)
-                        self.opensearch_domain_name = self.get_opensearch_domain_name()
-                else:
-                    print(f"{Fore.RED}Collection is not active. Setup incomplete.{Style.RESET_ALL}\n")
-                    return
+
+            pass
         elif self.service_type == 'managed':
             if not self.opensearch_endpoint:
-                print(f"{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n")
+                print(f"\n{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n")
                 return
             else:
                 self.opensearch_domain_name = self.get_opensearch_domain_name()
         elif self.service_type == 'open-source':
             # Open-source setup
             if not self.opensearch_endpoint:
-                print(f"{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n")
+                print(f"\n{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n")
                 return
             else:
                 self.opensearch_domain_name = None  # Not required for open-source
 
         # Initialize OpenSearch client
         if self.initialize_opensearch_client():
-            print(f"{Fore.GREEN}OpenSearch client initialized successfully.{Style.RESET_ALL}\n")
-            
+
             # Prompt user to choose between creating a new index or using an existing one
             print("Do you want to create a new KNN index or use an existing one?")
             print("1. Create a new KNN index")
             print("2. Use an existing KNN index")
             index_choice = input("Enter your choice (1-2): ").strip()
-            
+
             if index_choice == '1':
                 # Proceed to create a new index
-                self.index_name = input("Enter a name for your new KNN index in OpenSearch: ").strip()
-        
+                self.index_name = input("\nEnter a name for your new KNN index in OpenSearch: ").strip()
+
                 # Save the index name in the configuration
                 self.config['index_name'] = self.index_name
                 self.save_config(self.config)
-        
-                print("Proceeding with index creation...\n")
+
+                print("\nProceeding with index creation...\n")
                 embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
-                
+
                 if self.verify_and_create_index(embedding_dimension, space_type, ef_construction):
-                    print(f"{Fore.GREEN}KNN index '{self.index_name}' created successfully.{Style.RESET_ALL}\n")
+                    print(f"\n{Fore.GREEN}KNN index '{self.index_name}' created successfully.{Style.RESET_ALL}\n")
                     # Save index details to config
                     self.config['embedding_dimension'] = str(embedding_dimension)
                     self.config['space_type'] = space_type
                     self.config['ef_construction'] = str(ef_construction)
                     self.save_config(self.config)
                 else:
-                    print(f"{Fore.RED}Index creation failed. Please check your permissions and try again.{Style.RESET_ALL}\n")
+                    print(f"\n{Fore.RED}Index creation failed. Please check your permissions and try again.{Style.RESET_ALL}\n")
                     return
             elif index_choice == '2':
                 # Use existing index
-                existing_index_name = input("Enter the name of your existing KNN index: ").strip()
+                existing_index_name = input("\nEnter the name of your existing KNN index: ").strip()
                 if not existing_index_name:
-                    print(f"{Fore.RED}Index name cannot be empty. Aborting.{Style.RESET_ALL}\n")
+                    print(f"\n{Fore.RED}Index name cannot be empty. Aborting.{Style.RESET_ALL}\n")
                     return
                 self.index_name = existing_index_name
                 self.config['index_name'] = self.index_name
@@ -687,9 +671,9 @@ def setup_command(self):
                         embedding_dimension = int(self.config['embedding_dimension'])
                         space_type = self.config['space_type']
                         ef_construction = int(self.config['ef_construction'])
-                        print(f"Using existing index '{self.index_name}' with embedding dimension {embedding_dimension}, space type '{space_type}', and ef_construction {ef_construction}.\n")
+                        print(f"\nUsing existing index '{self.index_name}' with embedding dimension {embedding_dimension}, space type '{space_type}', and ef_construction {ef_construction}.\n")
                     except ValueError:
-                        print("Invalid index details in configuration. Prompting for details again.\n")
+                        print("\nInvalid index details in configuration. Prompting for details again.\n")
                         embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
                         # Save index details to config
                         self.config['embedding_dimension'] = str(embedding_dimension)
@@ -697,7 +681,7 @@ def setup_command(self):
                         self.config['ef_construction'] = str(ef_construction)
                         self.save_config(self.config)
                 else:
-                    print("Index details not found in configuration. Prompting for details.\n")
+                    print("\nIndex details not found in configuration. Prompting for details.\n")
                     embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
                     # Save index details to config
                     self.config['embedding_dimension'] = str(embedding_dimension)
@@ -706,10 +690,10 @@ def setup_command(self):
                     self.save_config(self.config)
                 # Verify that the index exists
                 if not self.opensearch_client.indices.exists(index=self.index_name):
-                    print(f"{Fore.RED}Index '{self.index_name}' does not exist in OpenSearch. Aborting.{Style.RESET_ALL}\n")
+                    print(f"\n{Fore.RED}Index '{self.index_name}' does not exist in OpenSearch. Aborting.{Style.RESET_ALL}\n")
                     return
             else:
-                print(f"{Fore.RED}Invalid choice. Please run setup again and select a valid option.{Style.RESET_ALL}\n")
+                print(f"\n{Fore.RED}Invalid choice. Please run setup again and select a valid option.{Style.RESET_ALL}\n")
                 return
 
             # Proceed with model registration
@@ -719,7 +703,7 @@ def setup_command(self):
                 self.opensearch_client,
                 self.opensearch_domain_name
             )
-            
+
             # Model Registration
             if self.service_type != 'open-source':
                 # AWS-managed OpenSearch: Proceed with model registration
@@ -728,4 +712,4 @@ def setup_command(self):
                 # Open-source OpenSearch: Provide instructions or automate model registration
                 self.model_register.prompt_opensource_model_registration()
         else:
-            print(f"{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}\n")
\ No newline at end of file
+            print(f"\n{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}\n")
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py
new file mode 100644
index 00000000..7aa30969
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py
@@ -0,0 +1,240 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+import boto3
+import botocore
+import json
+import time
+from urllib.parse import urlparse
+from colorama import Fore, Style
+
+class Serverless:
+    def __init__(self, aoss_client, collection_name, iam_principal, aws_region):
+        """
+        Initialize the Serverless class with necessary AWS clients and configuration.
+
+        :param aoss_client: Boto3 client for OpenSearch Serverless
+        :param collection_name: Name of the OpenSearch collection
+        :param iam_principal: IAM Principal ARN
+        :param aws_region: AWS Region
+        """
+        self.aoss_client = aoss_client
+        self.collection_name = collection_name
+        self.iam_principal = iam_principal
+        self.aws_region = aws_region
+
+    def create_security_policies(self):
+        """
+        Create security policies for serverless OpenSearch.
+        """
+        encryption_policy = json.dumps({
+            "Rules": [{"Resource": [f"collection/{self.collection_name}"], "ResourceType": "collection"}],
+            "AWSOwnedKey": True
+        })
+        
+        network_policy = json.dumps([{
+            "Rules": [{"Resource": [f"collection/{self.collection_name}"], "ResourceType": "collection"}],
+            "AllowFromPublic": True
+        }])
+        
+        data_access_policy = json.dumps([{
+            "Rules": [
+                {"Resource": ["collection/*"], "Permission": ["aoss:*"], "ResourceType": "collection"},
+                {"Resource": ["index/*/*"], "Permission": ["aoss:*"], "ResourceType": "index"}
+            ],
+            "Principal": [self.iam_principal],
+            "Description": f"Data access policy for {self.collection_name}"
+        }])
+        
+        encryption_policy_name = self.get_truncated_name(f"{self.collection_name}-enc-policy")
+        self.create_security_policy("encryption", encryption_policy_name, f"{self.collection_name} encryption security policy", encryption_policy)
+        self.create_security_policy("network", f"{self.collection_name}-net-policy", f"{self.collection_name} network security policy", network_policy)
+        self.create_access_policy(self.get_truncated_name(f"{self.collection_name}-access-policy"), f"{self.collection_name} data access policy", data_access_policy)
+
+    def create_security_policy(self, policy_type, name, description, policy_body):
+        """
+        Create a specific security policy (encryption or network).
+
+        :param policy_type: Type of policy ('encryption' or 'network')
+        :param name: Name of the policy
+        :param description: Description of the policy
+        :param policy_body: JSON string of the policy
+        """
+        try:
+            if policy_type.lower() == "encryption":
+                self.aoss_client.create_security_policy(
+                    description=description,
+                    name=name,
+                    policy=policy_body,
+                    type="encryption"
+                )
+            elif policy_type.lower() == "network":
+                self.aoss_client.create_security_policy(
+                    description=description,
+                    name=name,
+                    policy=policy_body,
+                    type="network"
+                )
+            else:
+                raise ValueError("Invalid policy type specified.")
+            print(f"{Fore.GREEN}{policy_type.capitalize()} Policy '{name}' created successfully.{Style.RESET_ALL}")
+        except self.aoss_client.exceptions.ConflictException:
+            print(f"{Fore.YELLOW}{policy_type.capitalize()} Policy '{name}' already exists.{Style.RESET_ALL}")
+        except Exception as ex:
+            print(f"{Fore.RED}Error creating {policy_type} policy '{name}': {ex}{Style.RESET_ALL}")
+
+    def create_access_policy(self, name, description, policy_body):
+        """
+        Create a data access policy.
+
+        :param name: Name of the access policy
+        :param description: Description of the access policy
+        :param policy_body: JSON string of the access policy
+        """
+        try:
+            self.aoss_client.create_access_policy(
+                description=description,
+                name=name,
+                policy=policy_body,
+                type="data"
+            )
+            print(f"{Fore.GREEN}Data Access Policy '{name}' created successfully.{Style.RESET_ALL}\n")
+        except self.aoss_client.exceptions.ConflictException:
+            print(f"{Fore.YELLOW}Data Access Policy '{name}' already exists.{Style.RESET_ALL}\n")
+        except Exception as ex:
+            print(f"{Fore.RED}Error creating data access policy '{name}': {ex}{Style.RESET_ALL}\n")
+
+    def create_collection(self, collection_name, max_retries=3):
+        """
+        Create an OpenSearch serverless collection.
+
+        :param collection_name: Name of the collection to create
+        :param max_retries: Maximum number of retries for creation
+        :return: Collection ID if successful, None otherwise
+        """
+        for attempt in range(max_retries):
+            try:
+                response = self.aoss_client.create_collection(
+                    description=f"{collection_name} collection",
+                    name=collection_name,
+                    type="VECTORSEARCH"
+                )
+                print(f"{Fore.GREEN}Collection '{collection_name}' creation initiated.{Style.RESET_ALL}")
+                return response['createCollectionDetail']['id']
+            except self.aoss_client.exceptions.ConflictException:
+                print(f"{Fore.YELLOW}Collection '{collection_name}' already exists.{Style.RESET_ALL}")
+                return self.get_collection_id(collection_name)
+            except Exception as ex:
+                print(f"{Fore.RED}Error creating collection '{collection_name}' (Attempt {attempt+1}/{max_retries}): {ex}{Style.RESET_ALL}")
+                if attempt == max_retries - 1:
+                    return None
+                time.sleep(5)
+        return None
+
+    def get_collection_id(self, collection_name):
+        """
+        Retrieve the ID of an existing collection.
+
+        :param collection_name: Name of the collection
+        :return: Collection ID if found, None otherwise
+        """
+        try:
+            response = self.aoss_client.list_collections()
+            for collection in response.get('collectionSummaries', []):
+                if collection.get('name') == collection_name:
+                    return collection.get('id')
+        except Exception as ex:
+            print(f"{Fore.RED}Error getting collection ID: {ex}{Style.RESET_ALL}")
+        return None
+
+    def wait_for_collection_active(self, collection_id, max_wait_minutes=30):
+        """
+        Wait for the collection to become active.
+
+        :param collection_id: ID of the collection
+        :param max_wait_minutes: Maximum wait time in minutes
+        :return: True if active, False otherwise
+        """
+        print(f"Waiting for collection '{self.collection_name}' to become active...")
+        start_time = time.time()
+        while time.time() - start_time < max_wait_minutes * 60:
+            try:
+                response = self.aoss_client.batch_get_collection(ids=[collection_id])
+                status = response['collectionDetails'][0]['status']
+                if status == 'ACTIVE':
+                    print(f"{Fore.GREEN}Collection '{self.collection_name}' is now active.{Style.RESET_ALL}\n")
+                    return True
+                elif status in ['FAILED', 'DELETED']:
+                    print(f"{Fore.RED}Collection creation failed or was deleted. Status: {status}{Style.RESET_ALL}\n")
+                    return False
+                else:
+                    print(f"Collection status: {status}. Waiting...")
+                    time.sleep(30)
+            except Exception as ex:
+                print(f"{Fore.RED}Error checking collection status: {ex}{Style.RESET_ALL}")
+                time.sleep(30)
+        print(f"{Fore.RED}Timed out waiting for collection to become active after {max_wait_minutes} minutes.{Style.RESET_ALL}\n")
+        return False
+
+    def get_collection_endpoint(self):
+        """
+        Retrieve the endpoint URL for the OpenSearch collection.
+
+        :return: Collection endpoint URL if available, None otherwise
+        """
+        try:
+            collection_id = self.get_collection_id(self.collection_name)
+            if not collection_id:
+                print(f"{Fore.RED}Collection '{self.collection_name}' not found.{Style.RESET_ALL}\n")
+                return None
+            
+            batch_get_response = self.aoss_client.batch_get_collection(ids=[collection_id])
+            collection_details = batch_get_response.get('collectionDetails', [])
+            
+            if not collection_details:
+                print(f"{Fore.RED}No details found for collection ID '{collection_id}'.{Style.RESET_ALL}\n")
+                return None
+            
+            endpoint = collection_details[0].get('collectionEndpoint')
+            if endpoint:
+                print(f"Collection '{self.collection_name}' has endpoint URL: {endpoint}\n")
+                return endpoint
+            else:
+                print(f"{Fore.RED}No endpoint URL found in collection '{self.collection_name}'.{Style.RESET_ALL}\n")
+                return None
+        except Exception as ex:
+            print(f"{Fore.RED}Error retrieving collection endpoint: {ex}{Style.RESET_ALL}\n")
+            return None
+
+    @staticmethod
+    def get_truncated_name(base_name, max_length=32):
+        """
+        Truncate a name to fit within a specified length.
+
+        :param base_name: Original name
+        :param max_length: Maximum allowed length
+        :return: Truncated name
+        """
+        if len(base_name) <= max_length:
+            return base_name
+        return base_name[:max_length-3] + "..."
\ No newline at end of file
diff --git a/setup.py b/setup.py
index 09a00558..467e95f6 100644
--- a/setup.py
+++ b/setup.py
@@ -103,7 +103,6 @@
         "PyPDF2>=3.0.1",
         "rich>=13.5.2",
         "tiktoken>=0.5.0",
-        "termios>=1.0",
     ],
     python_requires=">=3.8",
     package_data={"opensearch_py_ml": ["py.typed"]},
diff --git a/tests/rag/test_AiConnectorClass.py b/tests/rag/test_AiConnectorClass.py
new file mode 100644
index 00000000..da8007d7
--- /dev/null
+++ b/tests/rag/test_AiConnectorClass.py
@@ -0,0 +1,518 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+import unittest
+from unittest.mock import patch, MagicMock
+import json
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import AIConnectorHelper
+
+class TestAIConnectorHelper(unittest.TestCase):
+    def setUp(self):
+        self.region = 'us-east-1'
+        self.opensearch_domain_name = 'test-domain'
+        self.opensearch_domain_username = 'admin'
+        self.opensearch_domain_password = 'password'
+        self.aws_user_name = 'test-user'
+        self.aws_role_name = 'test-role'
+
+        self.domain_endpoint = 'search-test-domain.us-east-1.es.amazonaws.com'
+        self.domain_arn = 'arn:aws:es:us-east-1:123456789012:domain/test-domain'
+
+    @patch('AIConnectorHelper.IAMRoleHelper')
+    @patch('AIConnectorHelper.SecretHelper')
+    @patch('AIConnectorHelper.OpenSearch')
+    @patch('AIConnectorHelper.AIConnectorHelper.get_opensearch_domain_info')
+    def test___init__(self, mock_get_opensearch_domain_info, mock_opensearch, mock_secret_helper, mock_iam_role_helper):
+        # Mock get_opensearch_domain_info
+        mock_get_opensearch_domain_info.return_value = (self.domain_endpoint, self.domain_arn)
+
+        # Instantiate AIConnectorHelper
+        helper = AIConnectorHelper(
+            self.region,
+            self.opensearch_domain_name,
+            self.opensearch_domain_username,
+            self.opensearch_domain_password,
+            self.aws_user_name,
+            self.aws_role_name
+        )
+
+        # Assert domain URL
+        expected_domain_url = f'https://{self.domain_endpoint}'
+        self.assertEqual(helper.opensearch_domain_url, expected_domain_url)
+
+        # Assert opensearch_client is initialized
+        mock_opensearch.assert_called_once_with(
+            hosts=[{'host': self.domain_endpoint, 'port': 443}],
+            http_auth=(self.opensearch_domain_username, self.opensearch_domain_password),
+            use_ssl=True,
+            verify_certs=True,
+            connection_class=unittest.mock.ANY
+        )
+
+        # Assert IAMRoleHelper and SecretHelper are initialized
+        mock_iam_role_helper.assert_called_once_with(
+            region=self.region,
+            opensearch_domain_url=expected_domain_url,
+            opensearch_domain_username=self.opensearch_domain_username,
+            opensearch_domain_password=self.opensearch_domain_password,
+            aws_user_name=self.aws_user_name,
+            aws_role_name=self.aws_role_name,
+            opensearch_domain_arn=self.domain_arn
+        )
+        mock_secret_helper.assert_called_once_with(self.region)
+
+    @patch('boto3.client')
+    def test_get_opensearch_domain_info_success(self, mock_boto3_client):
+        # Mock the boto3 client
+        mock_client_instance = MagicMock()
+        mock_boto3_client.return_value = mock_client_instance
+
+        # Mock the describe_domain response
+        mock_client_instance.describe_domain.return_value = {
+            'DomainStatus': {
+                'Endpoint': self.domain_endpoint,
+                'ARN': self.domain_arn
+            }
+        }
+
+        # Call the method
+        endpoint, arn = AIConnectorHelper.get_opensearch_domain_info(self.region, self.opensearch_domain_name)
+
+        # Assert the results
+        self.assertEqual(endpoint, self.domain_endpoint)
+        self.assertEqual(arn, self.domain_arn)
+        mock_client_instance.describe_domain.assert_called_once_with(DomainName=self.opensearch_domain_name)
+
+    @patch('boto3.client')
+    def test_get_opensearch_domain_info_exception(self, mock_boto3_client):
+        # Mock the boto3 client to raise an exception
+        mock_client_instance = MagicMock()
+        mock_boto3_client.return_value = mock_client_instance
+        mock_client_instance.describe_domain.side_effect = Exception('Test Exception')
+
+        # Call the method
+        endpoint, arn = AIConnectorHelper.get_opensearch_domain_info(self.region, self.opensearch_domain_name)
+
+        # Assert the results are None
+        self.assertIsNone(endpoint)
+        self.assertIsNone(arn)
+
+    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
+    def test_get_ml_auth_success(self, mock_iam_helper):
+        # Mock the get_role_arn to return a role ARN
+        create_connector_role_name = 'test-create-connector-role'
+        create_connector_role_arn = 'arn:aws:iam::123456789012:role/test-create-connector-role'
+        mock_iam_helper.get_role_arn.return_value = create_connector_role_arn
+
+        # Mock the assume_role to return temp credentials
+        temp_credentials = {
+            "AccessKeyId": "test-access-key",
+            "SecretAccessKey": "test-secret-key",
+            "SessionToken": "test-session-token"
+        }
+        mock_iam_helper.assume_role.return_value = temp_credentials
+
+        # Instantiate helper
+        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+            helper = AIConnectorHelper()
+            helper.region = self.region
+            helper.iam_helper = mock_iam_helper
+            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
+            helper.opensearch_domain_arn = self.domain_arn
+
+            # Call the method
+            awsauth = helper.get_ml_auth(create_connector_role_name)
+
+            # Assert that the IAM helper methods were called
+            mock_iam_helper.get_role_arn.assert_called_with(create_connector_role_name)
+            mock_iam_helper.assume_role.assert_called_with(create_connector_role_arn)
+
+            # Assert that AWS4Auth was created with the temp credentials
+            self.assertEqual(awsauth.access_id, temp_credentials["AccessKeyId"])
+            self.assertEqual(awsauth.region, self.region)
+            self.assertEqual(awsauth.service, 'es')
+
+    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
+    def test_get_ml_auth_role_not_found(self, mock_iam_helper):
+        # Mock the get_role_arn to return None
+        create_connector_role_name = 'test-create-connector-role'
+        mock_iam_helper.get_role_arn.return_value = None
+
+        # Instantiate helper
+        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+            helper = AIConnectorHelper()
+            helper.iam_helper = mock_iam_helper
+
+            # Call the method and expect an exception
+            with self.assertRaises(Exception) as context:
+                helper.get_ml_auth(create_connector_role_name)
+
+            self.assertTrue(f"IAM role '{create_connector_role_name}' not found." in str(context.exception))
+
+    @patch('requests.post')
+    @patch('AIConnectorHelper.AWS4Auth')
+    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
+    def test_create_connector(self, mock_iam_helper, mock_aws4auth, mock_requests_post):
+        # Mock the IAM helper methods
+        create_connector_role_name = 'test-create-connector-role'
+        create_connector_role_arn = 'arn:aws:iam::123456789012:role/test-create-connector-role'
+        mock_iam_helper.get_role_arn.return_value = create_connector_role_arn
+        temp_credentials = {
+            "AccessKeyId": "test-access-key",
+            "SecretAccessKey": "test-secret-key",
+            "SessionToken": "test-session-token"
+        }
+        mock_iam_helper.assume_role.return_value = temp_credentials
+
+        # Mock AWS4Auth
+        mock_awsauth = MagicMock()
+        mock_aws4auth.return_value = mock_awsauth
+
+        # Mock requests.post
+        response = MagicMock()
+        response.text = json.dumps({'connector_id': 'test-connector-id'})
+        mock_requests_post.return_value = response
+
+        # Instantiate helper
+        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+            helper = AIConnectorHelper()
+            helper.region = self.region
+            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
+            helper.iam_helper = mock_iam_helper
+
+            # Call the method
+            payload = {'key': 'value'}
+            connector_id = helper.create_connector(create_connector_role_name, payload)
+
+            # Assert that the correct URL was used
+            expected_url = f'{helper.opensearch_domain_url}/_plugins/_ml/connectors/_create'
+            mock_requests_post.assert_called_once_with(
+                expected_url,
+                auth=mock_awsauth,
+                json=payload,
+                headers={"Content-Type": "application/json"}
+            )
+
+            # Assert that the connector_id is returned
+            self.assertEqual(connector_id, 'test-connector-id')
+
+    @patch.object(AIConnectorHelper, 'model_access_control', create=True)
+    def test_search_model_group(self, mock_model_access_control):
+        # Mock the response from model_access_control.search_model_group_by_name
+        model_group_name = 'test-model-group'
+        mock_response = {'hits': {'hits': []}}
+        mock_model_access_control.search_model_group_by_name.return_value = mock_response
+
+        # Instantiate helper
+        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+            helper = AIConnectorHelper()
+            helper.model_access_control = mock_model_access_control
+
+            # Call the method
+            response = helper.search_model_group(model_group_name, 'test-create-connector-role')
+
+            # Assert that the method was called with correct parameters
+            mock_model_access_control.search_model_group_by_name.assert_called_once_with(model_group_name, size=1)
+
+            # Assert that the response is as expected
+            self.assertEqual(response, mock_response)
+
+    @patch.object(AIConnectorHelper, 'model_access_control', create=True)
+    def test_create_model_group_exists(self, mock_model_access_control):
+        # Mock the get_model_group_id_by_name to return an ID
+        model_group_name = 'test-model-group'
+        model_group_id = 'test-model-group-id'
+        mock_model_access_control.get_model_group_id_by_name.return_value = model_group_id
+
+        # Instantiate helper
+        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+            helper = AIConnectorHelper()
+            helper.model_access_control = mock_model_access_control
+
+            # Call the method
+            result = helper.create_model_group(model_group_name, 'test description', 'test-create-connector-role')
+
+            # Assert that the ID is returned
+            self.assertEqual(result, model_group_id)
+
+    @patch.object(AIConnectorHelper, 'model_access_control', create=True)
+    def test_create_model_group_new(self, mock_model_access_control):
+        # Mock the get_model_group_id_by_name to return None initially, then an ID
+        model_group_name = 'test-model-group'
+        model_group_id = 'test-model-group-id'
+
+        # First call returns None, second call returns the ID
+        mock_model_access_control.get_model_group_id_by_name.side_effect = [None, model_group_id]
+
+        # Instantiate helper
+        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+            helper = AIConnectorHelper()
+            helper.model_access_control = mock_model_access_control
+
+            # Call the method
+            result = helper.create_model_group(model_group_name, 'test description', 'test-create-connector-role')
+
+            # Assert that register_model_group was called
+            mock_model_access_control.register_model_group.assert_called_once_with(name=model_group_name, description='test description')
+
+            # Assert that the ID is returned
+            self.assertEqual(result, model_group_id)
+
+    @patch.object(AIConnectorHelper, 'get_task')
+    @patch('time.sleep', return_value=None)
+    @patch('requests.post')
+    @patch.object(AIConnectorHelper, 'get_ml_auth')
+    @patch.object(AIConnectorHelper, 'create_model_group')
+    def test_create_model(self, mock_create_model_group, mock_get_ml_auth, mock_requests_post, mock_sleep, mock_get_task):
+        # Mock create_model_group
+        model_group_id = 'test-model-group-id'
+        mock_create_model_group.return_value = model_group_id
+
+        # Mock get_ml_auth
+        mock_awsauth = MagicMock()
+        mock_get_ml_auth.return_value = mock_awsauth
+
+        # Mock requests.post
+        response = MagicMock()
+        response.text = json.dumps({'model_id': 'test-model-id'})
+        mock_requests_post.return_value = response
+
+        # Instantiate helper
+        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+            helper = AIConnectorHelper()
+            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
+
+            # Call the method
+            model_id = helper.create_model('test-model', 'test description', 'test-connector-id', 'test-create-connector-role', deploy=True)
+
+            # Assert that create_model_group was called
+            mock_create_model_group.assert_called_once_with('test-model', 'test description', 'test-create-connector-role')
+
+            # Assert that the correct URL was used
+            expected_url = f'{helper.opensearch_domain_url}/_plugins/_ml/models/_register?deploy=true'
+            payload = {
+                "name": 'test-model',
+                "function_name": "remote",
+                "description": 'test description',
+                "model_group_id": model_group_id,
+                "connector_id": 'test-connector-id'
+            }
+            mock_requests_post.assert_called_once_with(
+                expected_url,
+                auth=mock_awsauth,
+                json=payload,
+                headers={"Content-Type": "application/json"}
+            )
+
+            # Assert that model_id is returned
+            self.assertEqual(model_id, 'test-model-id')
+
+    @patch('requests.post')
+    def test_deploy_model(self, mock_requests_post):
+        # Mock requests.post
+        response = MagicMock()
+        response.text = 'Deploy model response'
+        mock_requests_post.return_value = response
+
+        # Instantiate helper
+        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+            helper = AIConnectorHelper()
+            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
+            helper.opensearch_domain_username = self.opensearch_domain_username
+            helper.opensearch_domain_password = self.opensearch_domain_password
+
+            # Call the method
+            result = helper.deploy_model('test-model-id')
+
+            # Assert that the correct URL was used
+            expected_url = f'{helper.opensearch_domain_url}/_plugins/_ml/models/test-model-id/_deploy'
+            mock_requests_post.assert_called_once_with(
+                expected_url,
+                auth=unittest.mock.ANY,
+                headers={"Content-Type": "application/json"}
+            )
+
+            # Assert that the response is returned
+            self.assertEqual(result, response)
+
+    @patch('requests.post')
+    def test_predict(self, mock_requests_post):
+        # Mock requests.post
+        response = MagicMock()
+        response.text = 'Predict response'
+        mock_requests_post.return_value = response
+
+        # Instantiate helper
+        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+            helper = AIConnectorHelper()
+            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
+            helper.opensearch_domain_username = self.opensearch_domain_username
+            helper.opensearch_domain_password = self.opensearch_domain_password
+
+            # Call the method
+            payload = {'input': 'test input'}
+            result = helper.predict('test-model-id', payload)
+
+            # Assert that the correct URL was used
+            expected_url = f'{helper.opensearch_domain_url}/_plugins/_ml/models/test-model-id/_predict'
+            mock_requests_post.assert_called_once_with(
+                expected_url,
+                auth=unittest.mock.ANY,
+                json=payload,
+                headers={"Content-Type": "application/json"}
+            )
+
+            # Assert that the response is returned
+            self.assertEqual(result, response)
+
+    @patch('time.sleep', return_value=None)
+    @patch.object(AIConnectorHelper, 'create_connector')
+    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
+    @patch.object(AIConnectorHelper, 'secret_helper', create=True)
+    def test_create_connector_with_secret(self, mock_secret_helper, mock_iam_helper, mock_create_connector, mock_sleep):
+        # Mock secret_helper methods
+        secret_name = 'test-secret'
+        secret_value = 'test-secret-value'
+        secret_arn = 'arn:aws:secretsmanager:us-east-1:123456789012:secret:test-secret'
+        mock_secret_helper.secret_exists.return_value = False
+        mock_secret_helper.create_secret.return_value = secret_arn
+        mock_secret_helper.get_secret_arn.return_value = secret_arn
+
+        # Mock iam_helper methods
+        connector_role_name = 'test-connector-role'
+        create_connector_role_name = 'test-create-connector-role'
+        connector_role_arn = 'arn:aws:iam::123456789012:role/test-connector-role'
+        create_connector_role_arn = 'arn:aws:iam::123456789012:role/test-create-connector-role'
+        mock_iam_helper.role_exists.side_effect = [False, False]
+        mock_iam_helper.create_iam_role.side_effect = [connector_role_arn, create_connector_role_arn]
+        mock_iam_helper.get_user_arn.return_value = 'arn:aws:iam::123456789012:user/test-user'
+        mock_iam_helper.get_role_arn.side_effect = [connector_role_arn, create_connector_role_arn]
+        mock_iam_helper.map_iam_role_to_backend_role.return_value = None
+
+        # Mock create_connector
+        connector_id = 'test-connector-id'
+        mock_create_connector.return_value = connector_id
+
+        # Instantiate helper
+        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+            helper = AIConnectorHelper()
+            helper.region = self.region
+            helper.aws_user_name = self.aws_user_name
+            helper.aws_role_name = self.aws_role_name
+            helper.opensearch_domain_arn = self.domain_arn
+            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
+            helper.iam_helper = mock_iam_helper
+            helper.secret_helper = mock_secret_helper
+
+            # Prepare input
+            create_connector_input = {'key': 'value'}
+
+            # Call the method
+            result = helper.create_connector_with_secret(
+                secret_name,
+                secret_value,
+                connector_role_name,
+                create_connector_role_name,
+                create_connector_input,
+                sleep_time_in_seconds=0  # For faster testing
+            )
+
+            # Assert that the methods were called
+            mock_secret_helper.secret_exists.assert_called_once_with(secret_name)
+            mock_secret_helper.create_secret.assert_called_once_with(secret_name, secret_value)
+
+            self.assertEqual(mock_iam_helper.role_exists.call_count, 2)
+            self.assertEqual(mock_iam_helper.create_iam_role.call_count, 2)
+            mock_iam_helper.map_iam_role_to_backend_role.assert_called_once_with(create_connector_role_arn)
+
+            # Assert that create_connector was called
+            payload = create_connector_input.copy()
+            payload['credential'] = {
+                "secretArn": secret_arn,
+                "roleArn": connector_role_arn
+            }
+            mock_create_connector.assert_called_once_with(create_connector_role_name, payload)
+
+            # Assert that the connector_id is returned
+            self.assertEqual(result, connector_id)
+
+    @patch('time.sleep', return_value=None)
+    @patch.object(AIConnectorHelper, 'create_connector')
+    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
+    def test_create_connector_with_role(self, mock_iam_helper, mock_create_connector, mock_sleep):
+        # Mock iam_helper methods
+        connector_role_name = 'test-connector-role'
+        create_connector_role_name = 'test-create-connector-role'
+        connector_role_arn = 'arn:aws:iam::123456789012:role/test-connector-role'
+        create_connector_role_arn = 'arn:aws:iam::123456789012:role/test-create-connector-role'
+        mock_iam_helper.role_exists.side_effect = [False, False]
+        mock_iam_helper.create_iam_role.side_effect = [connector_role_arn, create_connector_role_arn]
+        mock_iam_helper.get_user_arn.return_value = 'arn:aws:iam::123456789012:user/test-user'
+        mock_iam_helper.get_role_arn.side_effect = [connector_role_arn, create_connector_role_arn]
+        mock_iam_helper.map_iam_role_to_backend_role.return_value = None
+
+        # Mock create_connector
+        connector_id = 'test-connector-id'
+        mock_create_connector.return_value = connector_id
+
+        # Instantiate helper
+        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+            helper = AIConnectorHelper()
+            helper.region = self.region
+            helper.aws_user_name = self.aws_user_name
+            helper.aws_role_name = self.aws_role_name
+            helper.opensearch_domain_arn = self.domain_arn
+            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
+            helper.iam_helper = mock_iam_helper
+
+            # Prepare input
+            create_connector_input = {'key': 'value'}
+            connector_role_inline_policy = {'Statement': []}
+
+            # Call the method
+            result = helper.create_connector_with_role(
+                connector_role_inline_policy,
+                connector_role_name,
+                create_connector_role_name,
+                create_connector_input,
+                sleep_time_in_seconds=0  # For faster testing
+            )
+
+            # Assert that the methods were called
+            self.assertEqual(mock_iam_helper.role_exists.call_count, 2)
+            self.assertEqual(mock_iam_helper.create_iam_role.call_count, 2)
+            mock_iam_helper.map_iam_role_to_backend_role.assert_called_once_with(create_connector_role_arn)
+
+            # Assert that create_connector was called
+            payload = create_connector_input.copy()
+            payload['credential'] = {
+                "roleArn": connector_role_arn
+            }
+            mock_create_connector.assert_called_once_with(create_connector_role_name, payload)
+
+            # Assert that the connector_id is returned
+            self.assertEqual(result, connector_id)
+
+if __name__ == '__main__':
+    unittest.main()
\ No newline at end of file
diff --git a/tests/rag/test_IAMRoleHelper.py b/tests/rag/test_IAMRoleHelper.py
new file mode 100644
index 00000000..035a752d
--- /dev/null
+++ b/tests/rag/test_IAMRoleHelper.py
@@ -0,0 +1,320 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+import unittest
+from unittest.mock import patch, MagicMock
+from botocore.exceptions import ClientError
+import json
+import logging
+
+# Assuming IAMRoleHelper is defined in iam_role_helper.py
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper import IAMRoleHelper  # Replace with the actual module path if different
+
+class TestIAMRoleHelper(unittest.TestCase):
+
+    def setUp(self):
+        self.region = 'us-east-1'
+        self.iam_helper = IAMRoleHelper(region=self.region)
+
+        # Configure logging to suppress error logs during tests
+        logger = logging.getLogger('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper')
+        logger.setLevel(logging.CRITICAL)  # Suppress logs below CRITICAL during tests
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_role_exists_true(self, mock_boto_client):
+        mock_iam_client = MagicMock()
+        mock_boto_client.return_value = mock_iam_client
+
+        mock_iam_client.get_role.return_value = {'Role': {'RoleName': 'test-role'}}
+
+        result = self.iam_helper.role_exists('test-role')
+
+        self.assertTrue(result)
+        mock_iam_client.get_role.assert_called_with(RoleName='test-role')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_role_exists_false(self, mock_boto_client):
+        mock_iam_client = MagicMock()
+        mock_boto_client.return_value = mock_iam_client
+
+        error_response = {
+            'Error': {
+                'Code': 'NoSuchEntity',
+                'Message': 'Role does not exist'
+            }
+        }
+        mock_iam_client.get_role.side_effect = ClientError(error_response, 'GetRole')
+
+        result = self.iam_helper.role_exists('nonexistent-role')
+
+        self.assertFalse(result)
+        mock_iam_client.get_role.assert_called_with(RoleName='nonexistent-role')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_delete_role_success(self, mock_boto_client):
+        mock_iam_client = MagicMock()
+        mock_boto_client.return_value = mock_iam_client
+
+        # Mock responses for list_attached_role_policies and list_role_policies
+        mock_iam_client.list_attached_role_policies.return_value = {
+            'AttachedPolicies': [{'PolicyArn': 'arn:aws:iam::aws:policy/ExamplePolicy'}]
+        }
+        mock_iam_client.list_role_policies.return_value = {
+            'PolicyNames': ['InlinePolicy']
+        }
+
+        self.iam_helper.delete_role('test-role')
+
+        mock_iam_client.detach_role_policy.assert_called_with(RoleName='test-role', PolicyArn='arn:aws:iam::aws:policy/ExamplePolicy')
+        mock_iam_client.delete_role_policy.assert_called_with(RoleName='test-role', PolicyName='InlinePolicy')
+        mock_iam_client.delete_role.assert_called_with(RoleName='test-role')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_delete_role_not_exist(self, mock_boto_client):
+        mock_iam_client = MagicMock()
+        mock_boto_client.return_value = mock_iam_client
+
+        error_response = {
+            'Error': {
+                'Code': 'NoSuchEntity',
+                'Message': 'Role does not exist'
+            }
+        }
+        mock_iam_client.list_attached_role_policies.side_effect = ClientError(error_response, 'ListAttachedRolePolicies')
+
+        self.iam_helper.delete_role('nonexistent-role')
+
+        mock_iam_client.list_attached_role_policies.assert_called_with(RoleName='nonexistent-role')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_create_iam_role_success(self, mock_boto_client):
+        mock_iam_client = MagicMock()
+        mock_boto_client.return_value = mock_iam_client
+
+        trust_policy = {"Version": "2012-10-17", "Statement": []}
+        inline_policy = {"Version": "2012-10-17", "Statement": []}
+
+        mock_iam_client.create_role.return_value = {
+            'Role': {'Arn': 'arn:aws:iam::123456789012:role/test-role'}
+        }
+
+        role_arn = self.iam_helper.create_iam_role('test-role', trust_policy, inline_policy)
+
+        self.assertEqual(role_arn, 'arn:aws:iam::123456789012:role/test-role')
+        mock_iam_client.create_role.assert_called_with(
+            RoleName='test-role',
+            AssumeRolePolicyDocument=json.dumps(trust_policy),
+            Description='Role with custom trust and inline policies',
+        )
+        mock_iam_client.put_role_policy.assert_called_with(
+            RoleName='test-role',
+            PolicyName='InlinePolicy',
+            PolicyDocument=json.dumps(inline_policy)
+        )
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_create_iam_role_error(self, mock_boto_client):
+        mock_iam_client = MagicMock()
+        mock_boto_client.return_value = mock_iam_client
+
+        trust_policy = {"Version": "2012-10-17", "Statement": []}
+        inline_policy = {"Version": "2012-10-17", "Statement": []}
+
+        error_response = {
+            'Error': {
+                'Code': 'EntityAlreadyExists',
+                'Message': 'Role already exists'
+            }
+        }
+        mock_iam_client.create_role.side_effect = ClientError(error_response, 'CreateRole')
+
+        role_arn = self.iam_helper.create_iam_role('existing-role', trust_policy, inline_policy)
+
+        self.assertIsNone(role_arn)
+        mock_iam_client.create_role.assert_called_with(
+            RoleName='existing-role',
+            AssumeRolePolicyDocument=json.dumps(trust_policy),
+            Description='Role with custom trust and inline policies',
+        )
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_get_role_arn_success(self, mock_boto_client):
+        mock_iam_client = MagicMock()
+        mock_boto_client.return_value = mock_iam_client
+
+        mock_iam_client.get_role.return_value = {
+            'Role': {'Arn': 'arn:aws:iam::123456789012:role/test-role'}
+        }
+
+        role_arn = self.iam_helper.get_role_arn('test-role')
+
+        self.assertEqual(role_arn, 'arn:aws:iam::123456789012:role/test-role')
+        mock_iam_client.get_role.assert_called_with(RoleName='test-role')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_get_role_arn_not_found(self, mock_boto_client):
+        mock_iam_client = MagicMock()
+        mock_boto_client.return_value = mock_iam_client
+
+        error_response = {
+            'Error': {
+                'Code': 'NoSuchEntity',
+                'Message': 'Role does not exist'
+            }
+        }
+        mock_iam_client.get_role.side_effect = ClientError(error_response, 'GetRole')
+
+        role_arn = self.iam_helper.get_role_arn('nonexistent-role')
+
+        self.assertIsNone(role_arn)
+        mock_iam_client.get_role.assert_called_with(RoleName='nonexistent-role')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_get_user_arn_success(self, mock_boto_client):
+        mock_iam_client = MagicMock()
+        mock_boto_client.return_value = mock_iam_client
+
+        mock_iam_client.get_user.return_value = {
+            'User': {'Arn': 'arn:aws:iam::123456789012:user/test-user'}
+        }
+
+        user_arn = self.iam_helper.get_user_arn('test-user')
+
+        self.assertEqual(user_arn, 'arn:aws:iam::123456789012:user/test-user')
+        mock_iam_client.get_user.assert_called_with(UserName='test-user')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_get_user_arn_not_found(self, mock_boto_client):
+        mock_iam_client = MagicMock()
+        mock_boto_client.return_value = mock_iam_client
+
+        error_response = {
+            'Error': {
+                'Code': 'NoSuchEntity',
+                'Message': 'User does not exist'
+            }
+        }
+        mock_iam_client.get_user.side_effect = ClientError(error_response, 'GetUser')
+
+        user_arn = self.iam_helper.get_user_arn('nonexistent-user')
+
+        self.assertIsNone(user_arn)
+        mock_iam_client.get_user.assert_called_with(UserName='nonexistent-user')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_assume_role_success(self, mock_boto_client):
+        mock_sts_client = MagicMock()
+        mock_boto_client.return_value = mock_sts_client
+
+        mock_sts_client.assume_role.return_value = {
+            'Credentials': {
+                'AccessKeyId': 'ASIA...',
+                'SecretAccessKey': 'secret',
+                'SessionToken': 'token'
+            }
+        }
+
+        role_arn = 'arn:aws:iam::123456789012:role/test-role'
+        credentials = self.iam_helper.assume_role(role_arn, 'test-session')
+
+        self.assertIsNotNone(credentials)
+        self.assertEqual(credentials['AccessKeyId'], 'ASIA...')
+        mock_sts_client.assume_role.assert_called_with(
+            RoleArn=role_arn,
+            RoleSessionName='test-session',
+        )
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    def test_assume_role_failure(self, mock_boto_client):
+        mock_sts_client = MagicMock()
+        mock_boto_client.return_value = mock_sts_client
+
+        error_response = {
+            'Error': {
+                'Code': 'AccessDenied',
+                'Message': 'User is not authorized to perform: sts:AssumeRole'
+            }
+        }
+        mock_sts_client.assume_role.side_effect = ClientError(error_response, 'AssumeRole')
+
+        role_arn = 'arn:aws:iam::123456789012:role/unauthorized-role'
+        credentials = self.iam_helper.assume_role(role_arn, 'test-session')
+
+        self.assertIsNone(credentials)
+        mock_sts_client.assume_role.assert_called_with(
+            RoleArn=role_arn,
+            RoleSessionName='test-session',
+        )
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.requests.put')
+    def test_map_iam_role_to_backend_role_success(self, mock_put):
+        mock_response = MagicMock()
+        mock_response.status_code = 200
+        mock_put.return_value = mock_response
+
+        self.iam_helper.opensearch_domain_url = 'https://search-domain'
+        self.iam_helper.opensearch_domain_username = 'user'
+        self.iam_helper.opensearch_domain_password = 'pass'
+
+        iam_role_arn = 'arn:aws:iam::123456789012:role/test-role'
+
+        self.iam_helper.map_iam_role_to_backend_role(iam_role_arn)
+
+        mock_put.assert_called_once()
+        args, kwargs = mock_put.call_args
+        self.assertIn('/_plugins/_security/api/rolesmapping/ml_full_access', args[0])
+        self.assertEqual(kwargs['auth'], ('user', 'pass'))
+        self.assertEqual(kwargs['json'], {'backend_roles': [iam_role_arn]})
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.requests.put')
+    def test_map_iam_role_to_backend_role_failure(self, mock_put):
+        mock_response = MagicMock()
+        mock_response.status_code = 403
+        mock_response.text = 'Forbidden'
+        mock_put.return_value = mock_response
+
+        self.iam_helper.opensearch_domain_url = 'https://search-domain'
+        self.iam_helper.opensearch_domain_username = 'user'
+        self.iam_helper.opensearch_domain_password = 'pass'
+
+        iam_role_arn = 'arn:aws:iam::123456789012:role/test-role'
+
+        self.iam_helper.map_iam_role_to_backend_role(iam_role_arn)
+
+        mock_put.assert_called_once()
+        args, kwargs = mock_put.call_args
+        self.assertIn('/_plugins/_security/api/rolesmapping/ml_full_access', args[0])
+
+    def test_get_iam_user_name_from_arn_valid(self):
+        iam_principal_arn = 'arn:aws:iam::123456789012:user/test-user'
+        user_name = self.iam_helper.get_iam_user_name_from_arn(iam_principal_arn)
+        self.assertEqual(user_name, 'test-user')
+
+    def test_get_iam_user_name_from_arn_invalid(self):
+        iam_principal_arn = 'arn:aws:iam::123456789012:role/test-role'
+        user_name = self.iam_helper.get_iam_user_name_from_arn(iam_principal_arn)
+        self.assertIsNone(user_name)
+
+if __name__ == '__main__':
+    unittest.main()
\ No newline at end of file
diff --git a/tests/rag/test_Model_Register.py b/tests/rag/test_Model_Register.py
new file mode 100644
index 00000000..530149df
--- /dev/null
+++ b/tests/rag/test_Model_Register.py
@@ -0,0 +1,201 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+import unittest
+from unittest.mock import patch, MagicMock, Mock
+import sys
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register import ModelRegister
+
+
+class TestModelRegister(unittest.TestCase):
+    def setUp(self):
+        # Sample configuration dictionary
+        self.config = {
+            'region': 'us-east-1',
+            'opensearch_username': 'admin',
+            'opensearch_password': 'admin',
+            'iam_principal': 'arn:aws:iam::123456789012:user/test-user',
+            'service_type': 'managed',
+            'embedding_dimension': '768',
+            'opensearch_endpoint': 'https://search-domain'
+        }
+        # Mock OpenSearch client
+        self.mock_opensearch_client = MagicMock()
+        # OpenSearch domain name
+        self.opensearch_domain_name = 'test-domain'
+
+        # Correct the patch paths to match the actual module structure
+        self.patcher_iam_role_helper = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.IAMRoleHelper')
+        self.MockIAMRoleHelper = self.patcher_iam_role_helper.start()
+
+        self.patcher_ai_connector_helper = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.AIConnectorHelper')
+        self.MockAIConnectorHelper = self.patcher_ai_connector_helper.start()
+
+        # Patch model classes
+        self.patcher_bedrock_model = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.BedrockModel')
+        self.MockBedrockModel = self.patcher_bedrock_model.start()
+
+        self.patcher_openai_model = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.OpenAIModel')
+        self.MockOpenAIModel = self.patcher_openai_model.start()
+
+        self.patcher_cohere_model = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.CohereModel')
+        self.MockCohereModel = self.patcher_cohere_model.start()
+
+        self.patcher_huggingface_model = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.HuggingFaceModel')
+        self.MockHuggingFaceModel = self.patcher_huggingface_model.start()
+
+        self.patcher_custom_pytorch_model = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.CustomPyTorchModel')
+        self.MockCustomPyTorchModel = self.patcher_custom_pytorch_model.start()
+
+    def tearDown(self):
+        self.patcher_iam_role_helper.stop()
+        self.patcher_ai_connector_helper.stop()
+        self.patcher_bedrock_model.stop()
+        self.patcher_openai_model.stop()
+        self.patcher_cohere_model.stop()
+        self.patcher_huggingface_model.stop()
+        self.patcher_custom_pytorch_model.stop()
+
+    @patch('boto3.client')
+    def test_initialize_clients_success(self, mock_boto_client):
+        mock_boto_client.return_value = MagicMock()
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        result = model_register.initialize_clients()
+        self.assertTrue(result)
+        mock_boto_client.assert_called_with('bedrock-runtime', region_name='us-east-1')
+
+    @patch('boto3.client')
+    def test_initialize_clients_failure(self, mock_boto_client):
+        mock_boto_client.side_effect = Exception('Client creation failed')
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        result = model_register.initialize_clients()
+        self.assertFalse(result)
+        mock_boto_client.assert_called_with('bedrock-runtime', region_name='us-east-1')
+
+    @patch('builtins.input', side_effect=['1'])
+    def test_prompt_model_registration_register_new_model(self, mock_input):
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        with patch.object(model_register, 'register_model_interactive') as mock_register_model_interactive:
+            model_register.prompt_model_registration()
+            mock_register_model_interactive.assert_called_once()
+
+    @patch('builtins.input', side_effect=['2', 'model-id-123'])
+    def test_prompt_model_registration_use_existing_model(self, mock_input):
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        with patch.object(model_register, 'save_config') as mock_save_config:
+            model_register.prompt_model_registration()
+            self.assertEqual(model_register.config['embedding_model_id'], 'model-id-123')
+            mock_save_config.assert_called_once_with(model_register.config)
+
+    @patch('builtins.input', side_effect=['invalid'])
+    def test_prompt_model_registration_invalid_choice(self, mock_input):
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        with self.assertRaises(SystemExit):
+            model_register.prompt_model_registration()
+
+    @patch('builtins.input', side_effect=['1'])
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients', return_value=True)
+    def test_register_model_interactive_bedrock(self, mock_initialize_clients, mock_input):
+        self.MockIAMRoleHelper.return_value.get_iam_user_name_from_arn.return_value = 'test-user'
+
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        model_register.register_model_interactive()
+
+        self.MockBedrockModel.return_value.register_bedrock_model.assert_called_once()
+
+    @patch('builtins.input', side_effect=['2'])
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients', return_value=True)
+    def test_register_model_interactive_openai_managed(self, mock_initialize_clients, mock_input):
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        model_register.service_type = 'managed'
+
+        self.MockIAMRoleHelper.return_value.get_iam_user_name_from_arn.return_value = 'test-user'
+
+        model_register.register_model_interactive()
+
+        self.MockOpenAIModel.return_value.register_openai_model.assert_called_once()
+
+    @patch('builtins.input', side_effect=['2'])
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients', return_value=True)
+    def test_register_model_interactive_openai_opensource(self, mock_initialize_clients, mock_input):
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        model_register.service_type = 'open-source'
+
+        self.MockIAMRoleHelper.return_value.get_iam_user_name_from_arn.return_value = 'test-user'
+
+        model_register.register_model_interactive()
+
+        self.MockOpenAIModel.return_value.register_openai_model_opensource.assert_called_once()
+
+    @patch('builtins.input', side_effect=['invalid'])
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients', return_value=True)
+    def test_register_model_interactive_invalid_choice(self, mock_initialize_clients, mock_input):
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+
+        with patch('builtins.print') as mock_print:
+            model_register.register_model_interactive()
+            mock_print.assert_called_with('\x1b[31mInvalid choice. Exiting model registration.\x1b[0m')
+
+    @patch('builtins.input', side_effect=['1'])
+    def test_prompt_opensource_model_registration_register_now(self, mock_input):
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        with patch.object(model_register, 'register_model_opensource_interactive') as mock_register:
+            model_register.prompt_opensource_model_registration()
+            mock_register.assert_called_once()
+
+    @patch('builtins.input', side_effect=['2'])
+    def test_prompt_opensource_model_registration_register_later(self, mock_input):
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        with patch('builtins.print') as mock_print:
+            model_register.prompt_opensource_model_registration()
+            mock_print.assert_called_with('Skipping model registration. You can register models later using the appropriate commands.')
+
+    @patch('builtins.input', side_effect=['invalid'])
+    def test_prompt_opensource_model_registration_invalid_choice(self, mock_input):
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        with patch('builtins.print') as mock_print:
+            model_register.prompt_opensource_model_registration()
+            mock_print.assert_called_with('\x1b[31mInvalid choice. Skipping model registration.\x1b[0m')
+
+    @patch('builtins.input', side_effect=['3'])
+    def test_register_model_opensource_interactive_huggingface(self, mock_input):
+        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        model_register.service_type = 'open-source'
+
+        model_register.register_model_opensource_interactive()
+
+        self.MockHuggingFaceModel.return_value.register_huggingface_model.assert_called_once_with(
+            model_register.opensearch_client, model_register.config, model_register.save_config
+        )
+
+    @patch('builtins.input', side_effect=['1'])
+    def test_register_model_opensource_interactive_no_opensearch_client(self, mock_input):
+        model_register = ModelRegister(self.config, None, self.opensearch_domain_name)
+        with patch('builtins.print') as mock_print:
+            model_register.register_model_opensource_interactive()
+            mock_print.assert_called_with('\x1b[31mOpenSearch client is not initialized. Please run setup again.\x1b[0m')
+
+if __name__ == '__main__':
+    unittest.main()
\ No newline at end of file
diff --git a/tests/rag/test_SecretsHelper b/tests/rag/test_SecretsHelper
new file mode 100644
index 00000000..be00dc24
--- /dev/null
+++ b/tests/rag/test_SecretsHelper
@@ -0,0 +1,137 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+import unittest
+from unittest.mock import patch, MagicMock
+from botocore.exceptions import ClientError
+import json
+import logging
+# Adjust the import path as necessary
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper import SecretHelper
+
+class TestSecretHelper(unittest.TestCase):
+    @classmethod
+    def setUpClass(cls):
+        # Suppress logging below ERROR level during tests
+        logging.basicConfig(level=logging.ERROR)
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    def test_create_secret_error_logging(self, mock_boto_client):
+        mock_secretsmanager = MagicMock()
+        mock_boto_client.return_value = mock_secretsmanager
+
+        error_response = {
+            'Error': {
+                'Code': 'InternalServiceError',
+                'Message': 'An unspecified error occurred'
+            }
+        }
+        mock_secretsmanager.create_secret.side_effect = ClientError(error_response, 'CreateSecret')
+
+        secret_helper = SecretHelper(region='us-east-1')
+        with self.assertLogs('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper', level='ERROR') as cm:
+            result = secret_helper.create_secret('new-secret', {'key': 'value'})
+            self.assertIsNone(result)
+        self.assertIn('Error creating secret', cm.output[0])
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    def test_get_secret_arn_success(self, mock_boto_client):
+        mock_secretsmanager = MagicMock()
+        mock_boto_client.return_value = mock_secretsmanager
+
+        mock_secretsmanager.describe_secret.return_value = {
+            'ARN': 'arn:aws:secretsmanager:us-east-1:123456789012:secret:my-secret'
+        }
+
+        secret_helper = SecretHelper(region='us-east-1')
+        result = secret_helper.get_secret_arn('my-secret')
+        self.assertEqual(result, 'arn:aws:secretsmanager:us-east-1:123456789012:secret:my-secret')
+        mock_secretsmanager.describe_secret.assert_called_with(SecretId='my-secret')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    def test_get_secret_arn_not_found(self, mock_boto_client):
+        mock_secretsmanager = MagicMock()
+        mock_boto_client.return_value = mock_secretsmanager
+
+        error_response = {
+            'Error': {
+                'Code': 'ResourceNotFoundException',
+                'Message': 'Secret not found'
+            }
+        }
+        mock_secretsmanager.describe_secret.side_effect = ClientError(error_response, 'DescribeSecret')
+
+        secret_helper = SecretHelper(region='us-east-1')
+        result = secret_helper.get_secret_arn('nonexistent-secret')
+        self.assertIsNone(result)
+        mock_secretsmanager.describe_secret.assert_called_with(SecretId='nonexistent-secret')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    def test_get_secret_success(self, mock_boto_client):
+        mock_secretsmanager = MagicMock()
+        mock_boto_client.return_value = mock_secretsmanager
+
+        mock_secretsmanager.get_secret_value.return_value = {'SecretString': 'my-secret-value'}
+
+        secret_helper = SecretHelper(region='us-east-1')
+        result = secret_helper.get_secret('my-secret')
+        self.assertEqual(result, 'my-secret-value')
+        mock_secretsmanager.get_secret_value.assert_called_with(SecretId='my-secret')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    def test_get_secret_not_found(self, mock_boto_client):
+        mock_secretsmanager = MagicMock()
+        mock_boto_client.return_value = mock_secretsmanager
+
+        error_response = {
+            'Error': {
+                'Code': 'ResourceNotFoundException',
+                'Message': 'Secret not found'
+            }
+        }
+        mock_secretsmanager.get_secret_value.side_effect = ClientError(error_response, 'GetSecretValue')
+
+        secret_helper = SecretHelper(region='us-east-1')
+        result = secret_helper.get_secret('nonexistent-secret')
+        self.assertIsNone(result)
+        mock_secretsmanager.get_secret_value.assert_called_with(SecretId='nonexistent-secret')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    def test_create_secret_success(self, mock_boto_client):
+        mock_secretsmanager = MagicMock()
+        mock_boto_client.return_value = mock_secretsmanager
+
+        mock_secretsmanager.create_secret.return_value = {
+            'ARN': 'arn:aws:secretsmanager:us-east-1:123456789012:secret:new-secret'
+        }
+
+        secret_helper = SecretHelper(region='us-east-1')
+        result = secret_helper.create_secret('new-secret', {'key': 'value'})
+        self.assertEqual(result, 'arn:aws:secretsmanager:us-east-1:123456789012:secret:new-secret')
+        mock_secretsmanager.create_secret.assert_called_with(
+            Name='new-secret',
+            SecretString=json.dumps({'key': 'value'})
+        )
+
+if __name__ == '__main__':
+    unittest.main()
\ No newline at end of file
diff --git a/tests/rag/test_ingest.py b/tests/rag/test_ingest.py
new file mode 100644
index 00000000..ac4c9f10
--- /dev/null
+++ b/tests/rag/test_ingest.py
@@ -0,0 +1,223 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+import unittest
+from unittest.mock import patch, MagicMock, mock_open
+import os
+import io
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest import Ingest
+from opensearchpy import exceptions as opensearch_exceptions
+import json
+
+class TestIngest(unittest.TestCase):
+    def setUp(self):
+        self.config = {
+            'region': 'us-east-1',
+            'index_name': 'test-index',
+            'embedding_model_id': 'test-embedding-model-id',
+            'ingest_pipeline_name': 'test-ingest-pipeline'
+        }
+        self.ingest = Ingest(self.config)
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.OpenSearchConnector')
+    def test_initialize_clients_success(self, mock_opensearch_connector):
+        mock_instance = mock_opensearch_connector.return_value
+        mock_instance.initialize_opensearch_client.return_value = True
+
+        ingest = Ingest(self.config)
+        result = ingest.initialize_clients()
+
+        self.assertTrue(result)
+        mock_instance.initialize_opensearch_client.assert_called_once()
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.OpenSearchConnector')
+    def test_initialize_clients_failure(self, mock_opensearch_connector):
+        mock_instance = mock_opensearch_connector.return_value
+        mock_instance.initialize_opensearch_client.return_value = False
+
+        ingest = Ingest(self.config)
+        result = ingest.initialize_clients()
+
+        self.assertFalse(result)
+        mock_instance.initialize_opensearch_client.assert_called_once()
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isfile')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.walk')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isdir')
+    def test_ingest_command_with_valid_files(self, mock_isdir, mock_walk, mock_isfile):
+        paths = ['/path/to/dir', '/path/to/file.txt']
+        mock_isfile.side_effect = lambda x: x == '/path/to/file.txt'
+        mock_isdir.side_effect = lambda x: x == '/path/to/dir'
+        mock_walk.return_value = [('/path/to/dir', [], ['file3.pdf'])]
+
+        with patch.object(self.ingest, 'process_and_ingest_data') as mock_process_and_ingest_data:
+            self.ingest.ingest_command(paths)
+            mock_process_and_ingest_data.assert_called_once()
+            args, kwargs = mock_process_and_ingest_data.call_args
+            expected_files = ['/path/to/file.txt', '/path/to/dir/file3.pdf']
+            self.assertCountEqual(args[0], expected_files)
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isfile')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.walk')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isdir')
+    def test_ingest_command_no_valid_files(self, mock_isdir, mock_walk, mock_isfile):
+        paths = ['/invalid/path']
+        mock_isfile.return_value = False
+        mock_isdir.return_value = False
+
+        with patch('builtins.print') as mock_print:
+            self.ingest.ingest_command(paths)
+            mock_print.assert_any_call('\x1b[33mInvalid path: /invalid/path\x1b[0m')
+            mock_print.assert_any_call('\x1b[31mNo valid files found for ingestion.\x1b[0m')
+
+    @patch.object(Ingest, 'initialize_clients', return_value=True)
+    @patch.object(Ingest, 'create_ingest_pipeline')
+    @patch.object(Ingest, 'process_file')
+    @patch.object(Ingest, 'text_embedding', return_value=[0.1, 0.2, 0.3])
+    def test_process_and_ingest_data(self, mock_text_embedding, mock_process_file, mock_create_pipeline, mock_initialize_clients):
+        file_paths = ['/path/to/file1.txt']
+        documents = [{'text': 'Sample text'}]
+        mock_process_file.return_value = documents
+
+        # Patch the 'bulk_index' method on the instance's 'opensearch' attribute
+        with patch.object(self.ingest.opensearch, 'bulk_index', return_value=(1, 0)) as mock_bulk_index:
+            self.ingest.process_and_ingest_data(file_paths)
+
+            mock_initialize_clients.assert_called_once()
+            mock_create_pipeline.assert_called_once_with(self.ingest.pipeline_name)
+            mock_process_file.assert_called_once_with('/path/to/file1.txt')
+            mock_text_embedding.assert_called_once_with('Sample text')
+            mock_bulk_index.assert_called_once()
+
+    def test_create_ingest_pipeline_exists(self):
+        pipeline_id = 'test-pipeline'
+        with patch.object(self.ingest.opensearch, 'opensearch_client') as mock_opensearch_client:
+            mock_opensearch_client.ingest.get_pipeline.return_value = {}
+
+            with patch('builtins.print') as mock_print:
+                self.ingest.create_ingest_pipeline(pipeline_id)
+                mock_opensearch_client.ingest.get_pipeline.assert_called_once_with(id=pipeline_id)
+                mock_print.assert_any_call(f"\nIngest pipeline '{pipeline_id}' already exists.")
+
+    def test_create_ingest_pipeline_not_exists(self):
+        pipeline_id = 'test-pipeline'
+        pipeline_body = {
+            "description": "A text chunking ingest pipeline",
+            "processors": [
+                {
+                    "text_chunking": {
+                        "algorithm": {
+                            "fixed_token_length": {
+                                "token_limit": 384,
+                                "overlap_rate": 0.2,
+                                "tokenizer": "standard"
+                            }
+                        },
+                        "field_map": {
+                            "nominee_text": "passage_chunk"
+                        }
+                    }
+                }
+            ]
+        }
+
+        with patch.object(self.ingest.opensearch, 'opensearch_client') as mock_opensearch_client:
+            mock_opensearch_client.ingest.get_pipeline.side_effect = opensearch_exceptions.NotFoundError(
+                404, "Not Found", {"error": "Pipeline not found"}
+            )
+
+            with patch('builtins.print') as mock_print:
+                self.ingest.create_ingest_pipeline(pipeline_id)
+
+                mock_opensearch_client.ingest.get_pipeline.assert_called_once_with(id=pipeline_id)
+                mock_opensearch_client.ingest.put_pipeline.assert_called_once_with(id=pipeline_id, body=pipeline_body)
+                mock_print.assert_any_call(f"\nIngest pipeline '{pipeline_id}' created successfully.")
+
+    @patch('builtins.open', new_callable=mock_open, read_data='col1,col2\nvalue1,value2\n')
+    def test_process_csv(self, mock_file):
+        file_path = '/path/to/file.csv'
+        with patch('csv.DictReader') as mock_csv_reader:
+            mock_csv_reader.return_value = [{'col1': 'value1', 'col2': 'value2'}]
+            result = self.ingest.process_csv(file_path)
+            mock_file.assert_called_once_with(file_path, 'r', newline='', encoding='utf-8')
+            self.assertEqual(result, [{'text': json.dumps({'col1': 'value1', 'col2': 'value2'})}])
+
+    @patch('builtins.open', new_callable=mock_open, read_data='Sample TXT data')
+    def test_process_txt(self, mock_file):
+        file_path = '/path/to/file.txt'
+        result = self.ingest.process_txt(file_path)
+        mock_file.assert_called_once_with(file_path, 'r')
+        self.assertEqual(result, [{'text': 'Sample TXT data'}])
+
+    @patch('PyPDF2.PdfReader')
+    @patch('builtins.open', new_callable=mock_open)
+    def test_process_pdf(self, mock_file, mock_pdf_reader):
+        file_path = '/path/to/file.pdf'
+        mock_pdf_reader_instance = mock_pdf_reader.return_value
+        mock_page = MagicMock()
+        mock_page.extract_text.return_value = 'Sample PDF page text'
+        mock_pdf_reader_instance.pages = [mock_page]
+
+        result = self.ingest.process_pdf(file_path)
+
+        mock_file.assert_called_once_with(file_path, 'rb')
+        mock_pdf_reader.assert_called_once_with(mock_file.return_value)
+        self.assertEqual(result, [{'text': 'Sample PDF page text'}])
+
+    @patch('time.sleep', return_value=None)
+    def test_text_embedding_failure(self, mock_sleep):
+        text = 'Sample text'
+
+        with patch.object(self.ingest.opensearch, 'opensearch_client') as mock_opensearch_client:
+            mock_opensearch_client.transport.perform_request.side_effect = Exception('Test exception')
+
+            with patch('builtins.print') as mock_print:
+                with self.assertRaises(Exception) as context:
+                    self.ingest.text_embedding(text, max_retries=1)
+                self.assertTrue('Test exception' in str(context.exception))
+                mock_print.assert_any_call('Error on attempt 1: Test exception')
+
+    def test_text_embedding_success(self):
+        text = 'Sample text'
+        embedding = [0.1, 0.2, 0.3]
+        response = {
+            'inference_results': [
+                {
+                    'output': [
+                        {'data': embedding}
+                    ]
+                }
+            ]
+        }
+
+        with patch.object(self.ingest.opensearch, 'opensearch_client') as mock_opensearch_client:
+            mock_opensearch_client.transport.perform_request.return_value = response
+
+            result = self.ingest.text_embedding(text)
+
+            self.assertEqual(result, embedding)
+            mock_opensearch_client.transport.perform_request.assert_called_once()
+
+if __name__ == '__main__':
+    unittest.main()
\ No newline at end of file
diff --git a/tests/rag/test_ml_models/test_BedrockModel.py b/tests/rag/test_ml_models/test_BedrockModel.py
new file mode 100644
index 00000000..dd32704c
--- /dev/null
+++ b/tests/rag/test_ml_models/test_BedrockModel.py
@@ -0,0 +1,116 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+import unittest
+from unittest.mock import Mock, patch, call
+import json
+from io import StringIO
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.BedrockModel import BedrockModel
+
+class TestBedrockModel(unittest.TestCase):
+
+    def setUp(self):
+        self.aws_region = "us-west-2"
+        self.opensearch_domain_name = "test-domain"
+        self.opensearch_username = "test-user"
+        self.opensearch_password = "test-password"
+        self.mock_iam_role_helper = Mock()
+        self.bedrock_model = BedrockModel(
+            self.aws_region,
+            self.opensearch_domain_name,
+            self.opensearch_username,
+            self.opensearch_password,
+            self.mock_iam_role_helper
+        )
+
+    def test_init(self):
+        self.assertEqual(self.bedrock_model.aws_region, self.aws_region)
+        self.assertEqual(self.bedrock_model.opensearch_domain_name, self.opensearch_domain_name)
+        self.assertEqual(self.bedrock_model.opensearch_username, self.opensearch_username)
+        self.assertEqual(self.bedrock_model.opensearch_password, self.opensearch_password)
+        self.assertEqual(self.bedrock_model.iam_role_helper, self.mock_iam_role_helper)
+
+    @patch('builtins.input', side_effect=['', '1'])
+    def test_register_bedrock_model_default(self, mock_input):
+        mock_helper = Mock()
+        mock_helper.create_connector_with_role.return_value = "test-connector-id"
+        mock_helper.create_model.return_value = "test-model-id"
+        
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.bedrock_model.register_bedrock_model(mock_helper, mock_config, mock_save_config)
+
+        mock_helper.create_connector_with_role.assert_called_once()
+        mock_helper.create_model.assert_called_once()
+        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+
+    @patch('builtins.input', side_effect=['custom-region', '2', '{"name": "Custom Model", "description": "Custom description"}'])
+    def test_register_bedrock_model_custom(self, mock_input):
+        mock_helper = Mock()
+        mock_helper.create_connector_with_role.return_value = "test-connector-id"
+        mock_helper.create_model.return_value = "test-model-id"
+        
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.bedrock_model.register_bedrock_model(mock_helper, mock_config, mock_save_config)
+
+        mock_helper.create_connector_with_role.assert_called_once()
+        mock_helper.create_model.assert_called_once_with("Custom Model", "Custom description", "test-connector-id", "my_test_create_bedrock_connector_role")
+        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+
+    def test_save_model_id(self):
+        mock_config = {}
+        mock_save_config = Mock()
+        self.bedrock_model.save_model_id(mock_config, mock_save_config, "test-model-id")
+        self.assertEqual(mock_config, {'embedding_model_id': 'test-model-id'})
+        mock_save_config.assert_called_once_with(mock_config)
+
+    @patch('builtins.input', return_value='1')
+    def test_get_custom_model_details_default(self, mock_input):
+        default_input = {"name": "Default Model"}
+        result = self.bedrock_model.get_custom_model_details(default_input)
+        self.assertEqual(result, default_input)
+
+    @patch('builtins.input', side_effect=['2', '{"name": "Custom Model"}'])
+    def test_get_custom_model_details_custom(self, mock_input):
+        default_input = {"name": "Default Model"}
+        result = self.bedrock_model.get_custom_model_details(default_input)
+        self.assertEqual(result, {"name": "Custom Model"})
+
+
+    @patch('builtins.input', return_value='2\n{invalid json}')
+    def test_get_custom_model_details_invalid_json(self, mock_input):
+        default_input = {"name": "Default Model"}
+        result = self.bedrock_model.get_custom_model_details(default_input)
+        self.assertIsNone(result)
+
+    @patch('builtins.input', return_value='3')
+    def test_get_custom_model_details_invalid_choice(self, mock_input):
+        default_input = {"name": "Default Model"}
+        result = self.bedrock_model.get_custom_model_details(default_input)
+        self.assertIsNone(result)
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/tests/rag/test_ml_models/test_CohereModel.py b/tests/rag/test_ml_models/test_CohereModel.py
new file mode 100644
index 00000000..79b9f662
--- /dev/null
+++ b/tests/rag/test_ml_models/test_CohereModel.py
@@ -0,0 +1,158 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+import unittest
+from unittest.mock import Mock, patch, call
+import json
+from io import StringIO
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.CohereModel import CohereModel
+
+class TestCohereModel(unittest.TestCase):
+
+    def setUp(self):
+        self.aws_region = "us-west-2"
+        self.opensearch_domain_name = "test-domain"
+        self.opensearch_username = "test-user"
+        self.opensearch_password = "test-password"
+        self.mock_iam_role_helper = Mock()
+        self.cohere_model = CohereModel(
+            self.aws_region,
+            self.opensearch_domain_name,
+            self.opensearch_username,
+            self.opensearch_password,
+            self.mock_iam_role_helper
+        )
+
+    def test_init(self):
+        self.assertEqual(self.cohere_model.aws_region, self.aws_region)
+        self.assertEqual(self.cohere_model.opensearch_domain_name, self.opensearch_domain_name)
+        self.assertEqual(self.cohere_model.opensearch_username, self.opensearch_username)
+        self.assertEqual(self.cohere_model.opensearch_password, self.opensearch_password)
+        self.assertEqual(self.cohere_model.iam_role_helper, self.mock_iam_role_helper)
+
+    @patch('builtins.input', side_effect=['test-secret', 'test-api-key', '1'])
+    def test_register_cohere_model(self, mock_input):
+        mock_helper = Mock()
+        mock_helper.create_connector_with_secret.return_value = "test-connector-id"
+        mock_helper.create_model.return_value = "test-model-id"
+        
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.cohere_model.register_cohere_model(mock_helper, mock_config, mock_save_config)
+
+        mock_helper.create_connector_with_secret.assert_called_once()
+        mock_helper.create_model.assert_called_once()
+        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+
+    @patch('builtins.input', side_effect=['test-api-key', '1'])
+    @patch('time.time', return_value=1000000)
+    def test_register_cohere_model_opensource(self, mock_time, mock_input):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.side_effect = [
+            {'connector_id': 'test-connector-id'},
+            {'model_group_id': 'test-model-group-id'},
+            {'task_id': 'test-task-id'},
+            {'state': 'COMPLETED', 'model_id': 'test-model-id'},
+            {}  # for model deployment
+        ]
+        
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.cohere_model.register_cohere_model_opensource(mock_opensearch_client, mock_config, mock_save_config)
+
+        self.assertEqual(mock_opensearch_client.transport.perform_request.call_count, 5)
+        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+
+    def test_get_custom_model_details_default(self):
+        with patch('builtins.input', return_value='1'):
+            default_input = {"name": "Default Model"}
+            result = self.cohere_model.get_custom_model_details(default_input)
+            self.assertEqual(result, default_input)
+
+    def test_get_custom_model_details_custom(self):
+        with patch('builtins.input', side_effect=['2', '{"name": "Custom Model"}']):
+            default_input = {"name": "Default Model"}
+            result = self.cohere_model.get_custom_model_details(default_input)
+            self.assertEqual(result, {"name": "Custom Model"})
+
+    def test_get_custom_model_details_invalid_json(self):
+        with patch('builtins.input', side_effect=['2', 'invalid json']):
+            default_input = {"name": "Default Model"}
+            result = self.cohere_model.get_custom_model_details(default_input)
+            self.assertIsNone(result)
+
+    def test_get_custom_model_details_invalid_choice(self):
+        with patch('builtins.input', return_value='3'):
+            default_input = {"name": "Default Model"}
+            result = self.cohere_model.get_custom_model_details(default_input)
+            self.assertIsNone(result)
+
+    def test_get_custom_json_input_valid(self):
+        with patch('builtins.input', return_value='{"key": "value"}'):
+            result = self.cohere_model.get_custom_json_input()
+            self.assertEqual(result, {"key": "value"})
+
+    def test_get_custom_json_input_invalid(self):
+        with patch('builtins.input', return_value='invalid json'):
+            result = self.cohere_model.get_custom_json_input()
+            self.assertIsNone(result)
+
+    @patch('time.time', side_effect=[0, 10, 20, 30])
+    @patch('time.sleep', return_value=None)
+    def test_wait_for_model_registration_success(self, mock_sleep, mock_time):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.side_effect = [
+            {'state': 'RUNNING'},
+            {'state': 'RUNNING'},
+            {'state': 'COMPLETED', 'model_id': 'test-model-id'}
+        ]
+        
+        result = self.cohere_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
+        self.assertEqual(result, 'test-model-id')
+
+    @patch('time.time', side_effect=[0, 10, 20, 30])
+    @patch('time.sleep', return_value=None)
+    def test_wait_for_model_registration_failure(self, mock_sleep, mock_time):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.side_effect = [
+            {'state': 'RUNNING'},
+            {'state': 'FAILED'}
+        ]
+        
+        result = self.cohere_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
+        self.assertIsNone(result)
+
+    @patch('time.time', side_effect=[0, 1000])
+    @patch('time.sleep', return_value=None)
+    def test_wait_for_model_registration_timeout(self, mock_sleep, mock_time):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.return_value = {'state': 'RUNNING'}
+        
+        result = self.cohere_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id', timeout=5)
+        self.assertIsNone(result)
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/tests/rag/test_ml_models/test_OpenAIModel.py b/tests/rag/test_ml_models/test_OpenAIModel.py
new file mode 100644
index 00000000..1dc6f6f7
--- /dev/null
+++ b/tests/rag/test_ml_models/test_OpenAIModel.py
@@ -0,0 +1,157 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+import unittest
+from unittest.mock import Mock, patch, call
+import json
+from io import StringIO
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.OpenAIModel import OpenAIModel
+
+class TestOpenAIModel(unittest.TestCase):
+
+    def setUp(self):
+        self.aws_region = "us-west-2"
+        self.opensearch_domain_name = "test-domain"
+        self.opensearch_username = "test-user"
+        self.opensearch_password = "test-password"
+        self.mock_iam_role_helper = Mock()
+        self.openai_model = OpenAIModel(
+            self.aws_region,
+            self.opensearch_domain_name,
+            self.opensearch_username,
+            self.opensearch_password,
+            self.mock_iam_role_helper
+        )
+
+    def test_init(self):
+        self.assertEqual(self.openai_model.aws_region, self.aws_region)
+        self.assertEqual(self.openai_model.opensearch_domain_name, self.opensearch_domain_name)
+        self.assertEqual(self.openai_model.opensearch_username, self.opensearch_username)
+        self.assertEqual(self.openai_model.opensearch_password, self.opensearch_password)
+        self.assertEqual(self.openai_model.iam_role_helper, self.mock_iam_role_helper)
+
+    @patch('builtins.input', side_effect=['test-secret', 'test-api-key', '1'])
+    def test_register_openai_model(self, mock_input):
+        mock_helper = Mock()
+        mock_helper.create_connector_with_secret.return_value = "test-connector-id"
+        mock_helper.create_model.return_value = "test-model-id"
+        
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.openai_model.register_openai_model(mock_helper, mock_config, mock_save_config)
+
+        mock_helper.create_connector_with_secret.assert_called_once()
+        mock_helper.create_model.assert_called_once()
+        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+
+    @patch('builtins.input', side_effect=['test-api-key', '1'])
+    @patch('time.time', return_value=1000000)
+    def test_register_openai_model_opensource(self, mock_time, mock_input):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.side_effect = [
+            {'connector_id': 'test-connector-id'},
+            {'model_group_id': 'test-model-group-id'},
+            {'task_id': 'test-task-id'},
+            {'state': 'COMPLETED', 'model_id': 'test-model-id'},
+            {}  # for model deployment
+        ]
+        
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.openai_model.register_openai_model_opensource(mock_opensearch_client, mock_config, mock_save_config)
+
+        self.assertEqual(mock_opensearch_client.transport.perform_request.call_count, 5)
+        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+
+    def test_get_custom_model_details_default(self):
+        with patch('builtins.input', return_value='1'):
+            default_input = {"name": "Default Model"}
+            result = self.openai_model.get_custom_model_details(default_input)
+            self.assertEqual(result, default_input)
+
+    def test_get_custom_model_details_custom(self):
+        with patch('builtins.input', side_effect=['2', '{"name": "Custom Model"}']):
+            default_input = {"name": "Default Model"}
+            result = self.openai_model.get_custom_model_details(default_input)
+            self.assertEqual(result, {"name": "Custom Model"})
+
+    def test_get_custom_model_details_invalid_json(self):
+        with patch('builtins.input', side_effect=['2', 'invalid json']):
+            default_input = {"name": "Default Model"}
+            result = self.openai_model.get_custom_model_details(default_input)
+            self.assertIsNone(result)
+
+    def test_get_custom_model_details_invalid_choice(self):
+        with patch('builtins.input', return_value='3'):
+            default_input = {"name": "Default Model"}
+            result = self.openai_model.get_custom_model_details(default_input)
+            self.assertIsNone(result)
+
+    def test_get_custom_json_input_valid(self):
+        with patch('builtins.input', return_value='{"key": "value"}'):
+            result = self.openai_model.get_custom_json_input()
+            self.assertEqual(result, {"key": "value"})
+
+    def test_get_custom_json_input_invalid(self):
+        with patch('builtins.input', return_value='invalid json'):
+            result = self.openai_model.get_custom_json_input()
+            self.assertIsNone(result)
+
+    @patch('time.time', side_effect=[0, 10, 20, 30])
+    @patch('time.sleep', return_value=None)
+    def test_wait_for_model_registration_success(self, mock_sleep, mock_time):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.side_effect = [
+            {'state': 'RUNNING'},
+            {'state': 'RUNNING'},
+            {'state': 'COMPLETED', 'model_id': 'test-model-id'}
+        ]
+        
+        result = self.openai_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
+        self.assertEqual(result, 'test-model-id')
+
+    @patch('time.time', side_effect=[0, 10, 20, 30])
+    @patch('time.sleep', return_value=None)
+    def test_wait_for_model_registration_failure(self, mock_sleep, mock_time):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.side_effect = [
+            {'state': 'RUNNING'},
+            {'state': 'FAILED'}
+        ]
+        
+        result = self.openai_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
+        self.assertIsNone(result)
+
+    @patch('time.time', side_effect=[0, 1000])
+    @patch('time.sleep', return_value=None)
+    def test_wait_for_model_registration_timeout(self, mock_sleep, mock_time):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.return_value = {'state': 'RUNNING'}
+        
+        result = self.openai_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id', timeout=5)
+        self.assertIsNone(result)
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/tests/rag/test_ml_models/test_PyTorchModel.py b/tests/rag/test_ml_models/test_PyTorchModel.py
new file mode 100644
index 00000000..6733315d
--- /dev/null
+++ b/tests/rag/test_ml_models/test_PyTorchModel.py
@@ -0,0 +1,162 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+import unittest
+from unittest.mock import Mock, patch, call, mock_open
+import json
+from io import StringIO
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.PyTorchModel import CustomPyTorchModel
+
+class TestCustomPyTorchModel(unittest.TestCase):
+
+    def setUp(self):
+        self.aws_region = "us-west-2"
+        self.opensearch_domain_name = "test-domain"
+        self.opensearch_username = "test-user"
+        self.opensearch_password = "test-password"
+        self.mock_iam_role_helper = Mock()
+        self.custom_pytorch_model = CustomPyTorchModel(
+            self.aws_region,
+            self.opensearch_domain_name,
+            self.opensearch_username,
+            self.opensearch_password,
+            self.mock_iam_role_helper
+        )
+
+    def test_init(self):
+        self.assertEqual(self.custom_pytorch_model.aws_region, self.aws_region)
+        self.assertEqual(self.custom_pytorch_model.opensearch_domain_name, self.opensearch_domain_name)
+        self.assertEqual(self.custom_pytorch_model.opensearch_username, self.opensearch_username)
+        self.assertEqual(self.custom_pytorch_model.opensearch_password, self.opensearch_password)
+        self.assertEqual(self.custom_pytorch_model.iam_role_helper, self.mock_iam_role_helper)
+
+    @patch('builtins.input', side_effect=['1', '/path/to/model.pt'])
+    @patch('os.path.isfile', return_value=True)
+    @patch('builtins.open', new_callable=mock_open, read_data=b'model_content')
+    def test_register_custom_pytorch_model_default(self, mock_file, mock_isfile, mock_input):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.side_effect = [
+            {'model_id': 'uploaded_model_id'},
+            {'task_id': 'test-task-id'},
+            {'state': 'COMPLETED', 'model_id': 'registered_model_id'},
+            {}  # for model deployment
+        ]
+        
+        mock_config = {'embedding_dimension': 768}
+        mock_save_config = Mock()
+
+        self.custom_pytorch_model.register_custom_pytorch_model(mock_opensearch_client, mock_config, mock_save_config)
+
+        self.assertEqual(mock_opensearch_client.transport.perform_request.call_count, 4)
+        mock_save_config.assert_called_once_with({'embedding_dimension': 768, 'embedding_model_id': 'registered_model_id'})
+
+    @patch('builtins.input', side_effect=['2', '/path/to/model.pt', '{"name": "custom_model", "model_format": "TORCH_SCRIPT", "model_config": {"embedding_dimension": 512, "framework_type": "CUSTOM", "model_type": "bert"}, "description": "Custom model"}'])
+    @patch('os.path.isfile', return_value=True)
+    @patch('builtins.open', new_callable=mock_open, read_data=b'model_content')
+    def test_register_custom_pytorch_model_custom(self, mock_file, mock_isfile, mock_input):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.side_effect = [
+            {'model_id': 'uploaded_model_id'},
+            {'task_id': 'test-task-id'},
+            {'state': 'COMPLETED', 'model_id': 'registered_model_id'},
+            {}  # for model deployment
+        ]
+        
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.custom_pytorch_model.register_custom_pytorch_model(mock_opensearch_client, mock_config, mock_save_config)
+
+        self.assertEqual(mock_opensearch_client.transport.perform_request.call_count, 4)
+        mock_save_config.assert_called_once_with({'embedding_model_id': 'registered_model_id'})
+
+    @patch('builtins.input', side_effect=['1', '/nonexistent/path.pt'])
+    @patch('os.path.isfile', return_value=False)
+    def test_register_custom_pytorch_model_file_not_found(self, mock_isfile, mock_input):
+        mock_opensearch_client = Mock()
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.custom_pytorch_model.register_custom_pytorch_model(mock_opensearch_client, mock_config, mock_save_config)
+
+        mock_opensearch_client.transport.perform_request.assert_not_called()
+        mock_save_config.assert_not_called()
+
+    @patch('builtins.input', return_value='3')
+    def test_register_custom_pytorch_model_invalid_choice(self, mock_input):
+        mock_opensearch_client = Mock()
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.custom_pytorch_model.register_custom_pytorch_model(mock_opensearch_client, mock_config, mock_save_config)
+
+        mock_opensearch_client.transport.perform_request.assert_not_called()
+        mock_save_config.assert_not_called()
+
+    def test_get_custom_json_input_valid(self):
+        with patch('builtins.input', return_value='{"key": "value"}'):
+            result = self.custom_pytorch_model.get_custom_json_input()
+            self.assertEqual(result, {"key": "value"})
+
+    def test_get_custom_json_input_invalid(self):
+        with patch('builtins.input', return_value='invalid json'):
+            result = self.custom_pytorch_model.get_custom_json_input()
+            self.assertIsNone(result)
+
+    @patch('time.time', side_effect=[0, 10, 20, 30])
+    @patch('time.sleep', return_value=None)
+    def test_wait_for_model_registration_success(self, mock_sleep, mock_time):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.side_effect = [
+            {'state': 'RUNNING'},
+            {'state': 'RUNNING'},
+            {'state': 'COMPLETED', 'model_id': 'test-model-id'}
+        ]
+        
+        result = self.custom_pytorch_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
+        self.assertEqual(result, 'test-model-id')
+
+    @patch('time.time', side_effect=[0, 10, 20, 30])
+    @patch('time.sleep', return_value=None)
+    def test_wait_for_model_registration_failure(self, mock_sleep, mock_time):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.side_effect = [
+            {'state': 'RUNNING'},
+            {'state': 'FAILED'}
+        ]
+        
+        result = self.custom_pytorch_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
+        self.assertIsNone(result)
+
+    @patch('time.time', side_effect=[0, 1000])
+    @patch('time.sleep', return_value=None)
+    def test_wait_for_model_registration_timeout(self, mock_sleep, mock_time):
+        mock_opensearch_client = Mock()
+        mock_opensearch_client.transport.perform_request.return_value = {'state': 'RUNNING'}
+        
+        result = self.custom_pytorch_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id', timeout=5)
+        self.assertIsNone(result)
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/tests/rag/test_ml_models/test_SageMakerModel.py b/tests/rag/test_ml_models/test_SageMakerModel.py
new file mode 100644
index 00000000..1041f28e
--- /dev/null
+++ b/tests/rag/test_ml_models/test_SageMakerModel.py
@@ -0,0 +1,137 @@
+
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+import unittest
+from unittest.mock import Mock, patch, call
+import json
+from io import StringIO
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.SageMakerModel import SageMakerModel
+
+class TestSageMakerModel(unittest.TestCase):
+
+    def setUp(self):
+        self.aws_region = "us-west-2"
+        self.opensearch_domain_name = "test-domain"
+        self.opensearch_username = "test-user"
+        self.opensearch_password = "test-password"
+        self.mock_iam_role_helper = Mock()
+        self.sagemaker_model = SageMakerModel(
+            self.aws_region,
+            self.opensearch_domain_name,
+            self.opensearch_username,
+            self.opensearch_password,
+            self.mock_iam_role_helper
+        )
+
+    def test_init(self):
+        self.assertEqual(self.sagemaker_model.aws_region, self.aws_region)
+        self.assertEqual(self.sagemaker_model.opensearch_domain_name, self.opensearch_domain_name)
+        self.assertEqual(self.sagemaker_model.opensearch_username, self.opensearch_username)
+        self.assertEqual(self.sagemaker_model.opensearch_password, self.opensearch_password)
+        self.assertEqual(self.sagemaker_model.iam_role_helper, self.mock_iam_role_helper)
+
+    @patch('builtins.input', side_effect=[
+        'arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint',
+        'https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations',
+        ''  # Empty string for region, to use default
+    ])
+    def test_register_sagemaker_model(self, mock_input):
+        mock_helper = Mock()
+        mock_helper.create_connector_with_role.return_value = "test-connector-id"
+        mock_helper.create_model.return_value = "test-model-id"
+        
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.sagemaker_model.register_sagemaker_model(mock_helper, mock_config, mock_save_config)
+
+        # Check if create_connector_with_role was called
+        mock_helper.create_connector_with_role.assert_called_once()
+        call_args, call_kwargs = mock_helper.create_connector_with_role.call_args
+
+        # Check the arguments without assuming a specific order or number
+        self.assertIn("my_test_sagemaker_connector_role", call_args)
+        self.assertIn("my_test_create_sagemaker_connector_role", call_args)
+
+        # Check the inline policy
+        inline_policy = next(arg for arg in call_args if isinstance(arg, dict) and 'Statement' in arg)
+        self.assertEqual(inline_policy['Statement'][0]['Action'], ["sagemaker:InvokeEndpoint"])
+        self.assertEqual(inline_policy['Statement'][0]['Resource'], 
+                        "arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint")
+
+        # Check the connector input
+        connector_input = next(arg for arg in call_args if isinstance(arg, dict) and 'name' in arg)
+        self.assertEqual(connector_input['name'], "SageMaker Embedding Model Connector")
+        self.assertEqual(connector_input['parameters']['region'], "us-west-2")
+        self.assertEqual(connector_input['actions'][0]['url'], 
+                        "https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations")
+
+        # Check if create_model was called with correct arguments
+        mock_helper.create_model.assert_called_once_with(
+            "SageMaker Embedding Model",
+            "SageMaker embedding model for semantic search",
+            "test-connector-id",
+            "my_test_create_sagemaker_connector_role"
+        )
+
+        # Check if config was saved correctly
+        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+
+    @patch('builtins.input', side_effect=[
+        'arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint',
+        'https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations',
+        ''  # Empty string for region, to use default
+    ])
+    def test_register_sagemaker_model_connector_creation_failure(self, mock_input):
+        mock_helper = Mock()
+        mock_helper.create_connector_with_role.return_value = None
+        
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.sagemaker_model.register_sagemaker_model(mock_helper, mock_config, mock_save_config)
+
+        mock_helper.create_model.assert_not_called()
+        mock_save_config.assert_not_called()
+
+    @patch('builtins.input', side_effect=[
+        'arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint',
+        'https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations',
+        ''  # Empty string for region, to use default
+    ])
+    def test_register_sagemaker_model_model_creation_failure(self, mock_input):
+        mock_helper = Mock()
+        mock_helper.create_connector_with_role.return_value = "test-connector-id"
+        mock_helper.create_model.return_value = None
+        
+        mock_config = {}
+        mock_save_config = Mock()
+
+        self.sagemaker_model.register_sagemaker_model(mock_helper, mock_config, mock_save_config)
+
+        mock_save_config.assert_not_called()
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/tests/rag/test_opensearch_connector.py b/tests/rag/test_opensearch_connector.py
new file mode 100644
index 00000000..25f5364f
--- /dev/null
+++ b/tests/rag/test_opensearch_connector.py
@@ -0,0 +1,249 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+import unittest
+from unittest.mock import patch, MagicMock, Mock
+from opensearchpy import OpenSearch, AWSV4SignerAuth, exceptions as opensearch_exceptions
+from urllib.parse import urlparse
+from opensearchpy import RequestsHttpConnection
+
+# Adjust the import to match your project structure
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import OpenSearchConnector
+
+class TestOpenSearchConnector(unittest.TestCase):
+    def setUp(self):
+        # Sample configuration
+        self.config = {
+            'region': 'us-east-1',
+            'index_name': 'test-index',
+            'is_serverless': 'False',
+            'opensearch_endpoint': 'https://search-example.us-east-1.es.amazonaws.com',
+            'opensearch_username': 'admin',
+            'opensearch_password': 'admin',
+            'service_type': 'managed',
+        }
+
+        # Update the patch target to match the actual import location
+        self.patcher_opensearch = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector.OpenSearch')
+        self.MockOpenSearch = self.patcher_opensearch.start()
+
+        # Mocked OpenSearch client instance
+        self.mock_opensearch_client = MagicMock()
+        self.MockOpenSearch.return_value = self.mock_opensearch_client
+
+        # Patch boto3 Session
+        self.patcher_boto3_session = patch('boto3.Session')
+        self.MockBoto3Session = self.patcher_boto3_session.start()
+
+        # Mocked boto3 credentials
+        self.mock_credentials = Mock()
+        self.MockBoto3Session.return_value.get_credentials.return_value = self.mock_credentials
+
+    def tearDown(self):
+        self.patcher_opensearch.stop()
+        self.patcher_boto3_session.stop()
+
+    def test_initialize_opensearch_client_managed(self):
+        connector = OpenSearchConnector(self.config)
+        result = connector.initialize_opensearch_client()
+        self.assertTrue(result)
+        self.MockOpenSearch.assert_called_once()
+        self.MockOpenSearch.assert_called_with(
+            hosts=[{'host': 'search-example.us-east-1.es.amazonaws.com', 'port': 443}],
+            http_auth=('admin', 'admin'),
+            use_ssl=True,
+            verify_certs=False,
+            connection_class=RequestsHttpConnection,
+            pool_maxsize=20
+        )
+
+    def test_initialize_opensearch_client_serverless(self):
+        self.config['service_type'] = 'serverless'
+        connector = OpenSearchConnector(self.config)
+        result = connector.initialize_opensearch_client()
+        self.assertTrue(result)
+        self.MockOpenSearch.assert_called_once()
+        # Check that AWSV4SignerAuth is used
+        args, kwargs = self.MockOpenSearch.call_args
+        self.assertIsInstance(kwargs['http_auth'], AWSV4SignerAuth)
+
+    def test_initialize_opensearch_client_missing_endpoint(self):
+        self.config['opensearch_endpoint'] = ''
+        connector = OpenSearchConnector(self.config)
+        with patch('builtins.print') as mock_print:
+            result = connector.initialize_opensearch_client()
+            self.assertFalse(result)
+            mock_print.assert_called_with("OpenSearch endpoint not set. Please run setup first.")
+
+    def test_create_index_success(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        connector.create_index(embedding_dimension=768, space_type='cosinesimil')
+        self.mock_opensearch_client.indices.create.assert_called_once()
+
+    def test_create_index_already_exists(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        # Simulate index already exists exception
+        self.mock_opensearch_client.indices.create.side_effect = opensearch_exceptions.RequestError(
+            '400', 'resource_already_exists_exception', 'Index already exists'
+        )
+        with patch('builtins.print') as mock_print:
+            connector.create_index(embedding_dimension=768, space_type='cosinesimil')
+            mock_print.assert_called_with(f"Index '{self.config['index_name']}' already exists.")
+
+    def test_create_index_other_exception(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        # Simulate a different exception
+        self.mock_opensearch_client.indices.create.side_effect = opensearch_exceptions.RequestError(
+            '400', 'some_other_exception', 'Some other error'
+        )
+        with patch('builtins.print') as mock_print:
+            connector.create_index(embedding_dimension=768, space_type='cosinesimil')
+            expected_message = f"Error creating index '{self.config['index_name']}': RequestError(400, 'some_other_exception')"
+            mock_print.assert_called_with(expected_message)
+
+    def test_verify_and_create_index_exists(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        self.mock_opensearch_client.indices.exists.return_value = True
+        with patch('builtins.print') as mock_print:
+            result = connector.verify_and_create_index(embedding_dimension=768, space_type='cosinesimil')
+            self.assertTrue(result)
+            mock_print.assert_called_with(f"KNN index '{self.config['index_name']}' already exists.")
+
+    def test_verify_and_create_index_not_exists(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        self.mock_opensearch_client.indices.exists.return_value = False
+        with patch.object(connector, 'create_index') as mock_create_index:
+            result = connector.verify_and_create_index(embedding_dimension=768, space_type='cosinesimil')
+            self.assertTrue(result)
+            mock_create_index.assert_called_once_with(768, 'cosinesimil')
+
+    def test_verify_and_create_index_exception(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        self.mock_opensearch_client.indices.exists.side_effect = Exception('Connection error')
+        with patch('builtins.print') as mock_print:
+            result = connector.verify_and_create_index(embedding_dimension=768, space_type='cosinesimil')
+            self.assertFalse(result)
+            mock_print.assert_called_with("Error verifying or creating index: Connection error")
+
+    @patch('opensearchpy.helpers.bulk')
+    def test_bulk_index_success(self, mock_bulk):
+        mock_bulk.return_value = (100, [])
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        actions = [{'index': {'_index': 'test-index', '_id': i}} for i in range(100)]
+        with patch('builtins.print') as mock_print:
+            success_count, error_count = connector.bulk_index(actions)
+            self.assertEqual(success_count, 100)
+            self.assertEqual(error_count, 0)
+            mock_print.assert_called_with("Indexed 100 documents successfully. Failed to index 0 documents.")
+
+    @patch('opensearchpy.helpers.bulk')
+    def test_bulk_index_with_errors(self, mock_bulk):
+        mock_bulk.return_value = (90, [{'index': {'_id': '10', 'error': 'Some error'}}])
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        actions = [{'index': {'_index': 'test-index', '_id': i}} for i in range(100)]
+        with patch('builtins.print') as mock_print:
+            success_count, error_count = connector.bulk_index(actions)
+            self.assertEqual(success_count, 90)
+            self.assertEqual(error_count, 1)
+            mock_print.assert_called_with("Indexed 90 documents successfully. Failed to index 1 documents.")
+
+    @patch('opensearchpy.helpers.bulk')
+    def test_bulk_index_exception(self, mock_bulk):
+        mock_bulk.side_effect = Exception('Bulk indexing error')
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        actions = [{'index': {'_index': 'test-index', '_id': i}} for i in range(100)]
+        with patch('builtins.print') as mock_print:
+            success_count, error_count = connector.bulk_index(actions)
+            self.assertEqual(success_count, 0)
+            self.assertEqual(error_count, 100)
+            mock_print.assert_called_with("Error during bulk indexing: Bulk indexing error")
+
+    def test_search_success(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        # Mock search response
+        self.mock_opensearch_client.search.return_value = {
+            'hits': {'hits': [{'id': 1}, {'id': 2}]}
+        }
+        results = connector.search(query_text='test', model_id='model-123', k=5)
+        self.assertEqual(results, [{'id': 1}, {'id': 2}])
+        self.mock_opensearch_client.search.assert_called_once()
+
+    def test_search_exception(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        self.mock_opensearch_client.search.side_effect = Exception('Search error')
+        with patch('builtins.print') as mock_print:
+            results = connector.search(query_text='test', model_id='model-123', k=5)
+            self.assertEqual(results, [])
+            mock_print.assert_called_with("Error during search: Search error")
+
+    def test_search_by_vector_success(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        self.mock_opensearch_client.search.return_value = {
+            'hits': {'hits': [{'id': 1}, {'id': 2}]}
+        }
+        results = connector.search_by_vector(vector=[0.1, 0.2, 0.3], k=5)
+        self.assertEqual(results, [{'id': 1}, {'id': 2}])
+        self.mock_opensearch_client.search.assert_called_once()
+
+    def test_search_by_vector_exception(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        self.mock_opensearch_client.search.side_effect = Exception('Vector search error')
+        with patch('builtins.print') as mock_print:
+            results = connector.search_by_vector(vector=[0.1, 0.2, 0.3], k=5)
+            self.assertEqual(results, [])
+            mock_print.assert_called_with("Error during search: Vector search error")
+
+    def test_check_connection_success(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        # Mock info method
+        self.mock_opensearch_client.info.return_value = {'version': {'number': '7.10.2'}}
+        result = connector.check_connection()
+        self.assertTrue(result)
+        self.mock_opensearch_client.info.assert_called_once()
+
+    def test_check_connection_failure(self):
+        connector = OpenSearchConnector(self.config)
+        connector.opensearch_client = self.mock_opensearch_client
+        self.mock_opensearch_client.info.side_effect = Exception('Connection error')
+        with patch('builtins.print') as mock_print:
+            result = connector.check_connection()
+            self.assertFalse(result)
+            mock_print.assert_called_with("Error connecting to OpenSearch: Connection error")
+
+if __name__ == '__main__':
+    unittest.main()
\ No newline at end of file
diff --git a/tests/rag/test_query.py b/tests/rag/test_query.py
new file mode 100644
index 00000000..d2e0cf99
--- /dev/null
+++ b/tests/rag/test_query.py
@@ -0,0 +1,278 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+import unittest
+from unittest.mock import patch, MagicMock
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.query import Query
+from opensearchpy import exceptions as opensearch_exceptions
+import json
+
+class TestQuery(unittest.TestCase):
+    def setUp(self):
+        # Patch 'print' to suppress output during tests
+        self.print_patcher = patch('builtins.print')
+        self.mock_print = self.print_patcher.start()
+
+        self.config = {
+            'index_name': 'test-index',
+            'embedding_model_id': 'test-embedding-model-id',
+            'llm_model_id': 'test-llm-model-id',
+            'region': 'us-east-1',
+            'default_search_method': 'neural',
+            'llm_max_token_count': '1000',
+            'llm_temperature': '0.7',
+            'llm_top_p': '0.9',
+            'llm_stop_sequences': ''
+        }
+        # Do not instantiate Query here to avoid unmocked initialization.
+
+    def tearDown(self):
+        # Stop the 'print' patcher
+        self.print_patcher.stop()
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.boto3.client')
+    def test_initialize_clients_success(self, mock_boto3_client, mock_opensearch_connector):
+        # Mock OpenSearch client initialization
+        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+        mock_opensearch_connector_instance.check_connection.return_value = True
+
+        # Mock Bedrock client initialization
+        mock_bedrock_client = MagicMock()
+        mock_boto3_client.return_value = mock_bedrock_client
+
+        # Initialize Query instance after patches
+        query_instance = Query(self.config)
+
+        self.assertIsNotNone(query_instance.opensearch)
+        self.assertEqual(query_instance.bedrock_client, mock_bedrock_client)
+        mock_opensearch_connector_instance.initialize_opensearch_client.assert_called_once()
+        mock_boto3_client.assert_called_once_with('bedrock-runtime', region_name='us-east-1')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    def test_initialize_clients_opensearch_failure(self, mock_opensearch_connector):
+        # Mock OpenSearch client initialization failure
+        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = False
+
+        # Since 'print' is mocked in setUp, we can use 'self.mock_print' to assert calls
+        query_instance = Query(self.config)
+        mock_opensearch_connector_instance.initialize_opensearch_client.assert_called_once()
+        self.mock_print.assert_any_call("Failed to initialize OpenSearch client.")
+        self.mock_print.assert_any_call("Failed to initialize clients. Aborting.")
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    def test_extract_relevant_sentences(self, mock_opensearch_connector):
+        # Mock OpenSearch client to prevent initialization
+        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+
+        query_instance = Query(self.config)
+        query_text = 'What is the capital of France?'
+        text = 'Paris is the capital of France. It is known for the Eiffel Tower.'
+        expected_sentences = ['Paris is the capital of France']
+
+        result = query_instance.extract_relevant_sentences(query_text, text)
+        self.assertIn(expected_sentences[0], result)
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    def test_bulk_query_neural_success(self, mock_opensearch_connector):
+        # Mock OpenSearch client
+        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+
+        queries = ['What is the capital of France?']
+        mock_hits = [
+            {
+                '_score': 1.0,
+                '_source': {'content': 'Paris is the capital of France.'}
+            }
+        ]
+        query_instance = Query(self.config)
+        with patch.object(query_instance.opensearch, 'search', return_value=mock_hits):
+            results = query_instance.bulk_query_neural(queries, k=1)
+            self.assertEqual(len(results), 1)
+            self.assertEqual(results[0]['num_results'], 1)
+            self.assertEqual(results[0]['documents'][0]['source']['content'], 'Paris is the capital of France.')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    def test_bulk_query_neural_failure(self, mock_opensearch_connector):
+        # Mock OpenSearch client
+        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+
+        queries = ['What is the capital of France?']
+        query_instance = Query(self.config)
+        with patch.object(query_instance.opensearch, 'search', side_effect=Exception('Search error')):
+            results = query_instance.bulk_query_neural(queries, k=1)
+            self.assertEqual(len(results), 1)
+            self.assertEqual(results[0]['num_results'], 0)
+            self.mock_print.assert_any_call("\x1b[31mError performing search for query 'What is the capital of France?': Search error\x1b[0m")
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    def test_bulk_query_semantic_success(self, mock_opensearch_connector):
+        # Mock OpenSearch client
+        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+
+        queries = ['What is the capital of France?']
+        embedding = [0.1, 0.2, 0.3]
+        mock_hits = [
+            {
+                '_score': 1.0,
+                '_source': {'nominee_text': 'Paris is the capital of France.'}
+            }
+        ]
+        query_instance = Query(self.config)
+        with patch.object(query_instance, 'text_embedding', return_value=embedding):
+            with patch.object(query_instance.opensearch, 'search_by_vector', return_value=mock_hits):
+                results = query_instance.bulk_query_semantic(queries, k=1)
+                self.assertEqual(len(results), 1)
+                self.assertEqual(results[0]['num_results'], 1)
+                self.assertIn('Paris is the capital of France.', results[0]['context'])
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    def test_bulk_query_semantic_embedding_failure(self, mock_opensearch_connector):
+        # Mock OpenSearch client
+        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+
+        queries = ['What is the capital of France?']
+        query_instance = Query(self.config)
+        with patch.object(query_instance, 'text_embedding', return_value=None):
+            results = query_instance.bulk_query_semantic(queries, k=1)
+            self.assertEqual(len(results), 1)
+            self.assertEqual(results[0]['num_results'], 0)
+            self.mock_print.assert_any_call('\x1b[31mFailed to generate embedding for query: What is the capital of France?\x1b[0m')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    def test_text_embedding_success(self, mock_opensearch_connector):
+        # Mock OpenSearch client
+        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+
+        text = 'Sample text'
+        embedding = [0.1, 0.2, 0.3]
+        response = {
+            'inference_results': [
+                {
+                    'output': [
+                        {'data': embedding}
+                    ]
+                }
+            ]
+        }
+        query_instance = Query(self.config)
+        with patch.object(query_instance.opensearch, 'opensearch_client') as mock_opensearch_client:
+            mock_opensearch_client.transport.perform_request.return_value = response
+
+            result = query_instance.text_embedding(text)
+            self.assertEqual(result, embedding)
+            mock_opensearch_client.transport.perform_request.assert_called_once()
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    def test_text_embedding_failure(self, mock_opensearch_connector):
+        # Mock OpenSearch client
+        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+
+        text = 'Sample text'
+        query_instance = Query(self.config)
+        with patch.object(query_instance.opensearch, 'opensearch_client') as mock_opensearch_client:
+            mock_opensearch_client.transport.perform_request.side_effect = Exception('Test exception')
+
+            with self.assertRaises(Exception) as context:
+                query_instance.text_embedding(text, max_retries=1)
+            self.assertTrue('Test exception' in str(context.exception))
+            self.mock_print.assert_any_call('Error on attempt 1: Test exception')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.tiktoken.get_encoding')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.boto3.client')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    def test_generate_answer_success(self, mock_opensearch_connector, mock_boto3_client, mock_get_encoding):
+        # Mock OpenSearch client
+        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+
+        prompt = 'Sample prompt'
+        llm_config = {
+            'maxTokenCount': 100,
+            'temperature': 0.7,
+            'topP': 0.9,
+            'stopSequences': []
+        }
+        encoding_instance = MagicMock()
+        encoding_instance.encode.return_value = [1, 2, 3]
+        encoding_instance.decode.return_value = prompt
+        mock_get_encoding.return_value = encoding_instance
+
+        mock_bedrock_client = mock_boto3_client.return_value
+        response_stream = MagicMock()
+        response_stream.read.return_value = json.dumps({
+            'results': [
+                {'outputText': 'Generated answer'}
+            ]
+        })
+        response = {'body': response_stream}
+        mock_bedrock_client.invoke_model.return_value = response
+
+        query_instance = Query(self.config)
+        query_instance.bedrock_client = mock_bedrock_client  # Set the mocked bedrock client
+
+        answer = query_instance.generate_answer(prompt, llm_config)
+        self.assertEqual(answer, 'Generated answer')
+        mock_bedrock_client.invoke_model.assert_called_once()
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.tiktoken.get_encoding')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.boto3.client')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    def test_generate_answer_failure(self, mock_opensearch_connector, mock_boto3_client, mock_get_encoding):
+        # Mock OpenSearch client
+        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+
+        prompt = 'Sample prompt'
+        llm_config = {
+            'maxTokenCount': 100,
+            'temperature': 0.7,
+            'topP': 0.9,
+            'stopSequences': []
+        }
+        encoding_instance = MagicMock()
+        encoding_instance.encode.return_value = [1, 2, 3]
+        encoding_instance.decode.return_value = prompt
+        mock_get_encoding.return_value = encoding_instance
+
+        mock_bedrock_client = mock_boto3_client.return_value
+        mock_bedrock_client.invoke_model.side_effect = Exception('LLM error')
+
+        query_instance = Query(self.config)
+        query_instance.bedrock_client = mock_bedrock_client  # Set the mocked bedrock client
+
+        answer = query_instance.generate_answer(prompt, llm_config)
+        self.assertIsNone(answer)
+        self.mock_print.assert_any_call('Error generating answer from LLM: LLM error')
+
+if __name__ == '__main__':
+    unittest.main()
\ No newline at end of file
diff --git a/tests/rag/test_rag.py b/tests/rag/test_rag.py
new file mode 100644
index 00000000..cf4c54d1
--- /dev/null
+++ b/tests/rag/test_rag.py
@@ -0,0 +1,166 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+import unittest
+from unittest.mock import patch, MagicMock, Mock
+import sys
+import argparse
+from io import StringIO
+from colorama import Fore, Style
+import warnings
+from urllib3.exceptions import InsecureRequestWarning
+
+# Suppress specific warnings
+warnings.filterwarnings("ignore", category=UserWarning)
+warnings.filterwarnings("ignore", category=DeprecationWarning)
+warnings.filterwarnings("ignore", category=InsecureRequestWarning)
+
+# Import the main function from rag.py
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.rag import main
+
+class TestRAGCLI(unittest.TestCase):
+    def setUp(self):
+        # Mock the config to avoid actual file operations
+        self.mock_config = {
+            'service_type': 'managed',
+            'region': 'us-west-2',
+            'default_search_method': 'neural',
+            # ... other config parameters ...
+        }
+
+        # Patch 'load_config' and 'save_config' functions
+        self.patcher_load_config = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.load_config', return_value=self.mock_config)
+        self.mock_load_config = self.patcher_load_config.start()
+        self.addCleanup(self.patcher_load_config.stop)
+
+        self.patcher_save_config = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.save_config')
+        self.mock_save_config = self.patcher_save_config.start()
+        self.addCleanup(self.patcher_save_config.stop)
+
+        # Patch 'Setup', 'Ingest', and 'Query' classes
+        self.patcher_setup = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.Setup')
+        self.mock_setup_class = self.patcher_setup.start()
+        self.addCleanup(self.patcher_setup.stop)
+
+        self.patcher_ingest = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.Ingest')
+        self.mock_ingest_class = self.patcher_ingest.start()
+        self.addCleanup(self.patcher_ingest.stop)
+
+        self.patcher_query = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.Query')
+        self.mock_query_class = self.patcher_query.start()
+        self.addCleanup(self.patcher_query.stop)
+
+        # Capture stdout
+        self.held_stdout = StringIO()
+        self.patcher_stdout = patch('sys.stdout', new=self.held_stdout)
+        self.patcher_stdout.start()
+        self.addCleanup(self.patcher_stdout.stop)
+
+        # Capture stderr
+        self.held_stderr = StringIO()
+        self.patcher_stderr = patch('sys.stderr', new=self.held_stderr)
+        self.patcher_stderr.start()
+        self.addCleanup(self.patcher_stderr.stop)
+
+    def test_setup_command(self):
+        test_args = ['rag.py', 'setup']
+        with patch.object(sys, 'argv', test_args):
+            main()
+            # Ensure Setup.setup_command() is called
+            self.mock_setup_class.return_value.setup_command.assert_called_once()
+            # Ensure save_config is called
+            self.mock_save_config.assert_called_once_with(self.mock_setup_class.return_value.config)
+
+    def test_ingest_command_with_paths(self):
+        test_args = ['rag.py', 'ingest', '--paths', '/path/to/data1', '/path/to/data2']
+        with patch.object(sys, 'argv', test_args):
+            main()
+            # Ensure Ingest.ingest_command() is called with correct paths
+            self.mock_ingest_class.assert_called_once_with(self.mock_config)
+            self.mock_ingest_class.return_value.ingest_command.assert_called_once_with(['/path/to/data1', '/path/to/data2'])
+
+    def test_ingest_command_without_paths(self):
+        test_args = ['rag.py', 'ingest']
+        with patch.object(sys, 'argv', test_args):
+            with patch('rich.prompt.Prompt.ask', side_effect=['/path/to/data', '']):
+                main()
+                # Ensure Ingest.ingest_command() is called with prompted paths
+                self.mock_ingest_class.assert_called_once_with(self.mock_config)
+                self.mock_ingest_class.return_value.ingest_command.assert_called_once_with(['/path/to/data'])
+
+    def test_query_command_with_queries(self):
+        test_args = ['rag.py', 'query', '--queries', 'What is OpenSearch?', 'How does Bedrock work?']
+        with patch.object(sys, 'argv', test_args):
+            main()
+            # Ensure Query.query_command() is called with correct queries
+            self.mock_query_class.assert_called_once_with(self.mock_config)
+            self.mock_query_class.return_value.query_command.assert_called_once_with(
+                ['What is OpenSearch?', 'How does Bedrock work?'],
+                num_results=5
+            )
+
+    def test_query_command_without_queries(self):
+        test_args = ['rag.py', 'query']
+        with patch.object(sys, 'argv', test_args):
+            with patch('rich.prompt.Prompt.ask', side_effect=['What is OpenSearch?', '']):
+                main()
+                # Ensure Query.query_command() is called with prompted queries
+                self.mock_query_class.assert_called_once_with(self.mock_config)
+                self.mock_query_class.return_value.query_command.assert_called_once_with(['What is OpenSearch?'], num_results=5)
+
+    def test_query_command_with_num_results(self):
+        test_args = ['rag.py', 'query', '--queries', 'What is OpenSearch?', '--num_results', '3']
+        with patch.object(sys, 'argv', test_args):
+            main()
+            # Ensure Query.query_command() is called with correct num_results
+            self.mock_query_class.return_value.query_command.assert_called_once_with(
+                ['What is OpenSearch?'],
+                num_results=3
+            )
+
+    def test_no_command(self):
+        test_args = ['rag.py']
+        with patch.object(sys, 'argv', test_args):
+            with self.assertRaises(SystemExit) as cm:
+                main()
+            self.assertEqual(cm.exception.code, 1)
+            stderr_output = self.held_stderr.getvalue()
+            stdout_output = self.held_stdout.getvalue()
+            print("STDERR:", stderr_output)
+            print("STDOUT:", stdout_output)
+            self.assertTrue("usage: rag.py" in stderr_output or "usage: rag.py" in stdout_output)
+
+    def test_invalid_command(self):
+        test_args = ['rag.py', 'invalid']
+        with patch.object(sys, 'argv', test_args):
+            with self.assertRaises(SystemExit) as cm:
+                main()
+            self.assertEqual(cm.exception.code, 2)
+            stderr_output = self.held_stderr.getvalue()
+            stdout_output = self.held_stdout.getvalue()
+            print("STDERR:", stderr_output)
+            print("STDOUT:", stdout_output)
+            self.assertTrue("invalid choice: 'invalid'" in stderr_output or "invalid choice: 'invalid'" in stdout_output)
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/tests/rag/test_rag_setup.py b/tests/rag/test_rag_setup.py
new file mode 100644
index 00000000..1cdc6b85
--- /dev/null
+++ b/tests/rag/test_rag_setup.py
@@ -0,0 +1,209 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+import unittest
+from unittest.mock import patch, MagicMock
+import os
+import configparser
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.rag_setup import Setup
+from colorama import Fore, Style
+
+class TestSetup(unittest.TestCase):
+    def setUp(self):
+        # Sample configuration
+        self.sample_config = {
+            'service_type': 'managed',
+            'region': 'us-west-2',
+            'iam_principal': 'arn:aws:iam::123456789012:user/test-user',
+            'collection_name': 'test-collection',
+            'opensearch_endpoint': 'https://search-hashim-test5.us-west-2.es.amazonaws.com',
+            'opensearch_username': '*****',
+            'opensearch_password': 'password',
+            'default_search_method': 'neural',
+            'index_name': 'test-index',
+            'embedding_dimension': '768',
+            'space_type': 'cosinesimil',
+            'ef_construction': '512',
+        }
+
+        # Initialize Setup instance
+        self.setup_instance = Setup()
+
+        # Set index_name for tests
+        self.setup_instance.index_name = self.sample_config['index_name']
+
+        # Mock AWS clients
+        self.mock_boto3_client = patch('boto3.client').start()
+        self.addCleanup(patch.stopall)
+
+        # Mock OpenSearch client
+        self.mock_opensearch_client = MagicMock()
+        self.setup_instance.opensearch_client = self.mock_opensearch_client
+
+        # Mock os.path.exists
+        self.patcher_os_path_exists = patch('os.path.exists', return_value=True)
+        self.mock_os_path_exists = self.patcher_os_path_exists.start()
+        self.addCleanup(self.patcher_os_path_exists.stop)
+
+        # Mock configparser
+        self.patcher_configparser = patch('configparser.ConfigParser')
+        self.mock_configparser_class = self.patcher_configparser.start()
+        self.mock_configparser = MagicMock()
+        self.mock_configparser_class.return_value = self.mock_configparser
+        self.addCleanup(self.patcher_configparser.stop)
+
+    def test_load_config_existing(self):
+        with patch('os.path.exists', return_value=True):
+            self.mock_configparser.read.return_value = None
+            self.mock_configparser.__getitem__.return_value = self.sample_config
+            config = self.setup_instance.load_config()
+            self.assertEqual(config, self.sample_config)
+
+    def test_load_config_no_file(self):
+        with patch('os.path.exists', return_value=False):
+            self.mock_configparser.read.return_value = None
+            config = self.setup_instance.load_config()
+            self.assertEqual(config, {})
+
+    def test_save_config(self):
+        with patch('builtins.open', unittest.mock.mock_open()) as mock_file:
+            self.setup_instance.save_config(self.sample_config)
+            mock_file.assert_called_with(self.setup_instance.CONFIG_FILE, 'w')
+            self.mock_configparser.write.assert_called()
+
+    def test_get_opensearch_domain_name(self):
+        with patch.object(Setup, 'load_config', return_value=self.sample_config.copy()):
+            domain_name = self.setup_instance.get_opensearch_domain_name()
+            self.assertEqual(domain_name, 'hashim-test5')
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag_setup.OpenSearch')
+    def test_initialize_opensearch_client_managed(self, mock_opensearch):
+        with patch.object(Setup, 'load_config', return_value=self.sample_config.copy()):
+            self.setup_instance = Setup()
+            self.setup_instance.opensearch_username = '*****'
+            self.setup_instance.opensearch_password = 'password'
+            result = self.setup_instance.initialize_opensearch_client()
+            self.assertTrue(result)
+            mock_opensearch.assert_called_once()
+
+    def test_initialize_opensearch_client_no_endpoint(self):
+        self.setup_instance.opensearch_endpoint = ''
+        with patch('builtins.print') as mock_print:
+            result = self.setup_instance.initialize_opensearch_client()
+            self.assertFalse(result)
+            mock_print.assert_called_with(f"{Fore.RED}OpenSearch endpoint not set. Please run setup first.{Style.RESET_ALL}\n")
+
+    def test_verify_and_create_index_exists(self):
+        self.setup_instance.index_name = self.sample_config['index_name']
+        self.mock_opensearch_client.indices.exists.return_value = True
+        with patch('builtins.print') as mock_print:
+            result = self.setup_instance.verify_and_create_index(768, 'cosinesimil', 512)
+            self.assertTrue(result)
+            mock_print.assert_called_with(f"{Fore.GREEN}KNN index '{self.setup_instance.index_name}' already exists.{Style.RESET_ALL}\n")
+
+    def test_verify_and_create_index_create(self):
+        self.setup_instance.index_name = self.sample_config['index_name']
+        self.mock_opensearch_client.indices.exists.return_value = False
+        self.setup_instance.create_index = MagicMock()
+        with patch('builtins.print') as mock_print:
+            result = self.setup_instance.verify_and_create_index(768, 'cosinesimil', 512)
+            self.assertTrue(result)
+            self.setup_instance.create_index.assert_called_with(768, 'cosinesimil', 512)
+
+    def test_create_index_success(self):
+        with patch('builtins.print') as mock_print:
+            self.setup_instance.create_index(768, 'cosinesimil', 512)
+            self.mock_opensearch_client.indices.create.assert_called_once()
+            mock_print.assert_called_with(f"\n{Fore.GREEN}KNN index '{self.setup_instance.index_name}' created successfully with dimension 768, space type cosinesimil, and ef_construction 512.{Style.RESET_ALL}\n")
+
+    def test_create_index_already_exists(self):
+        self.mock_opensearch_client.indices.create.side_effect = Exception('resource_already_exists_exception')
+        with patch('builtins.print') as mock_print:
+            self.setup_instance.create_index(768, 'cosinesimil', 512)
+            mock_print.assert_called_with(f"\n{Fore.YELLOW}Index '{self.setup_instance.index_name}' already exists.{Style.RESET_ALL}\n")
+
+    def test_get_knn_index_details_default(self):
+        with patch('builtins.input', side_effect=['', '', '']):
+            with patch('builtins.print'):
+                embedding_dimension, space_type, ef_construction = self.setup_instance.get_knn_index_details()
+                self.assertEqual(embedding_dimension, 768)
+                self.assertEqual(space_type, 'l2')
+                self.assertEqual(ef_construction, 512)
+
+    def test_get_truncated_name_within_limit(self):
+        name = 'short-name'
+        truncated_name = self.setup_instance.get_truncated_name(name, max_length=32)
+        self.assertEqual(truncated_name, name)
+
+    def test_get_truncated_name_exceeds_limit(self):
+        name = 'a' * 35
+        truncated_name = self.setup_instance.get_truncated_name(name, max_length=32)
+        self.assertEqual(truncated_name, 'a' * 29 + '...')
+
+    def test_initialize_clients_success(self):
+        with patch.object(Setup, 'load_config', return_value=self.sample_config.copy()):
+            self.setup_instance = Setup()
+            self.setup_instance.service_type = 'managed'
+            with patch('boto3.client') as mock_boto_client:
+                mock_boto_client.return_value = MagicMock()
+                with patch('time.sleep'):
+                    with patch('builtins.print') as mock_print:
+                        result = self.setup_instance.initialize_clients()
+                        self.assertTrue(result)
+                        mock_print.assert_called_with(f"{Fore.GREEN}AWS clients initialized successfully.{Style.RESET_ALL}\n")
+
+    def test_initialize_clients_failure(self):
+        self.setup_instance.service_type = 'managed'
+        with patch('boto3.client', side_effect=Exception('Initialization failed')):
+            with patch('builtins.print') as mock_print:
+                result = self.setup_instance.initialize_clients()
+                self.assertFalse(result)
+                mock_print.assert_called_with(f"{Fore.RED}Failed to initialize AWS clients: Initialization failed{Style.RESET_ALL}")
+
+    def test_check_and_configure_aws_already_configured(self):
+        with patch('boto3.Session') as mock_session:
+            mock_session.return_value.get_credentials.return_value = MagicMock()
+            with patch('builtins.input', return_value='no'):
+                with patch('builtins.print') as mock_print:
+                    self.setup_instance.check_and_configure_aws()
+                    mock_print.assert_called_with("AWS credentials are already configured.")
+
+    def test_check_and_configure_aws_not_configured(self):
+        with patch('boto3.Session') as mock_session:
+            mock_session.return_value.get_credentials.return_value = None
+            self.setup_instance.configure_aws = MagicMock()
+            with patch('builtins.print'):
+                self.setup_instance.check_and_configure_aws()
+                self.setup_instance.configure_aws.assert_called_once()
+
+    def test_configure_aws(self):
+        with patch('builtins.input', side_effect=['AKIA...', 'SECRET...', 'us-west-2']):
+            with patch('subprocess.run') as mock_subprocess_run:
+                with patch('builtins.print') as mock_print:
+                    self.setup_instance.configure_aws()
+                    self.assertEqual(mock_subprocess_run.call_count, 3)
+                    mock_print.assert_called_with(f"{Fore.GREEN}AWS credentials have been successfully configured.{Style.RESET_ALL}")
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/tests/rag/test_serverless.py b/tests/rag/test_serverless.py
new file mode 100644
index 00000000..e6d89608
--- /dev/null
+++ b/tests/rag/test_serverless.py
@@ -0,0 +1,232 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+#  Licensed to Elasticsearch B.V. under one or more contributor
+#  license agreements. See the NOTICE file distributed with
+#  this work for additional information regarding copyright
+#  ownership. Elasticsearch B.V. licenses this file to you under
+#  the Apache License, Version 2.0 (the "License"); you may
+#  not use this file except in compliance with the License.
+#  You may obtain a copy of the License at
+#
+# 	http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+import unittest
+from unittest.mock import patch, MagicMock, Mock
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless import Serverless
+from colorama import Fore, Style
+
+class TestServerless(unittest.TestCase):
+    def setUp(self):
+        # Sample data
+        self.collection_name = 'test-collection'
+        self.iam_principal = 'arn:aws:iam::123456789012:user/test-user'
+        self.aws_region = 'us-east-1'
+
+        # Mock aoss_client
+        self.aoss_client = MagicMock()
+
+        # Define a custom ConflictException class
+        class ConflictException(Exception):
+            pass
+
+        # Mock exceptions
+        self.aoss_client.exceptions = MagicMock()
+        self.aoss_client.exceptions.ConflictException = ConflictException
+
+        # Initialize the Serverless instance
+        self.serverless = Serverless(
+            aoss_client=self.aoss_client,
+            collection_name=self.collection_name,
+            iam_principal=self.iam_principal,
+            aws_region=self.aws_region
+        )
+
+        # Mock sleep to speed up tests
+        self.sleep_patcher = patch('time.sleep', return_value=None)
+        self.mock_sleep = self.sleep_patcher.start()
+
+    def tearDown(self):
+        self.sleep_patcher.stop()
+
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless.Serverless.create_access_policy')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless.Serverless.create_security_policy')
+    def test_create_security_policies_success(self, mock_create_security_policy, mock_create_access_policy):
+        self.serverless.create_security_policies()
+        # Check that create_security_policy is called twice (encryption and network)
+        self.assertEqual(mock_create_security_policy.call_count, 2)
+        # Check that create_access_policy is called once
+        mock_create_access_policy.assert_called_once()
+
+    def test_create_security_policy_success(self):
+        policy_type = 'encryption'
+        name = 'test-enc-policy'
+        description = 'Test encryption policy'
+        policy_body = '{}'
+        self.aoss_client.create_security_policy.return_value = {}
+        with patch('builtins.print') as mock_print:
+            self.serverless.create_security_policy(policy_type, name, description, policy_body)
+            self.aoss_client.create_security_policy.assert_called_with(
+                description=description,
+                name=name,
+                policy=policy_body,
+                type=policy_type
+            )
+            mock_print.assert_called_with(f"{Fore.GREEN}Encryption Policy '{name}' created successfully.{Style.RESET_ALL}")
+
+    def test_create_security_policy_conflict(self):
+        policy_type = 'network'
+        name = 'test-net-policy'
+        description = 'Test network policy'
+        policy_body = '{}'
+        # Simulate ConflictException
+        conflict_exception = self.aoss_client.exceptions.ConflictException()
+        self.aoss_client.create_security_policy.side_effect = conflict_exception
+        with patch('builtins.print') as mock_print:
+            self.serverless.create_security_policy(policy_type, name, description, policy_body)
+            mock_print.assert_called_with(f"{Fore.YELLOW}Network Policy '{name}' already exists.{Style.RESET_ALL}")
+
+    def test_create_security_policy_exception(self):
+        policy_type = 'invalid'
+        name = 'test-policy'
+        description = 'Test policy'
+        policy_body = '{}'
+        with patch('builtins.print') as mock_print:
+            self.serverless.create_security_policy(policy_type, name, description, policy_body)
+            mock_print.assert_called_with(f"{Fore.RED}Error creating {policy_type} policy '{name}': Invalid policy type specified.{Style.RESET_ALL}")
+
+    def test_create_access_policy_success(self):
+        name = 'test-access-policy'
+        description = 'Test access policy'
+        policy_body = '{}'
+        self.aoss_client.create_access_policy.return_value = {}
+        with patch('builtins.print') as mock_print:
+            self.serverless.create_access_policy(name, description, policy_body)
+            self.aoss_client.create_access_policy.assert_called_with(
+                description=description,
+                name=name,
+                policy=policy_body,
+                type='data'
+            )
+            mock_print.assert_called_with(f"{Fore.GREEN}Data Access Policy '{name}' created successfully.{Style.RESET_ALL}\n")
+
+    def test_create_access_policy_conflict(self):
+        name = 'test-access-policy'
+        description = 'Test access policy'
+        policy_body = '{}'
+        # Simulate ConflictException
+        conflict_exception = self.aoss_client.exceptions.ConflictException()
+        self.aoss_client.create_access_policy.side_effect = conflict_exception
+        with patch('builtins.print') as mock_print:
+            self.serverless.create_access_policy(name, description, policy_body)
+            mock_print.assert_called_with(f"{Fore.YELLOW}Data Access Policy '{name}' already exists.{Style.RESET_ALL}\n")
+
+    def test_create_collection_success(self):
+        self.aoss_client.create_collection.return_value = {
+            'createCollectionDetail': {'id': 'collection-id-123'}
+        }
+        with patch('builtins.print') as mock_print:
+            collection_id = self.serverless.create_collection(self.collection_name)
+            self.assertEqual(collection_id, 'collection-id-123')
+            mock_print.assert_called_with(f"{Fore.GREEN}Collection '{self.collection_name}' creation initiated.{Style.RESET_ALL}")
+
+    def test_create_collection_conflict(self):
+        # Simulate ConflictException
+        conflict_exception = self.aoss_client.exceptions.ConflictException()
+        self.aoss_client.create_collection.side_effect = conflict_exception
+        self.serverless.get_collection_id = MagicMock(return_value='existing-collection-id')
+        with patch('builtins.print') as mock_print:
+            collection_id = self.serverless.create_collection(self.collection_name)
+            self.assertEqual(collection_id, 'existing-collection-id')
+            mock_print.assert_called_with(f"{Fore.YELLOW}Collection '{self.collection_name}' already exists.{Style.RESET_ALL}")
+
+    def test_create_collection_exception_retry(self):
+        # Simulate Exception on first two attempts, success on third
+        self.aoss_client.create_collection.side_effect = [
+            Exception('Temporary error'),
+            Exception('Temporary error'),
+            {'createCollectionDetail': {'id': 'collection-id-123'}}
+        ]
+        with patch('builtins.print'):
+            collection_id = self.serverless.create_collection(self.collection_name, max_retries=3)
+            self.assertEqual(collection_id, 'collection-id-123')
+            self.assertEqual(self.aoss_client.create_collection.call_count, 3)
+
+    def test_get_collection_id_success(self):
+        self.aoss_client.list_collections.return_value = {
+            'collectionSummaries': [
+                {'name': 'other-collection', 'id': 'other-id'},
+                {'name': self.collection_name, 'id': 'collection-id-123'}
+            ]
+        }
+        collection_id = self.serverless.get_collection_id(self.collection_name)
+        self.assertEqual(collection_id, 'collection-id-123')
+
+    def test_get_collection_id_not_found(self):
+        self.aoss_client.list_collections.return_value = {
+            'collectionSummaries': [
+                {'name': 'other-collection', 'id': 'other-id'}
+            ]
+        }
+        collection_id = self.serverless.get_collection_id(self.collection_name)
+        self.assertIsNone(collection_id)
+
+    def test_wait_for_collection_active_success(self):
+        collection_id = 'collection-id-123'
+        # Simulate 'CREATING' status, then 'ACTIVE'
+        self.aoss_client.batch_get_collection.side_effect = [
+            {'collectionDetails': [{'status': 'CREATING'}]},
+            {'collectionDetails': [{'status': 'ACTIVE'}]}
+        ]
+        with patch('builtins.print'):
+            result = self.serverless.wait_for_collection_active(collection_id, max_wait_minutes=1)
+            self.assertTrue(result)
+            self.assertEqual(self.aoss_client.batch_get_collection.call_count, 2)
+
+    def test_wait_for_collection_active_timeout(self):
+        collection_id = 'collection-id-123'
+        # Simulate 'CREATING' status indefinitely
+        self.aoss_client.batch_get_collection.return_value = {'collectionDetails': [{'status': 'CREATING'}]}
+        with patch('builtins.print'):
+            result = self.serverless.wait_for_collection_active(collection_id, max_wait_minutes=0.01)
+            self.assertFalse(result)
+
+    def test_get_collection_endpoint_success(self):
+        collection_id = 'collection-id-123'
+        self.serverless.get_collection_id = MagicMock(return_value=collection_id)
+        self.aoss_client.batch_get_collection.return_value = {
+            'collectionDetails': [{'collectionEndpoint': 'https://example-endpoint.com'}]
+        }
+        with patch('builtins.print'):
+            endpoint = self.serverless.get_collection_endpoint()
+            self.assertEqual(endpoint, 'https://example-endpoint.com')
+
+    def test_get_collection_endpoint_collection_not_found(self):
+        self.serverless.get_collection_id = MagicMock(return_value=None)
+        with patch('builtins.print') as mock_print:
+            endpoint = self.serverless.get_collection_endpoint()
+            self.assertIsNone(endpoint)
+            mock_print.assert_called_with(f"{Fore.RED}Collection '{self.collection_name}' not found.{Style.RESET_ALL}\n")
+
+    def test_get_truncated_name_within_limit(self):
+        name = 'short-name'
+        truncated_name = self.serverless.get_truncated_name(name, max_length=32)
+        self.assertEqual(truncated_name, name)
+
+    def test_get_truncated_name_exceeds_limit(self):
+        name = 'a' * 35
+        truncated_name = self.serverless.get_truncated_name(name, max_length=32)
+        self.assertEqual(truncated_name, 'a' * 29 + '...')
+
+if __name__ == '__main__':
+    unittest.main()
\ No newline at end of file

From 8db5e9fcd40d5dafd6fd4c5875180d3e6e3426ac Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Mon, 2 Dec 2024 14:43:56 -0800
Subject: [PATCH 18/42] fixed failing test in AIConnector tests

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 tests/rag/test_AiConnectorClass.py | 75 +++++++++++++++++++-----------
 1 file changed, 48 insertions(+), 27 deletions(-)

diff --git a/tests/rag/test_AiConnectorClass.py b/tests/rag/test_AiConnectorClass.py
index da8007d7..5ee3f420 100644
--- a/tests/rag/test_AiConnectorClass.py
+++ b/tests/rag/test_AiConnectorClass.py
@@ -13,7 +13,7 @@
 #  not use this file except in compliance with the License.
 #  You may obtain a copy of the License at
 #
-# 	http://www.apache.org/licenses/LICENSE-2.0
+#     http://www.apache.org/licenses/LICENSE-2.0
 #
 #  Unless required by applicable law or agreed to in writing,
 #  software distributed under the License is distributed on an
@@ -21,9 +21,11 @@
 #  KIND, either express or implied.  See the License for the
 #  specific language governing permissions and limitations
 #  under the License.
+
 import unittest
 from unittest.mock import patch, MagicMock
 import json
+import requests
 
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import AIConnectorHelper
 
@@ -39,11 +41,11 @@ def setUp(self):
         self.domain_endpoint = 'search-test-domain.us-east-1.es.amazonaws.com'
         self.domain_arn = 'arn:aws:es:us-east-1:123456789012:domain/test-domain'
 
-    @patch('AIConnectorHelper.IAMRoleHelper')
-    @patch('AIConnectorHelper.SecretHelper')
-    @patch('AIConnectorHelper.OpenSearch')
-    @patch('AIConnectorHelper.AIConnectorHelper.get_opensearch_domain_info')
-    def test___init__(self, mock_get_opensearch_domain_info, mock_opensearch, mock_secret_helper, mock_iam_role_helper):
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.AIConnectorHelper.get_opensearch_domain_info')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.OpenSearch')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.SecretHelper')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.IAMRoleHelper')
+    def test___init__(self, mock_iam_role_helper, mock_secret_helper, mock_opensearch, mock_get_opensearch_domain_info):
         # Mock get_opensearch_domain_info
         mock_get_opensearch_domain_info.return_value = (self.domain_endpoint, self.domain_arn)
 
@@ -148,10 +150,8 @@ def test_get_ml_auth_success(self, mock_iam_helper):
             mock_iam_helper.get_role_arn.assert_called_with(create_connector_role_name)
             mock_iam_helper.assume_role.assert_called_with(create_connector_role_arn)
 
-            # Assert that AWS4Auth was created with the temp credentials
-            self.assertEqual(awsauth.access_id, temp_credentials["AccessKeyId"])
-            self.assertEqual(awsauth.region, self.region)
-            self.assertEqual(awsauth.service, 'es')
+            # Since AWS4Auth is instantiated within the method, we can check if awsauth is not None
+            self.assertIsNotNone(awsauth)
 
     @patch.object(AIConnectorHelper, 'iam_helper', create=True)
     def test_get_ml_auth_role_not_found(self, mock_iam_helper):
@@ -171,7 +171,7 @@ def test_get_ml_auth_role_not_found(self, mock_iam_helper):
             self.assertTrue(f"IAM role '{create_connector_role_name}' not found." in str(context.exception))
 
     @patch('requests.post')
-    @patch('AIConnectorHelper.AWS4Auth')
+    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.AWS4Auth')
     @patch.object(AIConnectorHelper, 'iam_helper', create=True)
     def test_create_connector(self, mock_iam_helper, mock_aws4auth, mock_requests_post):
         # Mock the IAM helper methods
@@ -345,17 +345,26 @@ def test_deploy_model(self, mock_requests_post):
             # Call the method
             result = helper.deploy_model('test-model-id')
 
-            # Assert that the correct URL was used
+            # Assert that the method was called once
+            mock_requests_post.assert_called_once()
+
+            # Extract call arguments
+            args, kwargs = mock_requests_post.call_args
+
+            # Assert URL
             expected_url = f'{helper.opensearch_domain_url}/_plugins/_ml/models/test-model-id/_deploy'
-            mock_requests_post.assert_called_once_with(
-                expected_url,
-                auth=unittest.mock.ANY,
-                headers={"Content-Type": "application/json"}
-            )
+            self.assertEqual(args[0], expected_url)
+
+            # Assert headers
+            self.assertEqual(kwargs['headers'], {"Content-Type": "application/json"})
+
+            # Assert auth
+            self.assertIsInstance(kwargs['auth'], requests.auth.HTTPBasicAuth)
+            self.assertEqual(kwargs['auth'].username, self.opensearch_domain_username)
+            self.assertEqual(kwargs['auth'].password, self.opensearch_domain_password)
 
             # Assert that the response is returned
             self.assertEqual(result, response)
-
     @patch('requests.post')
     def test_predict(self, mock_requests_post):
         # Mock requests.post
@@ -374,23 +383,35 @@ def test_predict(self, mock_requests_post):
             payload = {'input': 'test input'}
             result = helper.predict('test-model-id', payload)
 
-            # Assert that the correct URL was used
+            # Assert that the method was called once
+            mock_requests_post.assert_called_once()
+
+            # Extract call arguments
+            args, kwargs = mock_requests_post.call_args
+
+            # Assert URL
             expected_url = f'{helper.opensearch_domain_url}/_plugins/_ml/models/test-model-id/_predict'
-            mock_requests_post.assert_called_once_with(
-                expected_url,
-                auth=unittest.mock.ANY,
-                json=payload,
-                headers={"Content-Type": "application/json"}
-            )
+            self.assertEqual(args[0], expected_url)
+
+            # Assert JSON payload
+            self.assertEqual(kwargs['json'], payload)
+
+            # Assert headers
+            self.assertEqual(kwargs['headers'], {"Content-Type": "application/json"})
+
+            # Assert auth
+            self.assertIsInstance(kwargs['auth'], requests.auth.HTTPBasicAuth)
+            self.assertEqual(kwargs['auth'].username, self.opensearch_domain_username)
+            self.assertEqual(kwargs['auth'].password, self.opensearch_domain_password)
 
             # Assert that the response is returned
             self.assertEqual(result, response)
 
     @patch('time.sleep', return_value=None)
     @patch.object(AIConnectorHelper, 'create_connector')
-    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
     @patch.object(AIConnectorHelper, 'secret_helper', create=True)
-    def test_create_connector_with_secret(self, mock_secret_helper, mock_iam_helper, mock_create_connector, mock_sleep):
+    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
+    def test_create_connector_with_secret(self, mock_iam_helper, mock_secret_helper, mock_create_connector, mock_sleep):
         # Mock secret_helper methods
         secret_name = 'test-secret'
         secret_value = 'test-secret-value'

From aa4292255da4369bdf8de24b22248800f0be6da8 Mon Sep 17 00:00:00 2001
From: hmumtazz <144855436+hmumtazz@users.noreply.github.com>
Date: Mon, 2 Dec 2024 17:39:14 -0800
Subject: [PATCH 19/42] Update test_SecretsHelper

Signed-off-by: hmumtazz <144855436+hmumtazz@users.noreply.github.com>
---
 tests/rag/test_SecretsHelper | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/tests/rag/test_SecretsHelper b/tests/rag/test_SecretsHelper
index be00dc24..0c077d41 100644
--- a/tests/rag/test_SecretsHelper
+++ b/tests/rag/test_SecretsHelper
@@ -21,6 +21,7 @@
 #  KIND, either express or implied.  See the License for the
 #  specific language governing permissions and limitations
 #  under the License.
+
 import unittest
 from unittest.mock import patch, MagicMock
 from botocore.exceptions import ClientError
@@ -134,4 +135,4 @@ class TestSecretHelper(unittest.TestCase):
         )
 
 if __name__ == '__main__':
-    unittest.main()
\ No newline at end of file
+    unittest.main()

From 5984c1989a8561afeb36275a16cae705aed2047e Mon Sep 17 00:00:00 2001
From: hmumtazz <144855436+hmumtazz@users.noreply.github.com>
Date: Mon, 2 Dec 2024 19:52:04 -0800
Subject: [PATCH 20/42] fixed license header test_SageMakerModel.py

Signed-off-by: hmumtazz <144855436+hmumtazz@users.noreply.github.com>
---
 tests/rag/test_ml_models/test_SageMakerModel.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/tests/rag/test_ml_models/test_SageMakerModel.py b/tests/rag/test_ml_models/test_SageMakerModel.py
index 1041f28e..46c880ad 100644
--- a/tests/rag/test_ml_models/test_SageMakerModel.py
+++ b/tests/rag/test_ml_models/test_SageMakerModel.py
@@ -1,4 +1,3 @@
-
 # SPDX-License-Identifier: Apache-2.0
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a

From 4503a55108f43de23a52af166aabe23a9d7b8a5d Mon Sep 17 00:00:00 2001
From: hmumtazz <144855436+hmumtazz@users.noreply.github.com>
Date: Mon, 2 Dec 2024 20:02:03 -0800
Subject: [PATCH 21/42] fixed license header rag.py

Signed-off-by: hmumtazz <144855436+hmumtazz@users.noreply.github.com>
---
 opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py | 11 ++++-------
 1 file changed, 4 insertions(+), 7 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
index e4d51b04..39e98617 100755
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
@@ -1,6 +1,4 @@
-#!/usr/bin/env python3
-
-# SPDX-License-Identifier: Apache-2.0
+#!/usr/bin/env python3  # SPDX-License-Identifier: Apache-2.0
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
@@ -20,10 +18,9 @@
 # Unless required by applicable law or agreed to in writing,
 # software distributed under the License is distributed on an
 # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-# KIND, either express or implied.  See the License for the
-# specific language governing permissions and limitations
+# KIND, either express or implied.  See the License for
+# the specific language governing permissions and limitations
 # under the License.
-
 """
 Main CLI script for OpenSearch PY ML
 """
@@ -194,4 +191,4 @@ def main():
 
 
 if __name__ == "__main__":
-    main()
\ No newline at end of file
+    main()

From b1b98abd18f295e3a0f47ecb905a455193e5f7a7 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Wed, 4 Dec 2024 17:44:17 -0800
Subject: [PATCH 22/42] Added seperate class for embedding generation, removed
 nominee text parametrs, added more functionality to user setup with knn
 index, fixed chunking proccessor to actually chunk rather, more intutituve
 user setup

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../rag_pipeline/rag/AIConnectorHelper.py     | 202 ++++++----
 .../rag_pipeline/rag/IAMRoleHelper.py         | 104 +++--
 .../rag_pipeline/rag/SecretsHelper.py         |  80 ++--
 .../ml_commons/rag_pipeline/rag/__init__.py   |   0
 .../rag_pipeline/rag/embedding_client.py      |  63 +++
 .../ml_commons/rag_pipeline/rag/ingest.py     | 205 +++++-----
 .../rag_pipeline/rag/model_register.py        |  79 ++--
 .../rag_pipeline/rag/opensearch_connector.py  | 194 +++++++---
 .../ml_commons/rag_pipeline/rag/query.py      | 194 +++++-----
 .../ml_commons/rag_pipeline/rag/rag.py        |  43 +--
 .../ml_commons/rag_pipeline/rag/rag_setup.py  | 363 +++++++++++-------
 .../ml_commons/rag_pipeline/rag/serverless.py |  16 -
 12 files changed, 955 insertions(+), 588 deletions(-)
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/embedding_client.py

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
index e7babe39..a915c74b 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import boto3
 import json
 import requests
@@ -29,14 +12,20 @@
 from requests_aws4auth import AWS4Auth
 import time
 from opensearchpy import OpenSearch, RequestsHttpConnection
+from urllib.parse import urlparse
 
-from IAMRoleHelper import IAMRoleHelper
-from SecretsHelper import SecretHelper
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper import IAMRoleHelper
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper import SecretHelper
 from opensearch_py_ml.ml_commons.model_access_control import ModelAccessControl
 
+
 class AIConnectorHelper:
+    """
+    Helper class for managing AI connectors and models in OpenSearch.
+    """
+
     def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
-                 opensearch_domain_password, aws_user_name, aws_role_name):
+                 opensearch_domain_password, aws_user_name, aws_role_name, opensearch_domain_url):
         """
         Initialize the AIConnectorHelper with necessary AWS and OpenSearch configurations.
         """
@@ -46,8 +35,9 @@ def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
         self.opensearch_domain_password = opensearch_domain_password
         self.aws_user_name = aws_user_name
         self.aws_role_name = aws_role_name
+        self.opensearch_domain_url = opensearch_domain_url
 
-        # Retrieve the OpenSearch domain endpoint and ARN
+        # Retrieve OpenSearch domain information
         domain_endpoint, domain_arn = self.get_opensearch_domain_info(self.region, self.opensearch_domain_name)
         if domain_arn:
             self.opensearch_domain_arn = domain_arn
@@ -55,26 +45,24 @@ def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
             print("Warning: Could not retrieve OpenSearch domain ARN.")
             self.opensearch_domain_arn = None
 
-        if domain_endpoint:
-            # Construct the full domain URL
-            self.opensearch_domain_url = f'https://{domain_endpoint}'
-        else:
-            print("Warning: Could not retrieve OpenSearch domain endpoint.")
-            self.opensearch_domain_url = None
+        # Parse the OpenSearch domain URL to extract host and port
+        parsed_url = urlparse(self.opensearch_domain_url)
+        host = parsed_url.hostname
+        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)
 
-        # Initialize the OpenSearch client
+        # Initialize OpenSearch client
         self.opensearch_client = OpenSearch(
-            hosts=[{'host': domain_endpoint, 'port': 443}],
+            hosts=[{'host': host, 'port': port}],
             http_auth=(self.opensearch_domain_username, self.opensearch_domain_password),
-            use_ssl=True,
+            use_ssl=(parsed_url.scheme == 'https'),
             verify_certs=True,
             connection_class=RequestsHttpConnection
         )
 
-        # Initialize ModelAccessControl
+        # Initialize ModelAccessControl for managing model groups
         self.model_access_control = ModelAccessControl(self.opensearch_client)
 
-        # Initialize IAMRoleHelper and SecretHelper
+        # Initialize helpers for IAM roles and secrets management
         self.iam_helper = IAMRoleHelper(
             region=self.region,
             opensearch_domain_url=self.opensearch_domain_url,
@@ -91,6 +79,10 @@ def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
     def get_opensearch_domain_info(region, domain_name):
         """
         Retrieve the OpenSearch domain endpoint and ARN based on the domain name and region.
+        
+        :param region: AWS region.
+        :param domain_name: Name of the OpenSearch domain.
+        :return: Tuple containing domain endpoint and ARN.
         """
         try:
             opensearch_client = boto3.client('opensearch', region_name=region)
@@ -106,6 +98,9 @@ def get_opensearch_domain_info(region, domain_name):
     def get_ml_auth(self, create_connector_role_name):
         """
         Obtain AWS4Auth credentials for ML API calls using the specified IAM role.
+        
+        :param create_connector_role_name: Name of the IAM role to assume.
+        :return: AWS4Auth object with temporary credentials.
         """
         create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
         if not create_connector_role_arn:
@@ -122,6 +117,13 @@ def get_ml_auth(self, create_connector_role_name):
         return awsauth
 
     def create_connector(self, create_connector_role_name, payload):
+        """
+        Create a connector in OpenSearch using the specified role and payload.
+        
+        :param create_connector_role_name: Name of the IAM role to assume.
+        :param payload: Payload data for creating the connector.
+        :return: ID of the created connector.
+        """
         create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
         temp_credentials = self.iam_helper.assume_role(create_connector_role_arn)
         awsauth = AWS4Auth(
@@ -137,21 +139,30 @@ def create_connector(self, create_connector_role_name, payload):
 
         headers = {"Content-Type": "application/json"}
 
-        r = requests.post(url, auth=awsauth, json=payload, headers=headers)
-        print(r.text)
-        connector_id = json.loads(r.text)['connector_id']
+        response = requests.post(url, auth=awsauth, json=payload, headers=headers)
+        print(response.text)
+        connector_id = json.loads(response.text).get('connector_id')
         return connector_id
 
     def search_model_group(self, model_group_name, create_connector_role_name):
         """
-        Utilize ModelAccessControl to search for a model group by name.
+        Search for a model group by name using ModelAccessControl.
+        
+        :param model_group_name: Name of the model group to search.
+        :param create_connector_role_name: Name of the IAM role to assume.
+        :return: Search response from OpenSearch.
         """
         response = self.model_access_control.search_model_group_by_name(model_group_name, size=1)
         return response
 
     def create_model_group(self, model_group_name, description, create_connector_role_name):
         """
-        Utilize ModelAccessControl to create or retrieve an existing model group.
+        Create or retrieve an existing model group using ModelAccessControl.
+        
+        :param model_group_name: Name of the model group.
+        :param description: Description of the model group.
+        :param create_connector_role_name: Name of the IAM role to assume.
+        :return: ID of the created or existing model group.
         """
         model_group_id = self.model_access_control.get_model_group_id_by_name(model_group_name)
         print("Search Model Group Response:", model_group_id)
@@ -159,10 +170,10 @@ def create_model_group(self, model_group_name, description, create_connector_rol
         if model_group_id:
             return model_group_id
 
-        # Use ModelAccessControl to register model group
+        # Register a new model group
         self.model_access_control.register_model_group(name=model_group_name, description=description)
         
-        # Retrieve the newly created model group id
+        # Retrieve the newly created model group ID
         model_group_id = self.model_access_control.get_model_group_id_by_name(model_group_name)
         if model_group_id:
             return model_group_id
@@ -170,19 +181,36 @@ def create_model_group(self, model_group_name, description, create_connector_rol
             raise Exception("Failed to create model group.")
 
     def get_task(self, task_id, create_connector_role_name):
+        """
+        Retrieve the status of a specific task using its ID.
+        
+        :param task_id: ID of the task to retrieve.
+        :param create_connector_role_name: Name of the IAM role to assume.
+        :return: Response from the task retrieval request.
+        """
         try:
             awsauth = self.get_ml_auth(create_connector_role_name)
-            r = requests.get(
+            response = requests.get(
                 f'{self.opensearch_domain_url}/_plugins/_ml/tasks/{task_id}',
                 auth=awsauth
             )
-            print("Get Task Response:", r.text)
-            return r
+            print("Get Task Response:", response.text)
+            return response
         except Exception as e:
             print(f"Error in get_task: {e}")
             raise
 
     def create_model(self, model_name, description, connector_id, create_connector_role_name, deploy=True):
+        """
+        Create a new model in OpenSearch and optionally deploy it.
+        
+        :param model_name: Name of the model to create.
+        :param description: Description of the model.
+        :param connector_id: ID of the connector to associate with the model.
+        :param create_connector_role_name: Name of the IAM role to assume.
+        :param deploy: Boolean indicating whether to deploy the model immediately.
+        :return: ID of the created model.
+        """
         try:
             model_group_id = self.create_model_group(model_name, description, create_connector_role_name)
             payload = {
@@ -197,37 +225,43 @@ def create_model(self, model_name, description, connector_id, create_connector_r
 
             awsauth = self.get_ml_auth(create_connector_role_name)
 
-            r = requests.post(
+            response = requests.post(
                 f'{self.opensearch_domain_url}/_plugins/_ml/models/_register?deploy={deploy_str}',
                 auth=awsauth,
                 json=payload,
                 headers=headers
             )
 
-            print("Create Model Response:", r.text)
-            response = json.loads(r.text)
+            print("Create Model Response:", response.text)
+            response_data = json.loads(response.text)
 
-            if 'model_id' in response:
-                return response['model_id']
-            elif 'task_id' in response:
+            if 'model_id' in response_data:
+                return response_data['model_id']
+            elif 'task_id' in response_data:
                 # Handle asynchronous task
                 time.sleep(2)  # Wait for task to complete
-                task_response = self.get_task(response['task_id'], create_connector_role_name)
+                task_response = self.get_task(response_data['task_id'], create_connector_role_name)
                 print("Task Response:", task_response.text)
                 task_result = json.loads(task_response.text)
                 if 'model_id' in task_result:
                     return task_result['model_id']
                 else:
                     raise KeyError(f"'model_id' not found in task response: {task_result}")
-            elif 'error' in response:
-                raise Exception(f"Error creating model: {response['error']}")
+            elif 'error' in response_data:
+                raise Exception(f"Error creating model: {response_data['error']}")
             else:
-                raise KeyError(f"The response does not contain 'model_id' or 'task_id'. Response content: {response}")
+                raise KeyError(f"The response does not contain 'model_id' or 'task_id'. Response content: {response_data}")
         except Exception as e:
             print(f"Error in create_model: {e}")
             raise
 
     def deploy_model(self, model_id):
+        """
+        Deploy a specified model in OpenSearch.
+        
+        :param model_id: ID of the model to deploy.
+        :return: Response from the deployment request.
+        """
         headers = {"Content-Type": "application/json"}
         response = requests.post(
             f'{self.opensearch_domain_url}/_plugins/_ml/models/{model_id}/_deploy',
@@ -238,19 +272,37 @@ def deploy_model(self, model_id):
         return response
 
     def predict(self, model_id, payload):
+        """
+        Make a prediction using the specified model and input payload.
+        
+        :param model_id: ID of the model to use for prediction.
+        :param payload: Input data for prediction.
+        :return: Response from the prediction request.
+        """
         headers = {"Content-Type": "application/json"}
-        r = requests.post(
+        response = requests.post(
             f'{self.opensearch_domain_url}/_plugins/_ml/models/{model_id}/_predict',
             auth=HTTPBasicAuth(self.opensearch_domain_username, self.opensearch_domain_password),
             json=payload,
             headers=headers
         )
-        print("Predict Response:", r.text)
-        return r
+        print("Predict Response:", response.text)
+        return response
 
     def create_connector_with_secret(self, secret_name, secret_value, connector_role_name, create_connector_role_name,
                                      create_connector_input, sleep_time_in_seconds=10):
-        # Step1: Create Secret
+        """
+        Create a connector in OpenSearch using a secret for credentials.
+        
+        :param secret_name: Name of the secret to create or use.
+        :param secret_value: Value of the secret.
+        :param connector_role_name: Name of the IAM role for the connector.
+        :param create_connector_role_name: Name of the IAM role to assume for creating the connector.
+        :param create_connector_input: Input payload for creating the connector.
+        :param sleep_time_in_seconds: Time to wait for IAM role propagation.
+        :return: ID of the created connector.
+        """
+        # Step 1: Create Secret
         print('Step1: Create Secret')
         if not self.secret_helper.secret_exists(secret_name):
             secret_arn = self.secret_helper.create_secret(secret_name, secret_value)
@@ -259,7 +311,7 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
             secret_arn = self.secret_helper.get_secret_arn(secret_name)
         print('----------')
 
-        # Step2: Create IAM role configured in connector
+        # Step 2: Create IAM role configured in connector
         trust_policy = {
             "Version": "2012-10-17",
             "Statement": [
@@ -296,7 +348,7 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
         print('----------')
 
         # Step 3: Configure IAM role in OpenSearch
-        # 3.1 Create IAM role for Signing create connector request
+        # 3.1 Create IAM role for signing create connector request
         user_arn = self.iam_helper.get_user_arn(self.aws_user_name)
         role_arn = self.iam_helper.get_role_arn(self.aws_role_name)
         statements = []
@@ -347,20 +399,14 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
             create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
         print('----------')
 
-        # 3.2 Map backend role
+        # 3.2 Map IAM role to backend role in OpenSearch
         print(f'Step 3.2: Map IAM role {create_connector_role_name} to OpenSearch permission role')
         self.iam_helper.map_iam_role_to_backend_role(create_connector_role_arn)
         print('----------')
 
         # Step 4: Create connector
         print('Step 4: Create connector in OpenSearch')
-        # When you create an IAM role, it can take some time for the changes to propagate across AWS systems.
-        # During this time, some services might not immediately recognize the new role or its permissions.
-        # So we wait for some time before creating connector.
-        # If you see such error: ClientError: An error occurred (AccessDenied) when calling the AssumeRole operation
-        # you can rerun this function.
-
-        # Wait for some time
+        # Wait to ensure IAM role propagation
         time.sleep(sleep_time_in_seconds)
         payload = create_connector_input
         payload['credential'] = {
@@ -373,7 +419,17 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
 
     def create_connector_with_role(self, connector_role_inline_policy, connector_role_name, create_connector_role_name,
                                    create_connector_input, sleep_time_in_seconds=10):
-        # Step1: Create IAM role configured in connector
+        """
+        Create a connector in OpenSearch using an IAM role for credentials.
+        
+        :param connector_role_inline_policy: Inline policy for the connector IAM role.
+        :param connector_role_name: Name of the IAM role for the connector.
+        :param create_connector_role_name: Name of the IAM role to assume for creating the connector.
+        :param create_connector_input: Input payload for creating the connector.
+        :param sleep_time_in_seconds: Time to wait for IAM role propagation.
+        :return: ID of the created connector.
+        """
+        # Step 1: Create IAM role configured in connector
         trust_policy = {
             "Version": "2012-10-17",
             "Statement": [
@@ -397,7 +453,7 @@ def create_connector_with_role(self, connector_role_inline_policy, connector_rol
         print('----------')
 
         # Step 2: Configure IAM role in OpenSearch
-        # 2.1 Create IAM role for Signing create connector request
+        # 2.1 Create IAM role for signing create connector request
         user_arn = self.iam_helper.get_user_arn(self.aws_user_name)
         role_arn = self.iam_helper.get_role_arn(self.aws_role_name)
         statements = []
@@ -448,20 +504,14 @@ def create_connector_with_role(self, connector_role_inline_policy, connector_rol
             create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
         print('----------')
 
-        # 2.2 Map backend role
+        # 2.2 Map IAM role to backend role in OpenSearch
         print(f'Step 2.2: Map IAM role {create_connector_role_name} to OpenSearch permission role')
         self.iam_helper.map_iam_role_to_backend_role(create_connector_role_arn)
         print('----------')
 
         # Step 3: Create connector
         print('Step 3: Create connector in OpenSearch')
-        # When you create an IAM role, it can take some time for the changes to propagate across AWS systems.
-        # During this time, some services might not immediately recognize the new role or its permissions.
-        # So we wait for some time before creating connector.
-        # If you see such error: ClientError: An error occurred (AccessDenied) when calling the AssumeRole operation
-        # you can rerun this function.
-
-        # Wait for some time
+        # Wait to ensure IAM role propagation
         time.sleep(sleep_time_in_seconds)
         payload = create_connector_input
         payload['credential'] = {
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
index bbb62f1c..b4b5de90 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
@@ -5,31 +5,30 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import boto3
 import json
 from botocore.exceptions import ClientError
 import requests
 
+
 class IAMRoleHelper:
+    """
+    Helper class for managing IAM roles and their interactions with OpenSearch.
+    """
+
     def __init__(self, region, opensearch_domain_url=None, opensearch_domain_username=None,
                  opensearch_domain_password=None, aws_user_name=None, aws_role_name=None, opensearch_domain_arn=None):
+        """
+        Initialize the IAMRoleHelper with AWS and OpenSearch configurations.
+        
+        :param region: AWS region.
+        :param opensearch_domain_url: URL of the OpenSearch domain.
+        :param opensearch_domain_username: Username for OpenSearch domain authentication.
+        :param opensearch_domain_password: Password for OpenSearch domain authentication.
+        :param aws_user_name: AWS IAM user name.
+        :param aws_role_name: AWS IAM role name.
+        :param opensearch_domain_arn: ARN of the OpenSearch domain.
+        """
         self.region = region
         self.opensearch_domain_url = opensearch_domain_url
         self.opensearch_domain_username = opensearch_domain_username
@@ -39,6 +38,12 @@ def __init__(self, region, opensearch_domain_url=None, opensearch_domain_usernam
         self.opensearch_domain_arn = opensearch_domain_arn
 
     def role_exists(self, role_name):
+        """
+        Check if an IAM role exists.
+        
+        :param role_name: Name of the IAM role.
+        :return: True if the role exists, False otherwise.
+        """
         iam_client = boto3.client('iam')
 
         try:
@@ -52,22 +57,27 @@ def role_exists(self, role_name):
                 return False
 
     def delete_role(self, role_name):
+        """
+        Delete an IAM role along with its attached policies.
+        
+        :param role_name: Name of the IAM role to delete.
+        """
         iam_client = boto3.client('iam')
 
         try:
-            # Detach managed policies
+            # Detach managed policies from the role
             policies = iam_client.list_attached_role_policies(RoleName=role_name)['AttachedPolicies']
             for policy in policies:
                 iam_client.detach_role_policy(RoleName=role_name, PolicyArn=policy['PolicyArn'])
             print(f'All managed policies detached from role {role_name}.')
 
-            # Delete inline policies
+            # Delete inline policies associated with the role
             inline_policies = iam_client.list_role_policies(RoleName=role_name)['PolicyNames']
             for policy_name in inline_policies:
                 iam_client.delete_role_policy(RoleName=role_name, PolicyName=policy_name)
             print(f'All inline policies deleted from role {role_name}.')
 
-            # Now, delete the role
+            # Finally, delete the IAM role
             iam_client.delete_role(RoleName=role_name)
             print(f'Role {role_name} deleted.')
 
@@ -78,23 +88,31 @@ def delete_role(self, role_name):
                 print(f"An error occurred: {e}")
 
     def create_iam_role(self, role_name, trust_policy_json, inline_policy_json):
+        """
+        Create a new IAM role with specified trust and inline policies.
+        
+        :param role_name: Name of the IAM role to create.
+        :param trust_policy_json: Trust policy document in JSON format.
+        :param inline_policy_json: Inline policy document in JSON format.
+        :return: ARN of the created role or None if creation failed.
+        """
         iam_client = boto3.client('iam')
 
         try:
-            # Create the role with the trust policy
+            # Create the role with the provided trust policy
             create_role_response = iam_client.create_role(
                 RoleName=role_name,
                 AssumeRolePolicyDocument=json.dumps(trust_policy_json),
                 Description='Role with custom trust and inline policies',
             )
 
-            # Get the ARN of the newly created role
+            # Retrieve the ARN of the newly created role
             role_arn = create_role_response['Role']['Arn']
 
             # Attach the inline policy to the role
             iam_client.put_role_policy(
                 RoleName=role_name,
-                PolicyName='InlinePolicy',  # you can replace this with your preferred policy name
+                PolicyName='InlinePolicy',  # Replace with preferred policy name if needed
                 PolicyDocument=json.dumps(inline_policy_json)
             )
 
@@ -106,12 +124,17 @@ def create_iam_role(self, role_name, trust_policy_json, inline_policy_json):
             return None
 
     def get_role_arn(self, role_name):
+        """
+        Retrieve the ARN of an IAM role.
+        
+        :param role_name: Name of the IAM role.
+        :return: ARN of the role or None if not found.
+        """
         if not role_name:
             return None
         iam_client = boto3.client('iam')
         try:
             response = iam_client.get_role(RoleName=role_name)
-            # Return ARN of the role
             return response['Role']['Arn']
         except ClientError as e:
             if e.response['Error']['Code'] == 'NoSuchEntity':
@@ -122,6 +145,11 @@ def get_role_arn(self, role_name):
                 return None
 
     def get_role_details(self, role_name):
+        """
+        Print detailed information about an IAM role.
+        
+        :param role_name: Name of the IAM role.
+        """
         iam = boto3.client('iam')
 
         try:
@@ -135,6 +163,7 @@ def get_role_details(self, role_name):
             print("Assume Role Policy Document:")
             print(json.dumps(role['AssumeRolePolicyDocument'], indent=4, sort_keys=True))
 
+            # List and print all inline policies attached to the role
             list_role_policies_response = iam.list_role_policies(RoleName=role_name)
 
             for policy_name in list_role_policies_response['PolicyNames']:
@@ -150,6 +179,12 @@ def get_role_details(self, role_name):
                 print(f"An error occurred: {e}")
 
     def get_user_arn(self, username):
+        """
+        Retrieve the ARN of an IAM user.
+        
+        :param username: Name of the IAM user.
+        :return: ARN of the user or None if not found.
+        """
         if not username:
             return None
         iam_client = boto3.client('iam')
@@ -167,6 +202,13 @@ def get_user_arn(self, username):
                 return None
 
     def assume_role(self, role_arn, role_session_name="your_session_name"):
+        """
+        Assume an IAM role and obtain temporary security credentials.
+        
+        :param role_arn: ARN of the IAM role to assume.
+        :param role_session_name: Identifier for the assumed role session.
+        :return: Temporary security credentials or None if the operation fails.
+        """
         sts_client = boto3.client('sts')
 
         try:
@@ -175,7 +217,7 @@ def assume_role(self, role_arn, role_session_name="your_session_name"):
                 RoleSessionName=role_session_name,
             )
 
-            # Obtain the temporary credentials from the assumed role 
+            # Extract temporary credentials from the assumed role
             temp_credentials = assumed_role_object["Credentials"]
 
             return temp_credentials
@@ -184,7 +226,12 @@ def assume_role(self, role_arn, role_session_name="your_session_name"):
             return None
 
     def map_iam_role_to_backend_role(self, iam_role_arn):
-        os_security_role = 'ml_full_access'  # Changed from 'all_access' to 'ml_full_access'
+        """
+        Map an IAM role to an OpenSearch backend role for access control.
+        
+        :param iam_role_arn: ARN of the IAM role to map.
+        """
+        os_security_role = 'ml_full_access'  # Defines the OpenSearch security role to map to
         url = f'{self.opensearch_domain_url}/_plugins/_security/api/rolesmapping/{os_security_role}'
 
         payload = {
@@ -211,7 +258,10 @@ def map_iam_role_to_backend_role(self, iam_role_arn):
 
     def get_iam_user_name_from_arn(self, iam_principal_arn):
         """
-        Extract the IAM user name from the IAM principal ARN.
+        Extract the IAM user name from an IAM principal ARN.
+        
+        :param iam_principal_arn: ARN of the IAM principal.
+        :return: IAM user name or None if extraction fails.
         """
         # IAM user ARN format: arn:aws:iam::123456789012:user/user-name
         if iam_principal_arn and ':user/' in iam_principal_arn:
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py
index 7c454f57..c675c12c 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py
@@ -5,81 +5,117 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import logging
 import boto3
 import json
 from botocore.exceptions import ClientError
 
+# Configure the logger for this module
 logger = logging.getLogger(__name__)
 
+
 class SecretHelper:
-    def __init__(self, region):
+    """
+    Helper class for managing secrets in AWS Secrets Manager.
+    Provides methods to check existence, retrieve ARN, get secret values, and create new secrets.
+    """
+
+    def __init__(self, region: str):
+        """
+        Initialize the SecretHelper with the specified AWS region.
+
+        :param region: AWS region where the Secrets Manager is located.
+        """
         self.region = region
 
-    def secret_exists(self, secret_name):
+    def secret_exists(self, secret_name: str) -> bool:
+        """
+        Check if a secret with the given name exists in AWS Secrets Manager.
+
+        :param secret_name: Name of the secret to check.
+        :return: True if the secret exists, False otherwise.
+        """
+        # Initialize the Secrets Manager client
         secretsmanager = boto3.client('secretsmanager', region_name=self.region)
         try:
+            # Attempt to retrieve the secret value
             secretsmanager.get_secret_value(SecretId=secret_name)
             return True
         except ClientError as e:
+            # If the secret does not exist, return False
             if e.response['Error']['Code'] == 'ResourceNotFoundException':
                 return False
             else:
+                # Log other client errors and return False
                 logger.error(f"An error occurred: {e}")
                 return False
 
-    def get_secret_arn(self, secret_name):
+    def get_secret_arn(self, secret_name: str) -> str:
+        """
+        Retrieve the ARN of a secret in AWS Secrets Manager.
+
+        :param secret_name: Name of the secret.
+        :return: ARN of the secret if found, None otherwise.
+        """
+        # Initialize the Secrets Manager client
         secretsmanager = boto3.client('secretsmanager', region_name=self.region)
         try:
+            # Describe the secret to get its details
             response = secretsmanager.describe_secret(SecretId=secret_name)
             return response['ARN']
         except ClientError as e:
+            # Handle the case where the secret does not exist
             if e.response['Error']['Code'] == 'ResourceNotFoundException':
                 logger.warning(f"The requested secret {secret_name} was not found")
                 return None
             else:
+                # Log other client errors and return None
                 logger.error(f"An error occurred: {e}")
                 return None
 
-    def get_secret(self, secret_name):
+    def get_secret(self, secret_name: str) -> str:
+        """
+        Retrieve the secret value from AWS Secrets Manager.
+
+        :param secret_name: Name of the secret.
+        :return: Secret value as a string if found, None otherwise.
+        """
+        # Initialize the Secrets Manager client
         secretsmanager = boto3.client('secretsmanager', region_name=self.region)
         try:
+            # Get the secret value
             response = secretsmanager.get_secret_value(SecretId=secret_name)
             return response.get('SecretString')
         except ClientError as e:
+            # Handle the case where the secret does not exist
             if e.response['Error']['Code'] == 'ResourceNotFoundException':
                 logger.warning("The requested secret was not found")
                 return None
             else:
+                # Log other client errors and return None
                 logger.error(f"An error occurred: {e}")
                 return None
 
-    def create_secret(self, secret_name, secret_value):
+    def create_secret(self, secret_name: str, secret_value: dict) -> str:
+        """
+        Create a new secret in AWS Secrets Manager.
+
+        :param secret_name: Name of the secret to create.
+        :param secret_value: Dictionary containing the secret data.
+        :return: ARN of the created secret if successful, None otherwise.
+        """
+        # Initialize the Secrets Manager client
         secretsmanager = boto3.client('secretsmanager', region_name=self.region)
         try:
+            # Create the secret with the provided name and value
             response = secretsmanager.create_secret(
                 Name=secret_name,
                 SecretString=json.dumps(secret_value),
             )
+            # Log success and return the secret's ARN
             logger.info(f'Secret {secret_name} created successfully.')
             return response['ARN']
         except ClientError as e:
+            # Log errors during secret creation and return None
             logger.error(f'Error creating secret: {e}')
             return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/embedding_client.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/embedding_client.py
new file mode 100644
index 00000000..acfe6a45
--- /dev/null
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/embedding_client.py
@@ -0,0 +1,63 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+import time
+
+class EmbeddingClient:
+    def __init__(self, opensearch_client, embedding_model_id):
+        self.opensearch_client = opensearch_client
+        self.embedding_model_id = embedding_model_id
+
+    def get_text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
+        """
+        Generate a text embedding using OpenSearch's ML API with retry logic.
+
+        :param text: Text to generate embedding for.
+        :param max_retries: Maximum number of retry attempts.
+        :param initial_delay: Initial delay between retries in seconds.
+        :param backoff_factor: Factor by which the delay increases after each retry.
+        :return: Embedding vector or None if generation fails.
+        """
+        delay = initial_delay
+        for attempt in range(max_retries):
+            try:
+                payload = {
+                    "text_docs": [text]
+                }
+                response = self.opensearch_client.transport.perform_request(
+                    method="POST",
+                    url=f"/_plugins/_ml/_predict/text_embedding/{self.embedding_model_id}",
+                    body=payload
+                )
+                inference_results = response.get('inference_results', [])
+                if not inference_results:
+                    print(f"No inference results returned for text: {text}")
+                    return None
+                output = inference_results[0].get('output')
+
+                # Adjust the extraction of embedding data
+                if isinstance(output, list) and len(output) > 0:
+                    embedding_dict = output[0]
+                    if isinstance(embedding_dict, dict) and 'data' in embedding_dict:
+                        embedding = embedding_dict['data']
+                    else:
+                        print(f"Unexpected embedding output format: {output}")
+                        return None
+                elif isinstance(output, dict) and 'data' in output:
+                    embedding = output['data']
+                else:
+                    print(f"Unexpected embedding output format: {output}")
+                    return None
+
+                return embedding
+            except Exception as ex:
+                print(f"Error on attempt {attempt + 1}: {ex}")
+                if attempt == max_retries - 1:
+                    raise
+                time.sleep(delay)
+                delay *= backoff_factor
+        return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
index 0ec4ea2c..1a27a641 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import os
 import glob
 import json
@@ -36,39 +19,59 @@
 import time
 import random
 from opensearchpy import exceptions as opensearch_exceptions
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.embedding_client import EmbeddingClient
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import OpenSearchConnector
 
-from opensearch_connector import OpenSearchConnector
-
+# Initialize colorama for colored terminal output
 init(autoreset=True)  # Initialize colorama
 
+
 class Ingest:
+    """
+    Helper class for ingesting various file types into OpenSearch.
+    """
+
     def __init__(self, config):
-        # Initialize the Ingest class with configuration
+        """
+        Initialize the Ingest class with configuration.
+
+        :param config: Configuration dictionary containing necessary parameters.
+        """
         self.config = config
         self.aws_region = config.get('region')
         self.index_name = config.get('index_name')
         self.bedrock_client = None
         self.opensearch = OpenSearchConnector(config)
         self.embedding_model_id = config.get('embedding_model_id')
+        self.embedding_client = None  # Will be initialized after OpenSearch client is ready
         self.pipeline_name = config.get('ingest_pipeline_name', 'text-chunking-ingest-pipeline')
 
-        if not self.embedding_model_id:
-            print("Embedding model ID is not set. Please run setup first.")
-            return
+    def initialize_clients(self) -> bool:
+        """
+        Initialize the OpenSearch client and the EmbeddingClient.
 
-    def initialize_clients(self):
-        # Initialize OpenSearch client
+        :return: True if initialization is successful, False otherwise.
+        """
         if self.opensearch.initialize_opensearch_client():
             print("OpenSearch client initialized successfully.")
+
+            # Now that OpenSearch client is initialized, initialize the embedding client
+            if not self.embedding_model_id:
+                print("Embedding model ID is not set. Please run setup first.")
+                return False
+
+            self.embedding_client = EmbeddingClient(self.opensearch.opensearch_client, self.embedding_model_id)
             return True
         else:
             print("Failed to initialize OpenSearch client.")
             return False
-
+        
     def ingest_command(self, paths: List[str]):
-        # Main ingestion command
-        # Processes all valid files in the given paths and initiates ingestion
+        """
+        Main ingestion command that processes and ingests all valid files from the provided paths.
 
+        :param paths: List of file or directory paths to ingest.
+        """
         all_files = []
         for path in paths:
             if os.path.isfile(path):
@@ -80,18 +83,25 @@ def ingest_command(self, paths: List[str]):
             else:
                 print(f"{Fore.YELLOW}Invalid path: {path}{Style.RESET_ALL}")
 
+        # Define supported file extensions
         supported_extensions = ['.csv', '.txt', '.pdf']
         valid_files = [f for f in all_files if any(f.lower().endswith(ext) for ext in supported_extensions)]
 
+        # Check if there are valid files to ingest
         if not valid_files:
             print(f"{Fore.RED}No valid files found for ingestion.{Style.RESET_ALL}")
             return
 
         print(f"{Fore.GREEN}Found {len(valid_files)} valid files for ingestion.{Style.RESET_ALL}")
 
+        # Process and ingest data from valid files
         self.process_and_ingest_data(valid_files)
 
     def process_and_ingest_data(self, file_paths: List[str]):
+        """
+        Processes the provided files, generates embeddings, and ingests the data into OpenSearch.
+        """
+        # Initialize clients before ingestion
         if not self.initialize_clients():
             print("Failed to initialize clients. Aborting ingestion.")
             return
@@ -99,6 +109,11 @@ def process_and_ingest_data(self, file_paths: List[str]):
         # Create the ingest pipeline
         self.create_ingest_pipeline(self.pipeline_name)
 
+        # Retrieve field names from the config
+        passage_text_field = self.config.get('passage_text_field', 'passage_text')
+        passage_chunk_field = self.config.get('passage_chunk_field', 'passage_chunk')
+        embedding_field = self.config.get('embedding_field', 'passage_embedding')
+
         all_documents = []
         for file_path in file_paths:
             print(f"\nProcessing file: {file_path}")
@@ -111,10 +126,12 @@ def process_and_ingest_data(self, file_paths: List[str]):
         print("\nGenerating embeddings for the documents...")
         success_count = 0
         error_count = 0
+
+        # Progress bar for embedding generation
         with tqdm(total=total_documents, bar_format='{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}]') as pbar:
             for doc in all_documents:
                 try:
-                    embedding = self.text_embedding(doc['text'])
+                    embedding = self.embedding_client.get_text_embedding(doc['text'])
                     if embedding is not None:
                         doc['embedding'] = embedding
                         success_count += 1
@@ -130,6 +147,7 @@ def process_and_ingest_data(self, file_paths: List[str]):
         print(f"\n{Fore.GREEN}Documents with successful embeddings: {success_count}{Style.RESET_ALL}")
         print(f"{Fore.RED}Documents with failed embeddings: {error_count}{Style.RESET_ALL}")
 
+        # Check if there are documents to ingest
         if success_count == 0:
             print(f"{Fore.RED}No documents to ingest. Aborting ingestion.{Style.RESET_ALL}")
             return
@@ -142,52 +160,82 @@ def process_and_ingest_data(self, file_paths: List[str]):
                     "_op_type": "index",
                     "_index": self.index_name,
                     "_source": {
-                        "nominee_text": doc['text'],
-                        "nominee_vector": doc['embedding']
+                        passage_text_field: doc['text'],
+                        embedding_field: {
+                            "knn": doc['embedding']
+                        }
                     },
-                    "pipeline": self.pipeline_name  # Use the pipeline name specified in the config
+                    "pipeline": self.pipeline_name
                 }
                 actions.append(action)
 
+        # Bulk index the documents into OpenSearch
         success, failed = self.opensearch.bulk_index(actions)
         print(f"\n{Fore.GREEN}Successfully ingested {success} documents.{Style.RESET_ALL}")
         print(f"{Fore.RED}Failed to ingest {failed} documents.{Style.RESET_ALL}")
 
-    def create_ingest_pipeline(self, pipeline_id):
-        # Check if pipeline exists
+
+    def create_ingest_pipeline(self, pipeline_id: str):
+        """
+        Creates an ingest pipeline in OpenSearch if it does not already exist.
+        :param pipeline_id: ID of the ingest pipeline to create.
+        """
         try:
-            response = self.opensearch.opensearch_client.ingest.get_pipeline(id=pipeline_id)
+            # Check if the pipeline already exists
+            self.opensearch.opensearch_client.ingest.get_pipeline(id=pipeline_id)
             print(f"\nIngest pipeline '{pipeline_id}' already exists.")
         except opensearch_exceptions.NotFoundError:
             # Pipeline does not exist, create it
+            embedding_dimension = int(self.config.get('embedding_dimension', 768))
+            # Calculate token_limit based on embedding dimension if not set
+            token_limit = int(self.config.get('token_limit', int(embedding_dimension * 0.75)))
+            tokenizer = self.config.get('tokenizer', 'standard')
+            overlap_rate = float(self.config.get('overlap_rate', 0.2))
+            source_field = self.config.get('passage_text_field', 'passage_text')
+            target_field = self.config.get('passage_chunk_field', 'passage_chunk')
+            embedding_field = self.config.get('embedding_field', 'passage_embedding')
+            model_id = self.embedding_model_id
+
             pipeline_body = {
-                "description": "A text chunking ingest pipeline",
+                "description": "A text chunking and embedding ingest pipeline",
                 "processors": [
                     {
                         "text_chunking": {
                             "algorithm": {
                                 "fixed_token_length": {
-                                    "token_limit": 384,
-                                    "overlap_rate": 0.2,
-                                    "tokenizer": "standard"
+                                    "token_limit": token_limit,
+                                    "overlap_rate": overlap_rate,
+                                    "tokenizer": tokenizer
                                 }
                             },
                             "field_map": {
-                                "nominee_text": "passage_chunk"
+                                source_field: target_field
+                            }
+                        }
+                    },
+                    {
+                        "text_embedding": {
+                            "model_id": model_id,
+                            "field_map": {
+                                target_field: embedding_field
                             }
                         }
                     }
                 ]
             }
+            # Create the ingest pipeline
             self.opensearch.opensearch_client.ingest.put_pipeline(id=pipeline_id, body=pipeline_body)
             print(f"\nIngest pipeline '{pipeline_id}' created successfully.")
         except Exception as e:
             print(f"\nError checking or creating ingest pipeline: {e}")
 
     def process_file(self, file_path: str) -> List[Dict[str, str]]:
-        # Process a file based on its extension
-        # Supports CSV, TXT, and PDF files
-        # Returns a list of dictionaries containing extracted text
+        """
+        Processes a file based on its extension and extracts text.
+
+        :param file_path: Path to the file to process.
+        :return: List of dictionaries containing extracted text.
+        """
         _, file_extension = os.path.splitext(file_path)
 
         if file_extension.lower() == '.csv':
@@ -201,9 +249,12 @@ def process_file(self, file_path: str) -> List[Dict[str, str]]:
             return []
 
     def process_csv(self, file_path: str) -> List[Dict[str, str]]:
-        # Process a CSV file
-        # Extracts information and returns a list of dictionaries
-        # Each dictionary contains the entire row content
+        """
+        Processes a CSV file and extracts each row as a JSON string.
+
+        :param file_path: Path to the CSV file.
+        :return: List of dictionaries with extracted text.
+        """
         documents = []
         with open(file_path, 'r', newline='', encoding='utf-8') as csvfile:
             reader = csv.DictReader(csvfile)
@@ -212,17 +263,23 @@ def process_csv(self, file_path: str) -> List[Dict[str, str]]:
         return documents
 
     def process_txt(self, file_path: str) -> List[Dict[str, str]]:
-        # Process a TXT file
-        # Reads the entire content of the file
-        # Returns a list with a single dictionary containing the file content
+        """
+        Processes a TXT file and reads its entire content.
+
+        :param file_path: Path to the TXT file.
+        :return: List containing a single dictionary with the file content.
+        """
         with open(file_path, 'r') as txtfile:
             content = txtfile.read()
         return [{"text": content}]
 
     def process_pdf(self, file_path: str) -> List[Dict[str, str]]:
-        # Process a PDF file
-        # Extracts text from each page of the PDF
-        # Returns a list of dictionaries, each containing text from a page
+        """
+        Processes a PDF file and extracts text from each page.
+
+        :param file_path: Path to the PDF file.
+        :return: List of dictionaries, each containing text from a page.
+        """
         documents = []
         with open(file_path, 'rb') as pdffile:
             pdf_reader = PyPDF2.PdfReader(pdffile)
@@ -232,47 +289,3 @@ def process_pdf(self, file_path: str) -> List[Dict[str, str]]:
                     documents.append({"text": extracted_text})
         return documents
 
-    def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
-        if self.opensearch is None:
-            print("OpenSearch client is not initialized. Please run setup first.")
-            return None
-
-        delay = initial_delay
-        for attempt in range(max_retries):
-            try:
-                payload = {
-                    "text_docs": [text]
-                }
-                response = self.opensearch.opensearch_client.transport.perform_request(
-                    method="POST",
-                    url=f"/_plugins/_ml/_predict/text_embedding/{self.embedding_model_id}",
-                    body=payload
-                )
-                inference_results = response.get('inference_results', [])
-                if not inference_results:
-                    print(f"No inference results returned for text: {text}")
-                    return None
-                output = inference_results[0].get('output')
-
-                # Adjust the extraction of embedding data
-                if isinstance(output, list) and len(output) > 0:
-                    embedding_dict = output[0]
-                    if isinstance(embedding_dict, dict) and 'data' in embedding_dict:
-                        embedding = embedding_dict['data']
-                    else:
-                        print(f"Unexpected embedding output format: {output}")
-                        return None
-                elif isinstance(output, dict) and 'data' in output:
-                    embedding = output['data']
-                else:
-                    print(f"Unexpected embedding output format: {output}")
-                    return None
-
-                return embedding
-            except Exception as ex:
-                print(f"Error on attempt {attempt + 1}: {ex}")
-                if attempt == max_retries - 1:
-                    raise
-                time.sleep(delay)
-                delay *= backoff_factor
-        return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
index ea6600fc..da21c62d 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
@@ -6,53 +6,51 @@
 # GitHub history for details.
 
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
-
 import os
 import json
 import time
 import boto3
 from urllib.parse import urlparse
 from colorama import Fore, Style, init
-from AIConnectorHelper import AIConnectorHelper
-from IAMRoleHelper import IAMRoleHelper
-from ml_models.BedrockModel import BedrockModel
-from ml_models.OpenAIModel import OpenAIModel
-from ml_models.CohereModel import CohereModel
-from ml_models.HuggingFaceModel import HuggingFaceModel
-from ml_models.PyTorchModel import CustomPyTorchModel
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import AIConnectorHelper
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper import IAMRoleHelper
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.BedrockModel import BedrockModel
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.OpenAIModel import OpenAIModel
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.CohereModel import CohereModel
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.HuggingFaceModel import HuggingFaceModel
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.PyTorchModel import CustomPyTorchModel
 import sys
 
+# Initialize colorama for colored terminal output
 init(autoreset=True)
 
+
 class ModelRegister:
+    """
+    Handles the registration of various embedding models with OpenSearch.
+    Supports multiple model providers and manages their integration.
+    """
+
     def __init__(self, config, opensearch_client, opensearch_domain_name):
-        # Initialize ModelRegister with necessary configurations
+        """
+        Initialize ModelRegister with necessary configurations.
+
+        :param config: Configuration dictionary containing necessary parameters.
+        :param opensearch_client: Instance of the OpenSearch client.
+        :param opensearch_domain_name: Name of the OpenSearch domain.
+        """
         self.config = config
         self.aws_region = config.get('region')
         self.opensearch_client = opensearch_client
         self.opensearch_domain_name = opensearch_domain_name
+        self.opensearch_endpoint = config.get('opensearch_endpoint')
         self.opensearch_username = config.get('opensearch_username')
         self.opensearch_password = config.get('opensearch_password')
         self.iam_principal = config.get('iam_principal')
         self.embedding_dimension = int(config.get('embedding_dimension', 768))
         self.service_type = config.get('service_type', 'managed')
+
+        # Initialize IAMRoleHelper with necessary parameters
         self.iam_role_helper = IAMRoleHelper(
             self.aws_region,
             self.opensearch_domain_name,
@@ -60,8 +58,12 @@ def __init__(self, config, opensearch_client, opensearch_domain_name):
             self.opensearch_password,
             self.iam_principal
         )
+
+        # Initialize AWS clients if the service type is not open-source
         if self.service_type != 'open-source':
             self.initialize_clients()
+
+        # Initialize instances of different model providers
         self.bedrock_model = BedrockModel(
             aws_region=self.aws_region,
             opensearch_domain_name=self.opensearch_domain_name,
@@ -98,13 +100,18 @@ def __init__(self, config, opensearch_client, opensearch_domain_name):
             iam_role_helper=self.iam_role_helper
         )
 
-    def initialize_clients(self):
-        # Initialize AWS clients only if necessary
+    def initialize_clients(self) -> bool:
+        """
+        Initialize AWS clients based on the service type.
+
+        :return: True if clients are initialized successfully, False otherwise.
+        """
         if self.service_type in ['managed', 'serverless']:
             try:
+                # Initialize Bedrock client for managed services
                 self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
                 # Add any other clients initialization if needed
-                time.sleep(7)
+                time.sleep(7)  # Wait for client initialization
                 print("AWS clients initialized successfully.")
                 return True
             except Exception as e:
@@ -116,7 +123,7 @@ def initialize_clients(self):
 
     def prompt_model_registration(self):
         """
-        Prompt the user to register a model or input an existing model ID.
+        Prompt the user to either register a new embedding model or use an existing model ID.
         """
         print("\nTo proceed, you need to configure an embedding model.")
         print("1. Register a new embedding model")
@@ -139,7 +146,11 @@ def prompt_model_registration(self):
             sys.exit(1)  # Exit the setup as we cannot proceed without a valid choice
 
     def save_config(self, config):
-        # Save configuration to the config file
+        """
+        Save the updated configuration to the config file.
+
+        :param config: Configuration dictionary to save.
+        """
         import configparser
         parser = configparser.ConfigParser()
         parser['DEFAULT'] = config
@@ -168,13 +179,15 @@ def register_model_interactive(self):
             aws_user_name = input("Enter your AWS IAM user name: ")
 
         # Instantiate AIConnectorHelper
+
         helper = AIConnectorHelper(
             region=self.aws_region,
             opensearch_domain_name=self.opensearch_domain_name,
             opensearch_domain_username=self.opensearch_username,
             opensearch_domain_password=self.opensearch_password,
             aws_user_name=aws_user_name,
-            aws_role_name=None  # Set to None or provide if applicable
+            aws_role_name=None,  # Set to None or provide if applicable
+            opensearch_domain_url=self.opensearch_endpoint  # Pass the endpoint from config
         )
 
         # Prompt user to select a model
@@ -215,7 +228,7 @@ def register_model_interactive(self):
 
     def prompt_opensource_model_registration(self):
         """
-        Handle model registration for open-source OpenSearch.
+        Handle model registration specifically for open-source OpenSearch.
         """
         print("\nWould you like to register an embedding model now?")
         print("1. Yes, register a new model")
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
index 59433193..1bf12dbc 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
@@ -5,31 +5,25 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth, exceptions as opensearch_exceptions
 import boto3
 from urllib.parse import urlparse
 from opensearchpy import helpers as opensearch_helpers
 
+
 class OpenSearchConnector:
+    """
+    Manages the connection and interactions with the OpenSearch cluster.
+    Provides methods to initialize the client, create indices, perform bulk indexing, and execute searches.
+    """
+
     def __init__(self, config):
-        # Initialize the OpenSearchConnector with configuration
+        """
+        Initialize the OpenSearchConnector with the provided configuration.
+
+        :param config: Dictionary containing configuration parameters.
+        """
+        # Store the configuration
         self.config = config
         self.opensearch_client = None
         self.aws_region = config.get('region')
@@ -40,122 +34,200 @@ def __init__(self, config):
         self.opensearch_password = config.get('opensearch_password')
         self.service_type = config.get('service_type')
 
-    def initialize_opensearch_client(self):
-        # Initialize the OpenSearch client
+    def initialize_opensearch_client(self) -> bool:
+        """
+        Initialize the OpenSearch client based on the service type and configuration.
+
+        :return: True if the client is initialized successfully, False otherwise.
+        """
+        # Check if the OpenSearch endpoint is provided
         if not self.opensearch_endpoint:
             print("OpenSearch endpoint not set. Please run setup first.")
             return False
 
+        # Parse the OpenSearch endpoint URL
         parsed_url = urlparse(self.opensearch_endpoint)
         host = parsed_url.hostname
         port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)  # Default ports
 
+        # Determine the authentication method based on the service type
         if self.service_type == 'serverless':
+            # Use AWS V4 Signer Authentication for serverless
             credentials = boto3.Session().get_credentials()
             auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
         elif self.service_type == 'managed':
+            # Use basic authentication for managed services
             if not self.opensearch_username or not self.opensearch_password:
                 print("OpenSearch username or password not set. Please run setup first.")
                 return False
             auth = (self.opensearch_username, self.opensearch_password)
         elif self.service_type == 'open-source':
+            # Use basic authentication if credentials are provided, else no authentication
             if self.opensearch_username and self.opensearch_password:
                 auth = (self.opensearch_username, self.opensearch_password)
             else:
                 auth = None  # No authentication
         else:
+            # Invalid service type
             print("Invalid service type. Please check your configuration.")
             return False
 
+        # Determine SSL settings based on the endpoint scheme
+        use_ssl = parsed_url.scheme == 'https'
+        verify_certs = True  # Always verify certificates unless you have a specific reason not to
+
         try:
+            # Initialize the OpenSearch client
             self.opensearch_client = OpenSearch(
                 hosts=[{'host': host, 'port': port}],
                 http_auth=auth,
-                use_ssl=parsed_url.scheme == 'https',
-                verify_certs=False if parsed_url.scheme == 'https' else True,
+                use_ssl=use_ssl,
+                verify_certs=verify_certs,
+                ssl_show_warn=False,          # Suppress SSL warnings
+                # ssl_context=ssl_context,      # Not needed unless you have custom certificates
                 connection_class=RequestsHttpConnection,
                 pool_maxsize=20
             )
             print(f"Initialized OpenSearch client with host: {host} and port: {port}")
             return True
         except Exception as ex:
+            # Handle initialization errors
             print(f"Error initializing OpenSearch client: {ex}")
             return False
 
-    def create_index(self, embedding_dimension, space_type):
+
+    def create_index(self, embedding_dimension: int, space_type: str, ef_construction: int,
+                    number_of_shards: int, number_of_replicas: int,
+                    passage_text_field: str, passage_chunk_field: str, embedding_field: str):
+        """
+            Create a KNN index in OpenSearch with the specified parameters.
+
+            :param embedding_dimension: The dimension of the embedding vectors.
+            :param space_type: The space type for the KNN algorithm (e.g., 'cosinesimil', 'l2').
+            :param ef_construction: ef_construction parameter for KNN
+            :param number_of_shards: Number of shards for the index
+            :param number_of_replicas: Number of replicas for the index
+            :param nominee_text_field: Field name for nominee text
+        """
+        # Define the index mapping and settings
         index_body = {
             "mappings": {
                 "properties": {
-                    "nominee_text": {"type": "text"},
-                    "passage_chunk": {"type": "text"},
-                    "nominee_vector": {
-                        "type": "knn_vector",
-                        "dimension": embedding_dimension,
-                        "method": {
-                            "name": "hnsw",
-                            "space_type": space_type,
-                            "engine": "nmslib",
-                            "parameters": {"ef_construction": 512, "m": 16},
-                        },
-                    },
+                    passage_text_field: {"type": "text"},
+                    passage_chunk_field: {"type": "text"},
+                    embedding_field: {
+                        "type": "nested",
+                        "properties": {
+                            "knn": {
+                                "type": "knn_vector",
+                                "dimension": embedding_dimension
+                            }
+                        }
+                    }
                 }
             },
             "settings": {
                 "index": {
-                    "number_of_shards": 2,
+                    "number_of_shards": number_of_shards,
+                    "number_of_replicas": number_of_replicas,
                     "knn.algo_param": {"ef_search": 512},
                     "knn": True,
                 }
             },
         }
+
         try:
+            # Attempt to create the index
             self.opensearch_client.indices.create(index=self.index_name, body=index_body)
-            print(f"KNN index '{self.index_name}' created successfully with dimension {embedding_dimension} and space type {space_type}.")
+            print(f"KNN index '{self.index_name}' created successfully with the following settings:")
+            print(f"Embedding Dimension: {embedding_dimension}")
+            print(f"Space Type: {space_type}")
+            print(f"ef_construction: {ef_construction}")
+            print(f"Number of Shards: {number_of_shards}")
+            print(f"Number of Replicas: {number_of_replicas}")
+            print(f"Text Field: '{passage_text_field}'")
+            print(f"Passage Chunk Field: '{passage_chunk_field}'")
+            print(f"Embedding Field: '{embedding_field}'")
         except opensearch_exceptions.RequestError as e:
+            # Handle cases where the index already exists
             if 'resource_already_exists_exception' in str(e).lower():
                 print(f"Index '{self.index_name}' already exists.")
             else:
+                # Handle other index creation errors
                 print(f"Error creating index '{self.index_name}': {e}")
 
-    def verify_and_create_index(self, embedding_dimension, space_type):
-        # Check if the index exists, create it if it doesn't
-        # Returns True if the index exists or was successfully created, False otherwise
+    def verify_and_create_index(self, embedding_dimension: int, space_type: str, ef_construction: int,
+                                number_of_shards: int, number_of_replicas: int,
+                                passage_text_field: str, passage_chunk_field: str, embedding_field: str) -> bool:
+        """
+        Verify if the index exists; if not, create it.
+
+        :param embedding_dimension: The dimension of the embedding vectors.
+        :param space_type: The space type for the KNN algorithm.
+        :param ef_construction: ef_construction parameter for KNN
+        :param number_of_shards: Number of shards for the index
+        :param number_of_replicas: Number of replicas for the index
+        :param nominee_text_field: Field name for nominee text
+        :return: True if the index exists or was successfully created, False otherwise.
+        """
         try:
+            # Check if the index already exists
             index_exists = self.opensearch_client.indices.exists(index=self.index_name)
             if index_exists:
                 print(f"KNN index '{self.index_name}' already exists.")
             else:
-                self.create_index(embedding_dimension, space_type)
+                # Create the index if it doesn't exist
+                self.create_index(embedding_dimension, space_type, ef_construction,
+                                number_of_shards, number_of_replicas, passage_text_field, passage_chunk_field, embedding_field)
             return True
         except Exception as ex:
+            # Handle errors during verification or creation
             print(f"Error verifying or creating index: {ex}")
             return False
 
-    def bulk_index(self, actions):
-        # Perform bulk indexing of documents
-        # Returns the number of successfully indexed documents and the number of failures
+    def bulk_index(self, actions: list) -> tuple:
+        """
+        Perform bulk indexing of documents into OpenSearch.
+
+        :param actions: List of indexing actions to perform.
+        :return: A tuple containing the number of successfully indexed documents and the number of failures.
+        """
         try:
+            # Execute bulk indexing using OpenSearch helpers
             success_count, error_info = opensearch_helpers.bulk(self.opensearch_client, actions)
             error_count = len(error_info)
             print(f"Indexed {success_count} documents successfully. Failed to index {error_count} documents.")
             return success_count, error_count
         except Exception as e:
+            # Handle bulk indexing errors
             print(f"Error during bulk indexing: {e}")
             return 0, len(actions)
 
-    def search(self, query_text, model_id, k=5):
+    def search(self, query_text: str, model_id: str, k: int = 5) -> list:
+        """
+        Perform a neural search based on the query text and model ID.
+        """
+        embedding_field = self.config.get('embedding_field', 'passage_embedding')
+
         try:
+            # Execute the search query using nested query
             response = self.opensearch_client.search(
                 index=self.index_name,
                 body={
                     "size": k,
                     "_source": ["passage_chunk"],
                     "query": {
-                        "neural": {
-                            "nominee_vector": {
-                                "query_text": query_text,
-                                "model_id": model_id,
-                                "k": k
+                        "nested": {
+                            "score_mode": "max",
+                            "path": embedding_field,
+                            "query": {
+                                "neural": {
+                                    f"{embedding_field}.knn": {
+                                        "query_text": query_text,
+                                        "model_id": model_id,
+                                        "k": k
+                                    }
+                                }
                             }
                         }
                     }
@@ -163,20 +235,35 @@ def search(self, query_text, model_id, k=5):
             )
             return response['hits']['hits']
         except Exception as e:
+            # Handle search errors
             print(f"Error during search: {e}")
             return []
 
-    def check_connection(self):
+    def check_connection(self) -> bool:
+        """
+        Check the connection to the OpenSearch cluster.
+
+        :return: True if the connection is successful, False otherwise.
+        """
         try:
+            # Retrieve cluster information to verify connection
             self.opensearch_client.info()
             return True
         except Exception as e:
+            # Handle connection errors
             print(f"Error connecting to OpenSearch: {e}")
             return False
-        
 
-    def search_by_vector(self, vector, k=5):
+    def search_by_vector(self, vector: list, k: int = 5) -> list:
+        """
+        Perform a vector-based search using the provided embedding vector.
+
+        :param vector: The embedding vector to search with.
+        :param k: The number of top results to retrieve.
+        :return: A list of search hits.
+        """
         try:
+            # Execute the KNN search query
             response = self.opensearch_client.search(
                 index=self.index_name,
                 body={
@@ -194,5 +281,6 @@ def search_by_vector(self, vector, k=5):
             )
             return response['hits']['hits']
         except Exception as e:
+            # Handle search errors
             print(f"Error during search: {e}")
             return []
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
index 45f5e175..4881405b 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
@@ -5,27 +5,11 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import json
 from colorama import Fore, Style, init
 from typing import List
-from opensearch_connector import OpenSearchConnector
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import OpenSearchConnector
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.embedding_client import EmbeddingClient
 import requests
 import os
 import urllib3
@@ -33,13 +17,26 @@
 import time
 import tiktoken
 
+# Disable insecure request warnings
 urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
 
+# Initialize colorama for colored terminal output
 init(autoreset=True)  # Initialize colorama
 
+
 class Query:
+    """
+    Handles querying operations using OpenSearch and integrates with Large Language Models (LLMs) for generating responses.
+    Supports both neural and semantic search methods.
+    """
+
     def __init__(self, config):
-        # Initialize the Query class with configuration
+        """
+        Initialize the Query class with the provided configuration.
+
+        :param config: Configuration dictionary containing necessary parameters.
+        """
+        # Store the configuration
         self.config = config
         self.index_name = config.get('index_name')
         self.opensearch = OpenSearchConnector(config)
@@ -47,9 +44,7 @@ def __init__(self, config):
         self.llm_model_id = config.get('llm_model_id')  # Get the LLM model ID from config
         self.aws_region = config.get('region')
         self.bedrock_client = None
-
-        # Initialize the default search method from config
-        self.default_search_method = self.config.get('default_search_method', 'neural')
+        self.embedding_client = None  # Will be initialized after OpenSearch client is ready
 
         # Load LLM configurations from config
         self.llm_config = {
@@ -59,7 +54,10 @@ def __init__(self, config):
             "stopSequences": [s.strip() for s in config.get('llm_stop_sequences', '').split(',') if s.strip()]
         }
 
-        # Initialize OpenSearch client
+        # Set the default search method
+        self.default_search_method = self.config.get('default_search_method', 'neural')
+
+        # Initialize clients
         if not self.initialize_clients():
             print("Failed to initialize clients. Aborting.")
             return
@@ -69,24 +67,44 @@ def __init__(self, config):
             print("Failed to connect to OpenSearch. Please check your configuration.")
             return
 
-    def initialize_clients(self):
-        # Initialize OpenSearch client and Bedrock client if needed
+    def initialize_clients(self) -> bool:
+        """
+        Initialize the OpenSearch client and Bedrock client if LLM is configured.
+
+        :return: True if clients are initialized successfully, False otherwise.
+        """
+        # Initialize OpenSearch client
         if self.opensearch.initialize_opensearch_client():
             print("OpenSearch client initialized successfully.")
-            # Initialize Bedrock client only if needed
+
+            # Initialize EmbeddingClient now that OpenSearch client is ready
+            if not self.embedding_model_id:
+                print("Embedding model ID is not set. Please run setup first.")
+                return False
+
+            self.embedding_client = EmbeddingClient(self.opensearch.opensearch_client, self.embedding_model_id)
+
+            # Initialize Bedrock client only if LLM model ID is provided
             if self.llm_model_id:
                 try:
                     self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
                     print("Bedrock client initialized successfully.")
                 except Exception as e:
-                    print(f"Failed to initialize Bedrock client: {e}")
+                    print(f"{Fore.RED}Failed to initialize Bedrock client: {e}{Style.RESET_ALL}")
                     return False
             return True
         else:
-            print("Failed to initialize OpenSearch client.")
+            print(f"{Fore.RED}Failed to initialize OpenSearch client.{Style.RESET_ALL}")
             return False
 
-    def extract_relevant_sentences(self, query, text):
+    def extract_relevant_sentences(self, query: str, text: str) -> List[str]:
+        """
+        Extract relevant sentences from the text based on the query.
+
+        :param query: The user's query.
+        :param text: The text from which to extract sentences.
+        :return: A list of relevant sentences.
+        """
         # Lowercase and remove punctuation from query
         query_processed = ''.join(c.lower() if c.isalnum() or c.isspace() else ' ' for c in query)
         query_words = set(query_processed.split())
@@ -115,10 +133,18 @@ def extract_relevant_sentences(self, query, text):
         top_sentences = [sentence for score, sentence in sentence_scores]
         return top_sentences
 
-    def bulk_query_neural(self, queries, k=5):
+    def bulk_query_neural(self, queries: List[str], k: int = 5) -> List[dict]:
+        """
+        Perform bulk neural searches for a list of queries.
+
+        :param queries: List of query strings.
+        :param k: Number of top results to retrieve per query.
+        :return: List of results containing query, documents, and number of results.
+        """
         results = []
         for query_text in queries:
             try:
+                # Perform search using the neural method
                 hits = self.opensearch.search(query_text, self.embedding_model_id, k)
                 if hits:
                     # Collect the content from the retrieved documents
@@ -142,6 +168,7 @@ def bulk_query_neural(self, queries, k=5):
                     'num_results': num_results
                 })
             except Exception as ex:
+                # Handle search errors
                 print(f"{Fore.RED}Error performing search for query '{query_text}': {str(ex)}{Style.RESET_ALL}")
                 results.append({
                     'query': query_text,
@@ -151,12 +178,19 @@ def bulk_query_neural(self, queries, k=5):
 
         return results
 
-    def bulk_query_semantic(self, queries, k=5):
+    def bulk_query_semantic(self, queries: List[str], k: int = 5) -> List[dict]:
+        """
+        Perform bulk semantic searches for a list of queries by generating embeddings.
+
+        :param queries: List of query strings.
+        :param k: Number of top results to retrieve per query.
+        :return: List of results containing query, context, and number of results.
+        """
         # Generate embeddings for queries and search OpenSearch index
         # Returns a list of results containing query, context, and number of results
         query_vectors = []
         for query in queries:
-            embedding = self.text_embedding(query)
+            embedding = self.embedding_client.get_text_embedding(query)
             if embedding:
                 query_vectors.append(embedding)
             else:
@@ -166,6 +200,7 @@ def bulk_query_semantic(self, queries, k=5):
         results = []
         for i, vector in enumerate(query_vectors):
             if vector is None:
+                # Handle cases where embedding generation failed
                 results.append({
                     'query': queries[i],
                     'context': "",
@@ -173,7 +208,9 @@ def bulk_query_semantic(self, queries, k=5):
                 })
                 continue
             try:
+                # Perform vector-based search
                 hits = self.opensearch.search_by_vector(vector, k)
+                # Concatenate the retrieved passages as context
                 context = '\n'.join([hit['_source']['nominee_text'] for hit in hits])
                 results.append({
                     'query': queries[i],
@@ -181,6 +218,7 @@ def bulk_query_semantic(self, queries, k=5):
                     'num_results': len(hits)
                 })
             except Exception as ex:
+                # Handle search errors
                 print(f"{Fore.RED}Error performing search for query '{queries[i]}': {ex}{Style.RESET_ALL}")
                 results.append({
                     'query': queries[i],
@@ -189,66 +227,22 @@ def bulk_query_semantic(self, queries, k=5):
                 })
         return results
 
-    def text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
-        if self.opensearch.opensearch_client is None:
-            print("OpenSearch client is not initialized. Please run setup first.")
-            return None
-
-        delay = initial_delay
-        for attempt in range(max_retries):
-            try:
-                payload = {
-                    "text_docs": [text]
-                }
-                response = self.opensearch.opensearch_client.transport.perform_request(
-                    method="POST",
-                    url=f"/_plugins/_ml/_predict/text_embedding/{self.embedding_model_id}",
-                    body=payload
-                )
-                inference_results = response.get('inference_results', [])
-                if not inference_results:
-                    print(f"No inference results returned for text: {text}")
-                    return None
-                output = inference_results[0].get('output')
-
-                # Adjust the extraction of embedding data
-                if isinstance(output, list) and len(output) > 0:
-                    embedding_dict = output[0]
-                    if isinstance(embedding_dict, dict) and 'data' in embedding_dict:
-                        embedding = embedding_dict['data']
-                    else:
-                        print(f"Unexpected embedding output format: {output}")
-                        return None
-                elif isinstance(output, dict) and 'data' in output:
-                    embedding = output['data']
-                else:
-                    print(f"Unexpected embedding output format: {output}")
-                    return None
 
-                # Verify that embedding is a list of floats
-                if not isinstance(embedding, list) or not all(isinstance(x, (float, int)) for x in embedding):
-                    print(f"Embedding is not a list of floats: {embedding}")
-                    return None
+    def generate_answer(self, prompt: str, llm_config: dict) -> str:
+        """
+        Generate an answer using the configured Large Language Model (LLM).
 
-                return embedding
-            except Exception as ex:
-                print(f"Error on attempt {attempt + 1}: {ex}")
-                if attempt == max_retries - 1:
-                    raise
-                time.sleep(delay)
-                delay *= backoff_factor
-        return None
-
-    def generate_answer(self, prompt, llm_config):
-        # Generate an answer using the LLM model
-        # Handles token limit and configures LLM parameters
-        # Returns the generated answer or None if an error occurs
+        :param prompt: The prompt to send to the LLM.
+        :param llm_config: Configuration dictionary for the LLM parameters.
+        :return: Generated answer as a string or None if generation fails.
+        """
         try:
             max_input_tokens = 8192  # Max tokens for the model
             expected_output_tokens = llm_config.get('maxTokenCount', 1000)
             # Adjust the encoding based on the model
             encoding = tiktoken.get_encoding("cl100k_base")  # Use appropriate encoding
 
+            # Encode the prompt to count tokens
             prompt_tokens = encoding.encode(prompt)
             allowable_input_tokens = max_input_tokens - expected_output_tokens
 
@@ -256,40 +250,52 @@ def generate_answer(self, prompt, llm_config):
                 # Truncate the prompt to fit within the model's token limit
                 prompt_tokens = prompt_tokens[:allowable_input_tokens]
                 prompt = encoding.decode(prompt_tokens)
-                print(f"Prompt truncated to {allowable_input_tokens} tokens.")
+                print(f"{Fore.YELLOW}Prompt truncated to {allowable_input_tokens} tokens.{Style.RESET_ALL}")
 
             # Simplified LLM config with only supported parameters
-            llm_config = {
+            llm_config_simplified = {
                 'maxTokenCount': expected_output_tokens,
                 'temperature': llm_config.get('temperature', 0.7),
                 'topP': llm_config.get('topP', 1.0),
                 'stopSequences': llm_config.get('stopSequences', [])
             }
 
+            # Prepare the body for the LLM inference request
             body = json.dumps({
                 'inputText': prompt,
-                'textGenerationConfig': llm_config
+                'textGenerationConfig': llm_config_simplified
             })
+
+            # Invoke the LLM model using Bedrock client
             response = self.bedrock_client.invoke_model(modelId=self.llm_model_id, body=body)
             response_body = json.loads(response['body'].read())
             results = response_body.get('results', [])
             if not results:
-                print("No results returned from LLM.")
+                print(f"{Fore.YELLOW}No results returned from LLM.{Style.RESET_ALL}")
                 return None
             answer = results[0].get('outputText', '').strip()
             return answer
         except Exception as ex:
-            print(f"Error generating answer from LLM: {ex}")
+            # Handle errors during answer generation
+            print(f"{Fore.RED}Error generating answer from LLM: {ex}{Style.RESET_ALL}")
             return None
 
-    def query_command(self, queries: List[str], num_results=5):
+    def query_command(self, queries: List[str], num_results: int = 5):
+        """
+        Handle the querying process by performing either neural or semantic searches and generating answers using LLM.
+
+        :param queries: List of query strings.
+        :param num_results: Number of top results to retrieve per query.
+        """
+        # Retrieve the default search method from config
         search_method = self.default_search_method
 
         print(f"\nUsing the default search method: {search_method.capitalize()} Search")
 
-        # Keep the session active until the user types 'exit' or presses Enter without input
+        # Process each query until the user decides to exit
         while True:
             if not queries:
+                # Prompt the user for a new query
                 query_text = input("\nEnter a query (or type 'exit' to finish): ").strip()
                 if not query_text or query_text.lower() == 'exit':
                     print("\nExiting query session.")
@@ -309,6 +315,7 @@ def query_command(self, queries: List[str], num_results=5):
                             if not passage_chunks:
                                 continue
                             for passage in passage_chunks:
+                                # Extract relevant sentences from each passage
                                 relevant_sentences = self.extract_relevant_sentences(result['query'], passage)
                                 all_relevant_sentences.extend(relevant_sentences)
 
@@ -330,16 +337,17 @@ def query_command(self, queries: List[str], num_results=5):
                 # Use the LLM configurations from setup
                 llm_config = self.llm_config
 
+                # Perform semantic search
                 results = self.bulk_query_semantic(queries, k=num_results)
 
                 for result in results:
                     print(f"\nQuery: {result['query']}")
-                    print(f"Found {result['num_results']} results.")
 
                     if not result['context']:
                         print(f"\n{Fore.RED}No context available for this query.{Style.RESET_ALL}")
                         continue
 
+                    # Prepare the augmented prompt with context
                     augmented_prompt = f"""Context: {result['context']}
 Based on the above context, please provide a detailed and insightful answer to the following question. Feel free to make reasonable inferences or connections if the context doesn't provide all the information:
 
@@ -348,9 +356,11 @@ def query_command(self, queries: List[str], num_results=5):
 Answer:"""
 
                     print("\nGenerating answer using LLM...")
+                    # Generate the answer using the LLM
                     answer = self.generate_answer(augmented_prompt, llm_config)
 
                     if answer:
+                        # Display the generated answer
                         print("\nGenerated Answer:")
                         print(answer)
                     else:
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
index 39e98617..35b7fb2b 100755
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
@@ -2,25 +2,9 @@
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
-# Any modifications Copyright OpenSearch Contributors.
-# See GitHub history for details.
-
-# Licensed to Elasticsearch B.V. under one or more contributor
-# license agreements. See the NOTICE file distributed with
-# this work for additional information regarding copyright
-# ownership. Elasticsearch B.V. licenses this file to you under
-# the Apache License, Version 2.0 (the "License"); you may
-# not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#   http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing,
-# software distributed under the License is distributed on an
-# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-# KIND, either express or implied.  See the License for
-# the specific language governing permissions and limitations
-# under the License.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
 """
 Main CLI script for OpenSearch PY ML
 """
@@ -31,22 +15,25 @@
 from colorama import Fore, Style, init
 from rich.console import Console
 from rich.prompt import Prompt
-from rag_setup import Setup
-from ingest import Ingest
-from query import Query
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.rag_setup import Setup
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest import Ingest
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.query import Query
 
-# Initialize colorama
+# Initialize colorama for colored terminal output
 init(autoreset=True)
 
-# Initialize Rich console
+# Initialize Rich console for enhanced CLI outputs
 console = Console()
 
+# Configuration file name
 CONFIG_FILE = 'config.ini'
 
 
-def load_config():
+def load_config() -> dict:
     """
     Load configuration from the config file.
+
+    :return: Dictionary of configuration parameters.
     """
     config = configparser.ConfigParser()
     config.read(CONFIG_FILE)
@@ -56,9 +43,11 @@ def load_config():
     return config['DEFAULT']
 
 
-def save_config(config):
+def save_config(config: dict):
     """
     Save configuration to the config file.
+
+    :param config: Dictionary of configuration parameters.
     """
     parser = configparser.ConfigParser()
     parser['DEFAULT'] = config
@@ -137,7 +126,7 @@ def main():
         console.print("[bold cyan]Welcome to the RAG Pipeline[/bold cyan]")
         console.print("Use [bold blue]rag setup[/bold blue], [bold blue]rag ingest[/bold blue], or [bold blue]rag query[/bold blue] to begin.\n")
 
-    # Load existing configuration
+    # Load existing configuration if not running setup
     if args.command != 'setup' and args.command:
         config = load_config()
     else:
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index 623a4922..33a30621 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import boto3
 import botocore
 from botocore.config import Config
@@ -38,19 +21,31 @@
 from colorama import Fore, Style, init
 import ssl
 
-from serverless import Serverless  
-from AIConnectorHelper import AIConnectorHelper 
-from model_register import ModelRegister
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import OpenSearchConnector
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless import Serverless  
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import AIConnectorHelper 
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register import ModelRegister
 
+# Initialize colorama for colored terminal output
 init(autoreset=True)
 
+
 class Setup:
+    """
+    Handles the setup and configuration of the OpenSearch environment.
+    Manages AWS credentials, OpenSearch client initialization, index creation,
+    and model registration.
+    """
+    
     CONFIG_FILE = 'config.ini'
     SERVICE_AOSS = 'opensearchserverless'
     SERVICE_BEDROCK = 'bedrock-runtime'
 
     def __init__(self):
-        # Initialize setup variables
+        """
+        Initialize the Setup class with default or existing configurations.
+        """
+        # Load existing configuration
         self.config = self.load_config()
         self.aws_region = self.config.get('region', 'us-west-2')
         self.iam_principal = self.config.get('iam_principal', '')
@@ -94,10 +89,11 @@ def configure_aws(self):
         print("Let's configure your AWS credentials.")
 
         aws_access_key_id = input("Enter your AWS Access Key ID: ").strip()
-        aws_secret_access_key = input("Enter your AWS Secret Access Key: ").strip()
-        aws_region_input = input("Enter your preferred AWS region (e.g., us-west-2): ").strip()
+        aws_secret_access_key = self.get_password_with_asterisks("Enter your AWS Secret Access Key: ")
+        aws_region_input = input(f"Enter your preferred AWS region [{self.aws_region}]: ").strip() or self.aws_region
 
         try:
+            # Configure AWS credentials using subprocess to call AWS CLI
             subprocess.run([
                 'aws', 'configure', 'set', 
                 'aws_access_key_id', aws_access_key_id
@@ -119,7 +115,7 @@ def configure_aws(self):
         except Exception as e:
             print(f"{Fore.RED}An unexpected error occurred: {e}{Style.RESET_ALL}")
 
-    def load_config(self):
+    def load_config(self) -> dict:
         """
         Load configuration from the config file.
 
@@ -131,7 +127,7 @@ def load_config(self):
             return dict(config['DEFAULT'])
         return {}
 
-    def get_password_with_asterisks(self, prompt="Enter password: "):
+    def get_password_with_asterisks(self, prompt="Enter password: ") -> str:
         """
         Get password input from user, masking it with asterisks.
 
@@ -153,9 +149,13 @@ def get_password_with_asterisks(self, prompt="Enter password: "):
                         sys.stdout.write('\b \b')  # Erase the last asterisk
                         sys.stdout.flush()
                 else:
-                    password += key.decode('utf-8')
-                    sys.stdout.write('*')  # Mask input with '*'
-                    sys.stdout.flush()
+                    try:
+                        char = key.decode('utf-8')
+                        password += char
+                        sys.stdout.write('*')  # Mask input with '*'
+                        sys.stdout.flush()
+                    except UnicodeDecodeError:
+                        continue
         else:
             import termios, tty
             fd = sys.stdin.fileno()
@@ -188,7 +188,6 @@ def setup_configuration(self):
         """
         config = self.load_config()
 
-        print("\nStarting setup process...")
 
         # First, prompt for service type
         print("\nChoose OpenSearch service type:")
@@ -336,7 +335,7 @@ def setup_configuration(self):
         print(f"\n{Fore.GREEN}Configuration saved successfully to {os.path.abspath(self.CONFIG_FILE)}.{Style.RESET_ALL}\n")
 
 
-    def initialize_clients(self):
+    def initialize_clients(self) -> bool:
         """
         Initialize AWS clients (AOSS and Bedrock) only if not open-source.
 
@@ -352,17 +351,20 @@ def initialize_clients(self):
                 retries={'max_attempts': 10, 'mode': 'standard'}
             )
             if self.is_serverless:
+                # Initialize AOSS client for serverless service
                 self.aoss_client = boto3.client(self.SERVICE_AOSS, config=boto_config)
+            # Initialize Bedrock client for managed or serverless services
             self.bedrock_client = boto3.client(self.SERVICE_BEDROCK, region_name=self.aws_region)
             
             time.sleep(7)  # Wait for clients to initialize
             print(f"{Fore.GREEN}AWS clients initialized successfully.{Style.RESET_ALL}\n")
             return True
         except Exception as e:
+            # Handle initialization errors
             print(f"{Fore.RED}Failed to initialize AWS clients: {e}{Style.RESET_ALL}")
             return False
 
-    def get_opensearch_domain_name(self):
+    def get_opensearch_domain_name(self) -> str:
         """
         Extract the domain name from the OpenSearch endpoint URL.
 
@@ -385,7 +387,7 @@ def get_opensearch_domain_name(self):
         return None
 
     @staticmethod
-    def get_opensearch_domain_info(region, domain_name):
+    def get_opensearch_domain_info(region: str, domain_name: str) -> tuple:
         """
         Retrieve the OpenSearch domain endpoint and ARN based on the domain name and region.
 
@@ -404,7 +406,13 @@ def get_opensearch_domain_info(region, domain_name):
             print(f"{Fore.RED}Error retrieving OpenSearch domain info: {e}{Style.RESET_ALL}")
             return None, None
 
-    def initialize_opensearch_client(self):
+# In Setup class, modify the initialize_opensearch_client method
+    def initialize_opensearch_client(self) -> bool:
+        """
+        Initialize the OpenSearch client based on the service type and configuration.
+
+        :return: True if the client is initialized successfully, False otherwise.
+        """
         if not self.opensearch_endpoint:
             print(f"{Fore.RED}OpenSearch endpoint not set. Please run setup first.{Style.RESET_ALL}\n")
             return False
@@ -413,6 +421,7 @@ def initialize_opensearch_client(self):
         host = parsed_url.hostname
         port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)  # Default ports
 
+        # Determine the authentication method based on the service type
         if self.service_type == 'serverless':
             credentials = boto3.Session().get_credentials()
             auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
@@ -430,42 +439,90 @@ def initialize_opensearch_client(self):
             print("Invalid service type. Please check your configuration.")
             return False
 
+        # Determine SSL settings based on the endpoint scheme
         use_ssl = parsed_url.scheme == 'https'
-        verify_certs = False if use_ssl else True
+        verify_certs = True  # Always verify certificates unless you have a specific reason not to
+
+        try:
+            # Initialize the OpenSearch client
+            self.opensearch_client = OpenSearch(
+                hosts=[{'host': host, 'port': port}],
+                http_auth=auth,
+                use_ssl=use_ssl,
+                verify_certs=verify_certs,
+                ssl_show_warn=False,          # Suppress SSL warnings
+                # ssl_context=ssl_context,      # Not needed unless you have custom certificates
+                connection_class=RequestsHttpConnection,
+                pool_maxsize=20
+            )
+            print(f"{Fore.GREEN}Initialized OpenSearch client with host: {host} and port: {port}{Style.RESET_ALL}\n")
+            return True
+        except Exception as ex:
+            # Handle initialization errors
+            print(f"{Fore.RED}Error initializing OpenSearch client: {ex}{Style.RESET_ALL}\n")
+            return False
+
+    def initialize_opensearch_client(self) -> bool:
+        """
+        Initialize the OpenSearch client based on the service type and configuration.
+
+        :return: True if the client is initialized successfully, False otherwise.
+        """
+        if not self.opensearch_endpoint:
+            print(f"{Fore.RED}OpenSearch endpoint not set. Please run setup first.{Style.RESET_ALL}\n")
+            return False
+
+        parsed_url = urlparse(self.opensearch_endpoint)
+        host = parsed_url.hostname
+        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)  # Default ports
 
-        # Create an SSL context that does not verify certificates if needed
-        if use_ssl and not verify_certs:
-            ssl_context = ssl.create_default_context()
-            ssl_context.check_hostname = False
-            ssl_context.verify_mode = ssl.CERT_NONE
+        # Determine the authentication method based on the service type
+        if self.service_type == 'serverless':
+            credentials = boto3.Session().get_credentials()
+            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
+        elif self.service_type == 'managed':
+            if not self.opensearch_username or not self.opensearch_password:
+                print(f"{Fore.RED}OpenSearch username or password not set. Please run setup first.{Style.RESET_ALL}\n")
+                return False
+            auth = (self.opensearch_username, self.opensearch_password)
+        elif self.service_type == 'open-source':
+            if self.opensearch_username and self.opensearch_password:
+                auth = (self.opensearch_username, self.opensearch_password)
+            else:
+                auth = None  # No authentication
         else:
-            ssl_context = None
+            print("Invalid service type. Please check your configuration.")
+            return False
+
+        # Determine SSL settings based on the endpoint scheme
+        use_ssl = parsed_url.scheme == 'https'
+        verify_certs = True  # Always verify certificates unless you have a specific reason not to
 
         try:
+            # Initialize the OpenSearch client
             self.opensearch_client = OpenSearch(
                 hosts=[{'host': host, 'port': port}],
                 http_auth=auth,
                 use_ssl=use_ssl,
                 verify_certs=verify_certs,
                 ssl_show_warn=False,          # Suppress SSL warnings
-                ssl_context=ssl_context,      # Use the custom SSL context
+                # ssl_context=ssl_context,      # Not needed unless you have custom certificates
                 connection_class=RequestsHttpConnection,
                 pool_maxsize=20
             )
             print(f"{Fore.GREEN}Initialized OpenSearch client with host: {host} and port: {port}{Style.RESET_ALL}\n")
             return True
         except Exception as ex:
+            # Handle initialization errors
             print(f"{Fore.RED}Error initializing OpenSearch client: {ex}{Style.RESET_ALL}\n")
             return False
-        
-    def get_knn_index_details(self):
-        """
-        Prompt user for KNN index details (embedding dimension, space type, and ef_construction).
 
-        :return: Tuple of (embedding_dimension, space_type, ef_construction)
+    def get_knn_index_details(self) -> tuple:
+        """
+        Prompt user for KNN index details (embedding dimension, space type, ef_construction,
+        number of shards, number of replicas, and field names).
         """
         dimension_input = input("Press Enter to use the default embedding size (768), or type a custom size: ").strip()
-        
         if dimension_input == "":
             embedding_dimension = 768
         else:
@@ -477,6 +534,7 @@ def get_knn_index_details(self):
 
         print(f"\nEmbedding dimension set to: {embedding_dimension}")
 
+        # Prompt for space type
         print("\nChoose the space type for KNN:")
         print("1. L2 (Euclidean distance)")
         print("2. Cosine similarity")
@@ -495,9 +553,8 @@ def get_knn_index_details(self):
 
         print(f"Space type set to: {space_type}")
 
-        # New prompt for ef_construction
+        # Prompt for ef_construction
         ef_construction_input = input("\nPress Enter to use the default ef_construction value (512), or type a custom value: ").strip()
-        
         if ef_construction_input == "":
             ef_construction = 512
         else:
@@ -509,8 +566,51 @@ def get_knn_index_details(self):
 
         print(f"ef_construction set to: {ef_construction}\n")
 
-        return embedding_dimension, space_type, ef_construction
-    def save_config(self, config):
+        # Prompt for number of shards
+        shards_input = input("\nEnter number of shards (Press Enter for default value 2): ").strip()
+        if shards_input == "":
+            number_of_shards = 2
+        else:
+            try:
+                number_of_shards = int(shards_input)
+            except ValueError:
+                print("Invalid input. Using default number of shards: 2.")
+                number_of_shards = 2
+        print(f"Number of shards set to: {number_of_shards}")
+
+        # Prompt for number of replicas
+        replicas_input = input("\nEnter number of replicas (Press Enter for default value 2): ").strip()
+        if replicas_input == "":
+            number_of_replicas = 2
+        else:
+            try:
+                number_of_replicas = int(replicas_input)
+            except ValueError:
+                print("Invalid input. Using default number of replicas: 2.")
+                number_of_replicas = 2
+        print(f"Number of replicas set to: {number_of_replicas}")
+
+        # Prompt for passage_text field name
+        passage_text_field = input("\nEnter the field name for text content (Press Enter for default 'passage_text'): ").strip()
+        if passage_text_field == "":
+            passage_text_field = "passage_text"
+        print(f"Text content field name set to: {passage_text_field}")
+
+        # Prompt for passage_chunk field name
+        passage_chunk_field = input("\nEnter the field name for passage chunks (Press Enter for default 'passage_chunk'): ").strip()
+        if passage_chunk_field == "":
+            passage_chunk_field = "passage_chunk"
+        print(f"Passage chunk field name set to: {passage_chunk_field}")
+
+        # Prompt for embedding field name
+        embedding_field = input("\nEnter the field name for embeddings (Press Enter for default 'passage_embedding'): ").strip()
+        if embedding_field == "":
+            embedding_field = "passage_embedding"
+        print(f"Embedding field name set to: {embedding_field}")
+
+        return embedding_dimension, space_type, ef_construction, number_of_shards, number_of_replicas, passage_text_field, passage_chunk_field, embedding_field
+
+    def save_config(self, config: dict):
         """
         Save configuration to the config file.
 
@@ -521,73 +621,7 @@ def save_config(self, config):
         config_path = os.path.abspath(self.CONFIG_FILE)
         with open(self.CONFIG_FILE, 'w') as f:
             parser.write(f)
-        # Removed duplicate message
-        # Only one message is printed where this method is called
-    def create_index(self, embedding_dimension, space_type, ef_construction):
-        """
-        Create the KNN index in OpenSearch.
-
-        :param embedding_dimension: Dimension of the embedding vectors
-        :param space_type: Type of space for KNN
-        :param ef_construction: ef_construction parameter for KNN
-        """
-        index_body = {
-            "mappings": {
-                "properties": {
-                    "nominee_text": {"type": "text"},
-                    "nominee_vector": {
-                        "type": "knn_vector",
-                        "dimension": embedding_dimension,
-                        "method": {
-                            "name": "hnsw",
-                            "space_type": space_type,
-                            "engine": "nmslib",
-                            "parameters": {"ef_construction": ef_construction, "m": 16},
-                        },
-                    },
-                }
-            },
-            "settings": {
-                "index": {
-                    "number_of_shards": 2,
-                    "knn.algo_param": {"ef_search": 512},
-                    "knn": True,
-                }
-            },
-        }
-        try:
-            self.opensearch_client.indices.create(index=self.index_name, body=index_body)
-            print(f"\n{Fore.GREEN}KNN index '{self.index_name}' created successfully with dimension {embedding_dimension}, space type {space_type}, and ef_construction {ef_construction}.{Style.RESET_ALL}\n")
-        except Exception as e:
-            if 'resource_already_exists_exception' in str(e).lower():
-                print(f"\n{Fore.YELLOW}Index '{self.index_name}' already exists.{Style.RESET_ALL}\n")
-            else:
-                print(f"\n{Fore.RED}Error creating index '{self.index_name}': {e}{Style.RESET_ALL}\n")
-
-    def verify_and_create_index(self, embedding_dimension, space_type, ef_construction):
-        """
-        Verify if the index exists; if not, create it.
-
-        :param embedding_dimension: Dimension of the embedding vectors
-        :param space_type: Type of space for KNN
-        :param ef_construction: ef_construction parameter for KNN
-        :return: True if index exists or is created successfully, False otherwise
-        """
-        try:
-            print(f"Attempting to verify index '{self.index_name}'...")
-            index_exists = self.opensearch_client.indices.exists(index=self.index_name)
-            if index_exists:
-                print(f"{Fore.GREEN}KNN index '{self.index_name}' already exists.{Style.RESET_ALL}\n")
-            else:
-                print(f"{Fore.YELLOW}Index '{self.index_name}' does not exist. Attempting to create...{Style.RESET_ALL}\n")
-                self.create_index(embedding_dimension, space_type, ef_construction)
-            return True
-        except Exception as ex:
-            print(f"{Fore.RED}Error verifying or creating index: {ex}{Style.RESET_ALL}")
-            print(f"OpenSearch client config: {self.opensearch_client.transport.hosts}\n")
-            return False
-
-    def get_truncated_name(self, base_name, max_length=32):
+    def get_truncated_name(self, base_name: str, max_length: int = 32) -> str:
         """
         Truncate a name to fit within a specified length.
 
@@ -603,6 +637,7 @@ def setup_command(self):
         """
         Main setup command that orchestrates the entire setup process.
         """
+        # Begin setup by configuring necessary parameters
         self.setup_configuration()
 
         if self.service_type != 'open-source' and not self.initialize_clients():
@@ -610,7 +645,7 @@ def setup_command(self):
             return
 
         if self.service_type == 'serverless':
-
+            # Serverless-specific setup can be added here if needed
             pass
         elif self.service_type == 'managed':
             if not self.opensearch_endpoint:
@@ -644,14 +679,29 @@ def setup_command(self):
                 self.save_config(self.config)
 
                 print("\nProceeding with index creation...\n")
-                embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
-
-                if self.verify_and_create_index(embedding_dimension, space_type, ef_construction):
+                embedding_dimension, space_type, ef_construction, number_of_shards, number_of_replicas, \
+                passage_text_field, passage_chunk_field, embedding_field = self.get_knn_index_details()
+
+                # Create an instance of OpenSearchConnector
+                self.opensearch_connector = OpenSearchConnector(self.config)
+                self.opensearch_connector.opensearch_client = self.opensearch_client  # Use the initialized client
+                self.opensearch_connector.index_name = self.index_name  # Set the index name
+
+                # Verify and create the index
+                if self.opensearch_connector.verify_and_create_index(
+                    embedding_dimension, space_type, ef_construction, number_of_shards,
+                    number_of_replicas, passage_text_field, passage_chunk_field, embedding_field
+                ):
                     print(f"\n{Fore.GREEN}KNN index '{self.index_name}' created successfully.{Style.RESET_ALL}\n")
                     # Save index details to config
                     self.config['embedding_dimension'] = str(embedding_dimension)
                     self.config['space_type'] = space_type
                     self.config['ef_construction'] = str(ef_construction)
+                    self.config['number_of_shards'] = str(number_of_shards)
+                    self.config['number_of_replicas'] = str(number_of_replicas)
+                    self.config['passage_text_field'] = passage_text_field
+                    self.config['passage_chunk_field'] = passage_chunk_field
+                    self.config['embedding_field'] = embedding_field
                     self.save_config(self.config)
                 else:
                     print(f"\n{Fore.RED}Index creation failed. Please check your permissions and try again.{Style.RESET_ALL}\n")
@@ -665,36 +715,56 @@ def setup_command(self):
                 self.index_name = existing_index_name
                 self.config['index_name'] = self.index_name
                 self.save_config(self.config)
-                # Load index details from config or prompt for them
-                if 'embedding_dimension' in self.config and 'space_type' in self.config and 'ef_construction' in self.config:
-                    try:
-                        embedding_dimension = int(self.config['embedding_dimension'])
-                        space_type = self.config['space_type']
-                        ef_construction = int(self.config['ef_construction'])
-                        print(f"\nUsing existing index '{self.index_name}' with embedding dimension {embedding_dimension}, space type '{space_type}', and ef_construction {ef_construction}.\n")
-                    except ValueError:
-                        print("\nInvalid index details in configuration. Prompting for details again.\n")
-                        embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
+
+                # Verify that the index exists
+                try:
+                    if not self.opensearch_client.indices.exists(index=self.index_name):
+                        print(f"\n{Fore.RED}Index '{self.index_name}' does not exist in OpenSearch. Aborting.{Style.RESET_ALL}\n")
+                        return
+                    else:
+                        print(f"\n{Fore.GREEN}Index '{self.index_name}' exists in OpenSearch.{Style.RESET_ALL}\n")
+                        # Attempt to retrieve index settings and mappings
+                        index_info = self.opensearch_client.indices.get(index=self.index_name)
+                        settings = index_info[self.index_name]['settings']['index']
+                        mappings = index_info[self.index_name]['mappings']['properties']
+
+                        # Extract embedding dimension from the mapping
+                        embedding_field_mappings = mappings.get('passage_embedding', {})
+                        knn_mappings = embedding_field_mappings.get('properties', {}).get('knn', {})
+                        embedding_dimension = knn_mappings.get('dimension', 768)
+                        method = knn_mappings.get('method', {})
+                        space_type = method.get('space_type', 'l2')
+                        ef_construction = method.get('parameters', {}).get('ef_construction', 512)
+                        number_of_shards = settings.get('number_of_shards', '2')
+                        number_of_replicas = settings.get('number_of_replicas', '2')
+                        passage_text_field = 'passage_text'  # Assuming default, or you can extract if stored differently
+                        passage_chunk_field = 'passage_chunk'  # Assuming default
+                        embedding_field = 'passage_embedding'  # Assuming default
+
+                        print(f"\nUsing existing index '{self.index_name}' with the following settings:")
+                        print(f"Embedding Dimension: {embedding_dimension}")
+                        print(f"Space Type: {space_type}")
+                        print(f"ef_construction: {ef_construction}")
+                        print(f"Number of Shards: {number_of_shards}")
+                        print(f"Number of Replicas: {number_of_replicas}")
+                        print(f"Text Field: '{passage_text_field}'")
+                        print(f"Passage Chunk Field: '{passage_chunk_field}'")
+                        print(f"Embedding Field: '{embedding_field}'\n")
+
                         # Save index details to config
                         self.config['embedding_dimension'] = str(embedding_dimension)
                         self.config['space_type'] = space_type
                         self.config['ef_construction'] = str(ef_construction)
+                        self.config['number_of_shards'] = str(number_of_shards)
+                        self.config['number_of_replicas'] = str(number_of_replicas)
+                        self.config['passage_text_field'] = passage_text_field
+                        self.config['passage_chunk_field'] = passage_chunk_field
+                        self.config['embedding_field'] = embedding_field
                         self.save_config(self.config)
-                else:
-                    print("\nIndex details not found in configuration. Prompting for details.\n")
-                    embedding_dimension, space_type, ef_construction = self.get_knn_index_details()
-                    # Save index details to config
-                    self.config['embedding_dimension'] = str(embedding_dimension)
-                    self.config['space_type'] = space_type
-                    self.config['ef_construction'] = str(ef_construction)
-                    self.save_config(self.config)
-                # Verify that the index exists
-                if not self.opensearch_client.indices.exists(index=self.index_name):
-                    print(f"\n{Fore.RED}Index '{self.index_name}' does not exist in OpenSearch. Aborting.{Style.RESET_ALL}\n")
+
+                except Exception as ex:
+                    print(f"\n{Fore.RED}Error retrieving index details: {ex}{Style.RESET_ALL}\n")
                     return
-            else:
-                print(f"\n{Fore.RED}Invalid choice. Please run setup again and select a valid option.{Style.RESET_ALL}\n")
-                return
 
             # Proceed with model registration
             # Initialize ModelRegister now that OpenSearch client and domain name are available
@@ -712,4 +782,5 @@ def setup_command(self):
                 # Open-source OpenSearch: Provide instructions or automate model registration
                 self.model_register.prompt_opensource_model_registration()
         else:
+            # Handle failure to initialize OpenSearch client
             print(f"\n{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}\n")
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py
index 7aa30969..4e0d8479 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py
@@ -5,22 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
 import boto3
 import botocore
 import json

From d7e4713ea86133a39b07578ee95a7ae61d526773 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Wed, 4 Dec 2024 19:00:45 -0800
Subject: [PATCH 23/42] Correctly leveraged existing methods in AI connector
 class, without having method wrappers around them

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../rag_pipeline/rag/AIConnectorHelper.py     | 66 ++++++-------------
 1 file changed, 20 insertions(+), 46 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
index a915c74b..e4074faf 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
@@ -79,7 +79,7 @@ def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
     def get_opensearch_domain_info(region, domain_name):
         """
         Retrieve the OpenSearch domain endpoint and ARN based on the domain name and region.
-        
+
         :param region: AWS region.
         :param domain_name: Name of the OpenSearch domain.
         :return: Tuple containing domain endpoint and ARN.
@@ -98,7 +98,7 @@ def get_opensearch_domain_info(region, domain_name):
     def get_ml_auth(self, create_connector_role_name):
         """
         Obtain AWS4Auth credentials for ML API calls using the specified IAM role.
-        
+
         :param create_connector_role_name: Name of the IAM role to assume.
         :return: AWS4Auth object with temporary credentials.
         """
@@ -119,7 +119,7 @@ def get_ml_auth(self, create_connector_role_name):
     def create_connector(self, create_connector_role_name, payload):
         """
         Create a connector in OpenSearch using the specified role and payload.
-        
+
         :param create_connector_role_name: Name of the IAM role to assume.
         :param payload: Payload data for creating the connector.
         :return: ID of the created connector.
@@ -144,46 +144,10 @@ def create_connector(self, create_connector_role_name, payload):
         connector_id = json.loads(response.text).get('connector_id')
         return connector_id
 
-    def search_model_group(self, model_group_name, create_connector_role_name):
-        """
-        Search for a model group by name using ModelAccessControl.
-        
-        :param model_group_name: Name of the model group to search.
-        :param create_connector_role_name: Name of the IAM role to assume.
-        :return: Search response from OpenSearch.
-        """
-        response = self.model_access_control.search_model_group_by_name(model_group_name, size=1)
-        return response
-
-    def create_model_group(self, model_group_name, description, create_connector_role_name):
-        """
-        Create or retrieve an existing model group using ModelAccessControl.
-        
-        :param model_group_name: Name of the model group.
-        :param description: Description of the model group.
-        :param create_connector_role_name: Name of the IAM role to assume.
-        :return: ID of the created or existing model group.
-        """
-        model_group_id = self.model_access_control.get_model_group_id_by_name(model_group_name)
-        print("Search Model Group Response:", model_group_id)
-
-        if model_group_id:
-            return model_group_id
-
-        # Register a new model group
-        self.model_access_control.register_model_group(name=model_group_name, description=description)
-        
-        # Retrieve the newly created model group ID
-        model_group_id = self.model_access_control.get_model_group_id_by_name(model_group_name)
-        if model_group_id:
-            return model_group_id
-        else:
-            raise Exception("Failed to create model group.")
-
     def get_task(self, task_id, create_connector_role_name):
         """
         Retrieve the status of a specific task using its ID.
-        
+
         :param task_id: ID of the task to retrieve.
         :param create_connector_role_name: Name of the IAM role to assume.
         :return: Response from the task retrieval request.
@@ -203,7 +167,7 @@ def get_task(self, task_id, create_connector_role_name):
     def create_model(self, model_name, description, connector_id, create_connector_role_name, deploy=True):
         """
         Create a new model in OpenSearch and optionally deploy it.
-        
+
         :param model_name: Name of the model to create.
         :param description: Description of the model.
         :param connector_id: ID of the connector to associate with the model.
@@ -212,7 +176,17 @@ def create_model(self, model_name, description, connector_id, create_connector_r
         :return: ID of the created model.
         """
         try:
-            model_group_id = self.create_model_group(model_name, description, create_connector_role_name)
+            # Use ModelAccessControl methods directly without wrapping
+            model_group_id = self.model_access_control.get_model_group_id_by_name(model_name)
+            if not model_group_id:
+                self.model_access_control.register_model_group(
+                    name=model_name,
+                    description=description
+                )
+                model_group_id = self.model_access_control.get_model_group_id_by_name(model_name)
+                if not model_group_id:
+                    raise Exception("Failed to create model group.")
+
             payload = {
                 "name": model_name,
                 "function_name": "remote",
@@ -258,7 +232,7 @@ def create_model(self, model_name, description, connector_id, create_connector_r
     def deploy_model(self, model_id):
         """
         Deploy a specified model in OpenSearch.
-        
+
         :param model_id: ID of the model to deploy.
         :return: Response from the deployment request.
         """
@@ -274,7 +248,7 @@ def deploy_model(self, model_id):
     def predict(self, model_id, payload):
         """
         Make a prediction using the specified model and input payload.
-        
+
         :param model_id: ID of the model to use for prediction.
         :param payload: Input data for prediction.
         :return: Response from the prediction request.
@@ -293,7 +267,7 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
                                      create_connector_input, sleep_time_in_seconds=10):
         """
         Create a connector in OpenSearch using a secret for credentials.
-        
+
         :param secret_name: Name of the secret to create or use.
         :param secret_value: Value of the secret.
         :param connector_role_name: Name of the IAM role for the connector.
@@ -421,7 +395,7 @@ def create_connector_with_role(self, connector_role_inline_policy, connector_rol
                                    create_connector_input, sleep_time_in_seconds=10):
         """
         Create a connector in OpenSearch using an IAM role for credentials.
-        
+
         :param connector_role_inline_policy: Inline policy for the connector IAM role.
         :param connector_role_name: Name of the IAM role for the connector.
         :param create_connector_role_name: Name of the IAM role to assume for creating the connector.

From c02fe1b377f5890b7b558675a4af243392398b5b Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Wed, 4 Dec 2024 19:34:18 -0800
Subject: [PATCH 24/42] Removed duplicate method, and deleted unused method

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/ingest.py     |  1 -
 .../ml_commons/rag_pipeline/rag/rag_setup.py  | 65 -------------------
 setup.py                                      |  2 +-
 3 files changed, 1 insertion(+), 67 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
index 1a27a641..8e20e3eb 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -8,7 +8,6 @@
 import os
 import glob
 import json
-import tiktoken
 from tqdm import tqdm
 from colorama import Fore, Style, init
 from typing import List, Dict
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index 33a30621..2bcb9042 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -462,60 +462,6 @@ def initialize_opensearch_client(self) -> bool:
             print(f"{Fore.RED}Error initializing OpenSearch client: {ex}{Style.RESET_ALL}\n")
             return False
 
-    def initialize_opensearch_client(self) -> bool:
-        """
-        Initialize the OpenSearch client based on the service type and configuration.
-
-        :return: True if the client is initialized successfully, False otherwise.
-        """
-        if not self.opensearch_endpoint:
-            print(f"{Fore.RED}OpenSearch endpoint not set. Please run setup first.{Style.RESET_ALL}\n")
-            return False
-
-        parsed_url = urlparse(self.opensearch_endpoint)
-        host = parsed_url.hostname
-        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)  # Default ports
-
-        # Determine the authentication method based on the service type
-        if self.service_type == 'serverless':
-            credentials = boto3.Session().get_credentials()
-            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
-        elif self.service_type == 'managed':
-            if not self.opensearch_username or not self.opensearch_password:
-                print(f"{Fore.RED}OpenSearch username or password not set. Please run setup first.{Style.RESET_ALL}\n")
-                return False
-            auth = (self.opensearch_username, self.opensearch_password)
-        elif self.service_type == 'open-source':
-            if self.opensearch_username and self.opensearch_password:
-                auth = (self.opensearch_username, self.opensearch_password)
-            else:
-                auth = None  # No authentication
-        else:
-            print("Invalid service type. Please check your configuration.")
-            return False
-
-        # Determine SSL settings based on the endpoint scheme
-        use_ssl = parsed_url.scheme == 'https'
-        verify_certs = True  # Always verify certificates unless you have a specific reason not to
-
-        try:
-            # Initialize the OpenSearch client
-            self.opensearch_client = OpenSearch(
-                hosts=[{'host': host, 'port': port}],
-                http_auth=auth,
-                use_ssl=use_ssl,
-                verify_certs=verify_certs,
-                ssl_show_warn=False,          # Suppress SSL warnings
-                # ssl_context=ssl_context,      # Not needed unless you have custom certificates
-                connection_class=RequestsHttpConnection,
-                pool_maxsize=20
-            )
-            print(f"{Fore.GREEN}Initialized OpenSearch client with host: {host} and port: {port}{Style.RESET_ALL}\n")
-            return True
-        except Exception as ex:
-            # Handle initialization errors
-            print(f"{Fore.RED}Error initializing OpenSearch client: {ex}{Style.RESET_ALL}\n")
-            return False
 
     def get_knn_index_details(self) -> tuple:
         """
@@ -621,17 +567,6 @@ def save_config(self, config: dict):
         config_path = os.path.abspath(self.CONFIG_FILE)
         with open(self.CONFIG_FILE, 'w') as f:
             parser.write(f)
-    def get_truncated_name(self, base_name: str, max_length: int = 32) -> str:
-        """
-        Truncate a name to fit within a specified length.
-
-        :param base_name: Original name
-        :param max_length: Maximum allowed length
-        :return: Truncated name
-        """
-        if len(base_name) <= max_length:
-            return base_name
-        return base_name[:max_length-3] + "..."
 
     def setup_command(self):
         """
diff --git a/setup.py b/setup.py
index 467e95f6..f935df39 100644
--- a/setup.py
+++ b/setup.py
@@ -112,7 +112,7 @@
     # Entry points for console scripts
     entry_points={
         'console_scripts': [
-            'rag=opensearch_py_ml.ml_commons.rag_pipeline.rag:main',
+            'rag=opensearch_py_ml.ml_commons.rag_pipeline.rag.rag:main',
         ],
     },
 )
\ No newline at end of file

From d877bcae30ac87c2c8a735e8491c1ee8c323b0d2 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Thu, 5 Dec 2024 00:33:35 -0800
Subject: [PATCH 25/42] Fixed chunking pipeline, query was not generating due
 to mismatchd vector fields, like name etc, updated knn index details and
 chunking details

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 config.ini                                    | 26 +++++++++++++++++++
 .../ml_commons/rag_pipeline/rag/ingest.py     |  7 +++--
 .../rag_pipeline/rag/opensearch_connector.py  | 22 +++++++++++-----
 .../ml_commons/rag_pipeline/rag/query.py      |  4 ++-
 .../ml_commons/rag_pipeline/rag/rag_setup.py  |  1 -
 5 files changed, 48 insertions(+), 12 deletions(-)
 create mode 100644 config.ini

diff --git a/config.ini b/config.ini
new file mode 100644
index 00000000..3a2afbae
--- /dev/null
+++ b/config.ini
@@ -0,0 +1,26 @@
+[DEFAULT]
+service_type = managed
+region = us-west-2
+iam_principal = arn:aws:iam::615299771255:user/hmumtazz
+collection_name = 
+opensearch_endpoint = https://search-hashim-test5-eivrlyacr3n653fnkkrg2yab7u.aos.us-west-2.on.aws
+opensearch_username = admin
+opensearch_password = MyPassword123!
+default_search_method = semantic
+llm_model_id = amazon.titan-text-express-v1
+llm_max_token_count = 1000
+llm_temperature = 0.7
+llm_top_p = 0.9
+llm_stop_sequences = 
+ingest_pipeline_name = text-chunking-ingest-pipeline
+index_name = nemaz
+embedding_dimension = 1536
+space_type = l2
+ef_construction = 512
+number_of_shards = 1
+number_of_replicas = 2
+passage_text_field = passage_text
+passage_chunk_field = passage_chunk
+embedding_field = passage_embedding
+embedding_model_id = ecFOjZMBEYoaB6B-K7-l
+
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
index 8e20e3eb..dc0f186a 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -8,6 +8,7 @@
 import os
 import glob
 import json
+import tiktoken
 from tqdm import tqdm
 from colorama import Fore, Style, init
 from typing import List, Dict
@@ -201,10 +202,8 @@ def create_ingest_pipeline(self, pipeline_id: str):
                     {
                         "text_chunking": {
                             "algorithm": {
-                                "fixed_token_length": {
-                                    "token_limit": token_limit,
-                                    "overlap_rate": overlap_rate,
-                                    "tokenizer": tokenizer
+                                "delimiter": {
+                                    "delimiter": "."
                                 }
                             },
                             "field_map": {
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
index 1bf12dbc..912720e5 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
@@ -262,18 +262,28 @@ def search_by_vector(self, vector: list, k: int = 5) -> list:
         :param k: The number of top results to retrieve.
         :return: A list of search hits.
         """
+        # Retrieve field names from the config
+        embedding_field = self.config.get('embedding_field', 'passage_embedding')
+        passage_text_field = self.config.get('passage_text_field', 'passage_text')
+        passage_chunk_field = self.config.get('passage_chunk_field', 'passage_chunk')
+
         try:
-            # Execute the KNN search query
+            # Execute the KNN search query using the correct field name
             response = self.opensearch_client.search(
                 index=self.index_name,
                 body={
                     "size": k,
-                    "_source": ["nominee_text", "passage_chunk"],
+                    "_source": [passage_text_field, passage_chunk_field],
                     "query": {
-                        "knn": {
-                            "nominee_vector": {
-                                "vector": vector,
-                                "k": k
+                        "nested": {
+                            "path": embedding_field,
+                            "query": {
+                                "knn": {
+                                    f"{embedding_field}.knn": {
+                                        "vector": vector,
+                                        "k": k
+                                    }
+                                }
                             }
                         }
                     }
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
index 4881405b..20752d4b 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
@@ -211,7 +211,9 @@ def bulk_query_semantic(self, queries: List[str], k: int = 5) -> List[dict]:
                 # Perform vector-based search
                 hits = self.opensearch.search_by_vector(vector, k)
                 # Concatenate the retrieved passages as context
-                context = '\n'.join([hit['_source']['nominee_text'] for hit in hits])
+                context = '\n'.join(
+                    [chunk for hit in hits for chunk in hit['_source'].get('passage_chunk', [])]
+                )
                 results.append({
                     'query': queries[i],
                     'context': context,
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index 2bcb9042..18abf94f 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -19,7 +19,6 @@
 from urllib.parse import urlparse
 from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth
 from colorama import Fore, Style, init
-import ssl
 
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import OpenSearchConnector
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless import Serverless  

From f0194ecc7b70517597654e2059c552c617b9dcd0 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Thu, 5 Dec 2024 02:16:51 -0800
Subject: [PATCH 26/42] Remove config.ini from repository and add to .gitignore

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 config.ini | 26 --------------------------
 1 file changed, 26 deletions(-)
 delete mode 100644 config.ini

diff --git a/config.ini b/config.ini
deleted file mode 100644
index 3a2afbae..00000000
--- a/config.ini
+++ /dev/null
@@ -1,26 +0,0 @@
-[DEFAULT]
-service_type = managed
-region = us-west-2
-iam_principal = arn:aws:iam::615299771255:user/hmumtazz
-collection_name = 
-opensearch_endpoint = https://search-hashim-test5-eivrlyacr3n653fnkkrg2yab7u.aos.us-west-2.on.aws
-opensearch_username = admin
-opensearch_password = MyPassword123!
-default_search_method = semantic
-llm_model_id = amazon.titan-text-express-v1
-llm_max_token_count = 1000
-llm_temperature = 0.7
-llm_top_p = 0.9
-llm_stop_sequences = 
-ingest_pipeline_name = text-chunking-ingest-pipeline
-index_name = nemaz
-embedding_dimension = 1536
-space_type = l2
-ef_construction = 512
-number_of_shards = 1
-number_of_replicas = 2
-passage_text_field = passage_text
-passage_chunk_field = passage_chunk
-embedding_field = passage_embedding
-embedding_model_id = ecFOjZMBEYoaB6B-K7-l
-

From d354b25959536c84e1befb3f0ce77b61f3fdb2f9 Mon Sep 17 00:00:00 2001
From: hmumtazz <144855436+hmumtazz@users.noreply.github.com>
Date: Thu, 5 Dec 2024 13:37:11 -0800
Subject: [PATCH 27/42] Update rag_setup.py to remove neural search line and
 serverless
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Removed references to serverless. Now the code only supports managed and open-source service types.
Removed the menu option for serverless.
For search methods, removed “neural” and only use “semantic” search.
Added a prompt to choose between semantic search with LLM and semantic search without LLM.
If semantic with LLM is chosen and the service type is managed, the code will prompt for LLM configuration.
If open-source is chosen, we skip AWS/Bedrock configurations and do not prompt for LLM registration since that requires AWS Bedrock.

Signed-off-by: hmumtazz <144855436+hmumtazz@users.noreply.github.com>
---
 .../ml_commons/rag_pipeline/rag/rag_setup.py  | 217 +++++++-----------
 1 file changed, 82 insertions(+), 135 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index 18abf94f..f61b13d2 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -1,9 +1,10 @@
 # SPDX-License-Identifier: Apache-2.0
+
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
-# Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
+# Any modifications Copyright OpenSearch Contributors.
+# See GitHub history for details.
 
 import boto3
 import botocore
@@ -21,8 +22,7 @@
 from colorama import Fore, Style, init
 
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import OpenSearchConnector
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless import Serverless  
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import AIConnectorHelper 
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import AIConnectorHelper
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register import ModelRegister
 
 # Initialize colorama for colored terminal output
@@ -32,12 +32,11 @@
 class Setup:
     """
     Handles the setup and configuration of the OpenSearch environment.
-    Manages AWS credentials, OpenSearch client initialization, index creation,
+    Manages AWS credentials (if managed), OpenSearch client initialization, index creation,
     and model registration.
     """
     
     CONFIG_FILE = 'config.ini'
-    SERVICE_AOSS = 'opensearchserverless'
     SERVICE_BEDROCK = 'bedrock-runtime'
 
     def __init__(self):
@@ -51,15 +50,12 @@ def __init__(self):
         self.collection_name = self.config.get('collection_name', '')
         self.opensearch_endpoint = self.config.get('opensearch_endpoint', '')
         self.service_type = self.config.get('service_type', 'managed')
-        self.is_serverless = self.service_type == 'serverless'
         self.opensearch_username = self.config.get('opensearch_username', '')
         self.opensearch_password = self.config.get('opensearch_password', '')
-        self.aoss_client = None
         self.bedrock_client = None
         self.opensearch_client = None
         self.opensearch_domain_name = self.get_opensearch_domain_name()
         self.model_register = None
-        self.serverless = None  # Will be initialized if service_type is 'serverless'
 
     def check_and_configure_aws(self):
         """
@@ -117,8 +113,6 @@ def configure_aws(self):
     def load_config(self) -> dict:
         """
         Load configuration from the config file.
-
-        :return: Dictionary of configuration parameters
         """
         config = configparser.ConfigParser()
         if os.path.exists(self.CONFIG_FILE):
@@ -129,9 +123,6 @@ def load_config(self) -> dict:
     def get_password_with_asterisks(self, prompt="Enter password: ") -> str:
         """
         Get password input from user, masking it with asterisks.
-
-        :param prompt: Prompt message
-        :return: Entered password as a string
         """
         if sys.platform == 'win32':
             import msvcrt
@@ -156,7 +147,6 @@ def get_password_with_asterisks(self, prompt="Enter password: ") -> str:
                     except UnicodeDecodeError:
                         continue
         else:
-            import termios, tty
             fd = sys.stdin.fileno()
             old_settings = termios.tcgetattr(fd)
             try:
@@ -187,44 +177,31 @@ def setup_configuration(self):
         """
         config = self.load_config()
 
-
-        # First, prompt for service type
+        # Prompt for service type
         print("\nChoose OpenSearch service type:")
-        print("1. Serverless")
-        print("2. Managed")
-        print("3. Open-source")
-        service_choice = input("Enter your choice (1-3): ").strip()
+        print("1. Managed")
+        print("2. Open-source")
+        service_choice = input("Enter your choice (1-2): ").strip()
 
         if service_choice == '1':
-            self.service_type = 'serverless'
-        elif service_choice == '2':
             self.service_type = 'managed'
-        elif service_choice == '3':
+        elif service_choice == '2':
             self.service_type = 'open-source'
         else:
             print(f"\n{Fore.YELLOW}Invalid choice. Defaulting to 'managed'.{Style.RESET_ALL}")
             self.service_type = 'managed'
 
         # Based on service type, prompt for different configurations
-        if self.service_type in ['serverless', 'managed']:
-            # For 'serverless' and 'managed', prompt for AWS credentials and related info
+        if self.service_type == 'managed':
             self.check_and_configure_aws()
-
             self.aws_region = input(f"\nEnter your AWS Region [{self.aws_region}]: ").strip() or self.aws_region
             self.iam_principal = input(f"Enter your IAM Principal ARN [{self.iam_principal}]: ").strip() or self.iam_principal
-
-            if self.service_type == 'serverless':
-                self.collection_name = input("\nEnter the name for your OpenSearch collection: ").strip()
-                self.opensearch_endpoint = None
-                self.opensearch_username = None
-                self.opensearch_password = None
-            elif self.service_type == 'managed':
-                self.opensearch_endpoint = input("\nEnter your OpenSearch domain endpoint: ").strip()
-                self.opensearch_username = input("Enter your OpenSearch username: ").strip()
-                self.opensearch_password = self.get_password_with_asterisks("Enter your OpenSearch password: ")
-                self.collection_name = ''
+            self.opensearch_endpoint = input("\nEnter your OpenSearch domain endpoint: ").strip()
+            self.opensearch_username = input("Enter your OpenSearch username: ").strip()
+            self.opensearch_password = self.get_password_with_asterisks("Enter your OpenSearch password: ")
+            self.collection_name = ''
         elif self.service_type == 'open-source':
-            # For 'open-source', skip AWS configurations
+            # For open-source, skip AWS configurations
             print("\n--- Open-source OpenSearch Setup ---")
             default_endpoint = 'https://localhost:9200'
             self.opensearch_endpoint = input(f"\nPress Enter to use the default endpoint (or type your custom endpoint) [{default_endpoint}]: ").strip() or default_endpoint
@@ -236,7 +213,7 @@ def setup_configuration(self):
                 self.opensearch_username = None
                 self.opensearch_password = None
             self.collection_name = ''
-            # For open-source, AWS region and IAM principal are not needed
+            # AWS region and IAM principal not needed
             self.aws_region = ''
             self.iam_principal = ''
 
@@ -252,23 +229,21 @@ def setup_configuration(self):
         }
 
         # Now, prompt for default search method
-        print("\nChoose the default search method:")
-        print("1. Neural Search")
-        print("2. Semantic Search")
+        # We only do semantic search now
+        print("\nSince we're only using semantic search, choose one:")
+        print("1. Semantic search WITH LLM")
+        print("2. Semantic search WITHOUT LLM")
         search_choice = input("Enter your choice (1-2): ").strip()
 
         if search_choice == '1':
-            default_search_method = 'neural'
-        elif search_choice == '2':
-            default_search_method = 'semantic'
+            default_search_method = 'semantic_with_llm'
         else:
-            print(f"\n{Fore.YELLOW}Invalid choice. Defaulting to 'neural'.{Style.RESET_ALL}")
-            default_search_method = 'neural'
+            default_search_method = 'semantic_no_llm'
 
         self.config['default_search_method'] = default_search_method
 
-        if default_search_method == 'semantic':
-            # Prompt the user to select an LLM model for semantic search
+        # If semantic with LLM chosen and we are in managed mode, prompt for LLM configuration
+        if default_search_method == 'semantic_with_llm' and self.service_type == 'managed':
             print("\nSelect an LLM model for semantic search:")
             available_models = [
                 ("amazon.titan-text-lite-v1", "Bedrock Titan Text Lite V1"),
@@ -319,6 +294,13 @@ def setup_configuration(self):
             self.config['llm_temperature'] = str(temperature)
             self.config['llm_top_p'] = str(topP)
             self.config['llm_stop_sequences'] = ','.join(stopSequences)
+        else:
+            # No LLM configurations needed
+            self.config['llm_model_id'] = ''
+            self.config['llm_max_token_count'] = ''
+            self.config['llm_temperature'] = ''
+            self.config['llm_top_p'] = ''
+            self.config['llm_stop_sequences'] = ''
 
         # Prompt for ingest pipeline name
         default_pipeline_name = 'text-chunking-ingest-pipeline'
@@ -333,53 +315,40 @@ def setup_configuration(self):
         self.save_config(self.config)
         print(f"\n{Fore.GREEN}Configuration saved successfully to {os.path.abspath(self.CONFIG_FILE)}.{Style.RESET_ALL}\n")
 
-
     def initialize_clients(self) -> bool:
         """
-        Initialize AWS clients (AOSS and Bedrock) only if not open-source.
-
-        :return: True if clients initialized successfully or open-source, False otherwise
+        Initialize AWS clients (Bedrock) only if managed. No AWS clients needed for open-source.
         """
         if self.service_type == 'open-source':
             return True  # No AWS clients needed
-
+        # Managed: Initialize Bedrock
         try:
             boto_config = Config(
                 region_name=self.aws_region,
                 signature_version='v4',
                 retries={'max_attempts': 10, 'mode': 'standard'}
             )
-            if self.is_serverless:
-                # Initialize AOSS client for serverless service
-                self.aoss_client = boto3.client(self.SERVICE_AOSS, config=boto_config)
-            # Initialize Bedrock client for managed or serverless services
-            self.bedrock_client = boto3.client(self.SERVICE_BEDROCK, region_name=self.aws_region)
-            
-            time.sleep(7)  # Wait for clients to initialize
-            print(f"{Fore.GREEN}AWS clients initialized successfully.{Style.RESET_ALL}\n")
+            self.bedrock_client = boto3.client(self.SERVICE_BEDROCK, region_name=self.aws_region, config=boto_config)
+            time.sleep(2)
+            print(f"{Fore.GREEN}AWS Bedrock client initialized successfully.{Style.RESET_ALL}\n")
             return True
         except Exception as e:
-            # Handle initialization errors
-            print(f"{Fore.RED}Failed to initialize AWS clients: {e}{Style.RESET_ALL}")
+            print(f"{Fore.RED}Failed to initialize AWS Bedrock client: {e}{Style.RESET_ALL}")
             return False
 
     def get_opensearch_domain_name(self) -> str:
         """
         Extract the domain name from the OpenSearch endpoint URL.
-
-        :return: Domain name if extraction is successful, None otherwise
         """
         if self.opensearch_endpoint:
             parsed_url = urlparse(self.opensearch_endpoint)
-            hostname = parsed_url.hostname  # e.g., 'search-your-domain-name-uniqueid.region.es.amazonaws.com'
-            if hostname:
-                # Split the hostname into parts
+            hostname = parsed_url.hostname
+            if hostname and 'amazonaws.com' in hostname:
+                # Attempt to parse a managed domain name
                 parts = hostname.split('.')
-                domain_part = parts[0]  # e.g., 'search-your-domain-name-uniqueid'
-                # Remove the 'search-' prefix if present
+                domain_part = parts[0]
                 if domain_part.startswith('search-'):
                     domain_part = domain_part[len('search-'):]
-                # Remove the unique ID suffix after the domain name
                 domain_name = domain_part.rsplit('-', 1)[0]
                 print(f"Extracted domain name: {domain_name}\n")
                 return domain_name
@@ -388,11 +357,7 @@ def get_opensearch_domain_name(self) -> str:
     @staticmethod
     def get_opensearch_domain_info(region: str, domain_name: str) -> tuple:
         """
-        Retrieve the OpenSearch domain endpoint and ARN based on the domain name and region.
-
-        :param region: AWS region
-        :param domain_name: Name of the OpenSearch domain
-        :return: Tuple of (domain_endpoint, domain_arn) if successful, (None, None) otherwise
+        Retrieve the OpenSearch domain endpoint and ARN for a managed domain.
         """
         try:
             client = boto3.client('opensearch', region_name=region)
@@ -405,12 +370,9 @@ def get_opensearch_domain_info(region: str, domain_name: str) -> tuple:
             print(f"{Fore.RED}Error retrieving OpenSearch domain info: {e}{Style.RESET_ALL}")
             return None, None
 
-# In Setup class, modify the initialize_opensearch_client method
     def initialize_opensearch_client(self) -> bool:
         """
         Initialize the OpenSearch client based on the service type and configuration.
-
-        :return: True if the client is initialized successfully, False otherwise.
         """
         if not self.opensearch_endpoint:
             print(f"{Fore.RED}OpenSearch endpoint not set. Please run setup first.{Style.RESET_ALL}\n")
@@ -418,13 +380,10 @@ def initialize_opensearch_client(self) -> bool:
 
         parsed_url = urlparse(self.opensearch_endpoint)
         host = parsed_url.hostname
-        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)  # Default ports
+        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200) 
 
-        # Determine the authentication method based on the service type
-        if self.service_type == 'serverless':
-            credentials = boto3.Session().get_credentials()
-            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
-        elif self.service_type == 'managed':
+        # Determine auth based on service type
+        if self.service_type == 'managed':
             if not self.opensearch_username or not self.opensearch_password:
                 print(f"{Fore.RED}OpenSearch username or password not set. Please run setup first.{Style.RESET_ALL}\n")
                 return False
@@ -433,39 +392,33 @@ def initialize_opensearch_client(self) -> bool:
             if self.opensearch_username and self.opensearch_password:
                 auth = (self.opensearch_username, self.opensearch_password)
             else:
-                auth = None  # No authentication
+                auth = None
         else:
             print("Invalid service type. Please check your configuration.")
             return False
 
-        # Determine SSL settings based on the endpoint scheme
         use_ssl = parsed_url.scheme == 'https'
-        verify_certs = True  # Always verify certificates unless you have a specific reason not to
+        verify_certs = True
 
         try:
-            # Initialize the OpenSearch client
             self.opensearch_client = OpenSearch(
                 hosts=[{'host': host, 'port': port}],
                 http_auth=auth,
                 use_ssl=use_ssl,
                 verify_certs=verify_certs,
-                ssl_show_warn=False,          # Suppress SSL warnings
-                # ssl_context=ssl_context,      # Not needed unless you have custom certificates
+                ssl_show_warn=False,
                 connection_class=RequestsHttpConnection,
                 pool_maxsize=20
             )
             print(f"{Fore.GREEN}Initialized OpenSearch client with host: {host} and port: {port}{Style.RESET_ALL}\n")
             return True
         except Exception as ex:
-            # Handle initialization errors
             print(f"{Fore.RED}Error initializing OpenSearch client: {ex}{Style.RESET_ALL}\n")
             return False
 
-
     def get_knn_index_details(self) -> tuple:
         """
-        Prompt user for KNN index details (embedding dimension, space type, ef_construction,
-        number of shards, number of replicas, and field names).
+        Prompt user for KNN index details.
         """
         dimension_input = input("Press Enter to use the default embedding size (768), or type a custom size: ").strip()
         if dimension_input == "":
@@ -493,7 +446,7 @@ def get_knn_index_details(self) -> tuple:
         elif space_choice == "3":
             space_type = "innerproduct"
         else:
-            print("Invalid choice. Using default space type of L2 (Euclidean distance).")
+            print("Invalid choice. Using default space type of L2.")
             space_type = "l2"
 
         print(f"Space type set to: {space_type}")
@@ -558,8 +511,6 @@ def get_knn_index_details(self) -> tuple:
     def save_config(self, config: dict):
         """
         Save configuration to the config file.
-
-        :param config: Dictionary of configuration parameters
         """
         parser = configparser.ConfigParser()
         parser['DEFAULT'] = config
@@ -574,14 +525,11 @@ def setup_command(self):
         # Begin setup by configuring necessary parameters
         self.setup_configuration()
 
-        if self.service_type != 'open-source' and not self.initialize_clients():
+        if self.service_type == 'managed' and not self.initialize_clients():
             print(f"\n{Fore.RED}Failed to initialize AWS clients. Setup incomplete.{Style.RESET_ALL}\n")
             return
 
-        if self.service_type == 'serverless':
-            # Serverless-specific setup can be added here if needed
-            pass
-        elif self.service_type == 'managed':
+        if self.service_type == 'managed':
             if not self.opensearch_endpoint:
                 print(f"\n{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n")
                 return
@@ -593,11 +541,10 @@ def setup_command(self):
                 print(f"\n{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n")
                 return
             else:
-                self.opensearch_domain_name = None  # Not required for open-source
+                self.opensearch_domain_name = None
 
         # Initialize OpenSearch client
         if self.initialize_opensearch_client():
-
             # Prompt user to choose between creating a new index or using an existing one
             print("Do you want to create a new KNN index or use an existing one?")
             print("1. Create a new KNN index")
@@ -605,10 +552,7 @@ def setup_command(self):
             index_choice = input("Enter your choice (1-2): ").strip()
 
             if index_choice == '1':
-                # Proceed to create a new index
                 self.index_name = input("\nEnter a name for your new KNN index in OpenSearch: ").strip()
-
-                # Save the index name in the configuration
                 self.config['index_name'] = self.index_name
                 self.save_config(self.config)
 
@@ -616,18 +560,16 @@ def setup_command(self):
                 embedding_dimension, space_type, ef_construction, number_of_shards, number_of_replicas, \
                 passage_text_field, passage_chunk_field, embedding_field = self.get_knn_index_details()
 
-                # Create an instance of OpenSearchConnector
                 self.opensearch_connector = OpenSearchConnector(self.config)
-                self.opensearch_connector.opensearch_client = self.opensearch_client  # Use the initialized client
-                self.opensearch_connector.index_name = self.index_name  # Set the index name
+                self.opensearch_connector.opensearch_client = self.opensearch_client
+                self.opensearch_connector.index_name = self.index_name
 
-                # Verify and create the index
                 if self.opensearch_connector.verify_and_create_index(
                     embedding_dimension, space_type, ef_construction, number_of_shards,
                     number_of_replicas, passage_text_field, passage_chunk_field, embedding_field
                 ):
                     print(f"\n{Fore.GREEN}KNN index '{self.index_name}' created successfully.{Style.RESET_ALL}\n")
-                    # Save index details to config
+                    # Save index details
                     self.config['embedding_dimension'] = str(embedding_dimension)
                     self.config['space_type'] = space_type
                     self.config['ef_construction'] = str(ef_construction)
@@ -641,7 +583,6 @@ def setup_command(self):
                     print(f"\n{Fore.RED}Index creation failed. Please check your permissions and try again.{Style.RESET_ALL}\n")
                     return
             elif index_choice == '2':
-                # Use existing index
                 existing_index_name = input("\nEnter the name of your existing KNN index: ").strip()
                 if not existing_index_name:
                     print(f"\n{Fore.RED}Index name cannot be empty. Aborting.{Style.RESET_ALL}\n")
@@ -662,18 +603,25 @@ def setup_command(self):
                         settings = index_info[self.index_name]['settings']['index']
                         mappings = index_info[self.index_name]['mappings']['properties']
 
-                        # Extract embedding dimension from the mapping
-                        embedding_field_mappings = mappings.get('passage_embedding', {})
-                        knn_mappings = embedding_field_mappings.get('properties', {}).get('knn', {})
-                        embedding_dimension = knn_mappings.get('dimension', 768)
-                        method = knn_mappings.get('method', {})
-                        space_type = method.get('space_type', 'l2')
-                        ef_construction = method.get('parameters', {}).get('ef_construction', 512)
+                        # Attempt to retrieve known fields
+                        # For simplicity, assume defaults if they don't exist
+                        embedding_field = 'passage_embedding'
+                        embedding_field_mappings = mappings.get(embedding_field, {})
+                        knn_mappings = embedding_field_mappings.get('method', {})
+                        # These values might not be perfectly retrievable depending on the index mapping
+                        # We'll do best-effort.
+                        embedding_dimension = 768
+                        space_type = 'l2'
+                        ef_construction = 512
+                        if 'method' in embedding_field_mappings:
+                            method = embedding_field_mappings['method']
+                            space_type = method.get('space_type', 'l2')
+                            ef_construction = method.get('parameters', {}).get('ef_construction', 512)
+
                         number_of_shards = settings.get('number_of_shards', '2')
                         number_of_replicas = settings.get('number_of_replicas', '2')
-                        passage_text_field = 'passage_text'  # Assuming default, or you can extract if stored differently
-                        passage_chunk_field = 'passage_chunk'  # Assuming default
-                        embedding_field = 'passage_embedding'  # Assuming default
+                        passage_text_field = 'passage_text'
+                        passage_chunk_field = 'passage_chunk'
 
                         print(f"\nUsing existing index '{self.index_name}' with the following settings:")
                         print(f"Embedding Dimension: {embedding_dimension}")
@@ -685,7 +633,7 @@ def setup_command(self):
                         print(f"Passage Chunk Field: '{passage_chunk_field}'")
                         print(f"Embedding Field: '{embedding_field}'\n")
 
-                        # Save index details to config
+                        # Save index details
                         self.config['embedding_dimension'] = str(embedding_dimension)
                         self.config['space_type'] = space_type
                         self.config['ef_construction'] = str(ef_construction)
@@ -700,21 +648,20 @@ def setup_command(self):
                     print(f"\n{Fore.RED}Error retrieving index details: {ex}{Style.RESET_ALL}\n")
                     return
 
-            # Proceed with model registration
-            # Initialize ModelRegister now that OpenSearch client and domain name are available
+            # Proceed with model registration if managed and semantic_with_llm
             self.model_register = ModelRegister(
                 self.config,
                 self.opensearch_client,
                 self.opensearch_domain_name
             )
 
-            # Model Registration
-            if self.service_type != 'open-source':
-                # AWS-managed OpenSearch: Proceed with model registration
+            if self.service_type == 'managed' and self.config['default_search_method'] == 'semantic_with_llm':
+                # Managed OpenSearch: Proceed with model registration for LLM
                 self.model_register.prompt_model_registration()
             else:
-                # Open-source OpenSearch: Provide instructions or automate model registration
-                self.model_register.prompt_opensource_model_registration()
+                # Open-source or semantic without LLM: no model registration needed
+                print(f"{Fore.GREEN}Setup complete. No LLM model registration required.{Style.RESET_ALL}")
+
         else:
             # Handle failure to initialize OpenSearch client
-            print(f"\n{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}\n")
\ No newline at end of file
+            print(f"\n{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}\n")

From 1ca4221d37a29fed0487b7844cb694b070fb6657 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Thu, 5 Dec 2024 14:25:30 -0800
Subject: [PATCH 28/42] Updated query.py to reflect search changes

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
index 20752d4b..1a899785 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
@@ -304,7 +304,7 @@ def query_command(self, queries: List[str], num_results: int = 5):
                     break
                 queries = [query_text]
 
-            if search_method == 'neural':
+            if search_method == 'semantic_no_llm':
                 # Proceed with neural search
                 results = self.bulk_query_neural(queries, k=num_results)
 
@@ -330,7 +330,7 @@ def query_command(self, queries: List[str], num_results: int = 5):
                             print("\nNo relevant sentences found.")
                     else:
                         print("\nNo documents found for this query.")
-            elif search_method == 'semantic':
+            elif search_method == 'semantic_with_llm':
                 # Proceed with semantic search
                 if not self.bedrock_client or not self.llm_model_id:
                     print(f"\n{Fore.RED}LLM model is not configured. Please run setup to select an LLM model.{Style.RESET_ALL}")

From 8b97791d4890e23e89ea06d90396c4b952d8ef06 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Thu, 5 Dec 2024 15:57:31 -0800
Subject: [PATCH 29/42] Missing innit file

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 opensearch_py_ml/ml_commons/rag_pipeline/__init__.py | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/__init__.py

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py b/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py
new file mode 100644
index 00000000..e69de29b

From fe6f8c58b600e5b78b3c1df115a26fd68eca7de9 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Thu, 5 Dec 2024 16:02:03 -0800
Subject: [PATCH 30/42] missing init file

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/ml_models/__init__.py             | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 create mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/__init__.py

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/__init__.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/__init__.py
new file mode 100644
index 00000000..e69de29b

From 34f7fd4eb4bb2be56e5d3de13772bf4cb6a8a616 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 6 Dec 2024 05:26:30 -0800
Subject: [PATCH 31/42] Fixed domain ARN/domain name error, changed directory,
 for IAM, SecretsHelper

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../{rag_pipeline/rag => }/IAMRoleHelper.py    |  0
 .../{rag_pipeline/rag => }/SecretsHelper.py    |  0
 .../rag_pipeline/rag/AIConnectorHelper.py      |  4 ++--
 .../rag_pipeline/rag/model_register.py         |  2 +-
 .../ml_commons/rag_pipeline/rag/rag_setup.py   | 18 ++++++++++++------
 tests/rag/test_IAMRoleHelper.py                |  2 +-
 ...est_SecretsHelper => test_SecretsHelper.py} |  2 +-
 7 files changed, 17 insertions(+), 11 deletions(-)
 rename opensearch_py_ml/ml_commons/{rag_pipeline/rag => }/IAMRoleHelper.py (100%)
 rename opensearch_py_ml/ml_commons/{rag_pipeline/rag => }/SecretsHelper.py (100%)
 rename tests/rag/{test_SecretsHelper => test_SecretsHelper.py} (98%)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py b/opensearch_py_ml/ml_commons/IAMRoleHelper.py
similarity index 100%
rename from opensearch_py_ml/ml_commons/rag_pipeline/rag/IAMRoleHelper.py
rename to opensearch_py_ml/ml_commons/IAMRoleHelper.py
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py b/opensearch_py_ml/ml_commons/SecretsHelper.py
similarity index 100%
rename from opensearch_py_ml/ml_commons/rag_pipeline/rag/SecretsHelper.py
rename to opensearch_py_ml/ml_commons/SecretsHelper.py
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
index e4074faf..0a0be872 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
@@ -14,8 +14,8 @@
 from opensearchpy import OpenSearch, RequestsHttpConnection
 from urllib.parse import urlparse
 
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper import IAMRoleHelper
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper import SecretHelper
+from opensearch_py_ml.ml_commons.IAMRoleHelper import IAMRoleHelper
+from opensearch_py_ml.ml_commons.SecretsHelper import SecretHelper
 from opensearch_py_ml.ml_commons.model_access_control import ModelAccessControl
 
 
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
index da21c62d..c442e98b 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
@@ -13,7 +13,7 @@
 from urllib.parse import urlparse
 from colorama import Fore, Style, init
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import AIConnectorHelper
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper import IAMRoleHelper
+from opensearch_py_ml.ml_commons.IAMRoleHelper import IAMRoleHelper
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.BedrockModel import BedrockModel
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.OpenAIModel import OpenAIModel
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.CohereModel import CohereModel
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index f61b13d2..f9207853 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -339,20 +339,26 @@ def initialize_clients(self) -> bool:
     def get_opensearch_domain_name(self) -> str:
         """
         Extract the domain name from the OpenSearch endpoint URL.
+
+        :return: Domain name if extraction is successful, None otherwise
         """
         if self.opensearch_endpoint:
             parsed_url = urlparse(self.opensearch_endpoint)
-            hostname = parsed_url.hostname
-            if hostname and 'amazonaws.com' in hostname:
-                # Attempt to parse a managed domain name
+            hostname = parsed_url.hostname  # e.g., 'search-your-domain-name-uniqueid.region.es.amazonaws.com'
+            if hostname:
+                # Split the hostname into parts
                 parts = hostname.split('.')
-                domain_part = parts[0]
+                domain_part = parts[0]  # e.g., 'search-your-domain-name-uniqueid'
+                # Remove the 'search-' prefix if present
                 if domain_part.startswith('search-'):
                     domain_part = domain_part[len('search-'):]
+                # Remove the unique ID suffix after the domain name
                 domain_name = domain_part.rsplit('-', 1)[0]
                 print(f"Extracted domain name: {domain_name}\n")
                 return domain_name
         return None
+    
+
 
     @staticmethod
     def get_opensearch_domain_info(region: str, domain_name: str) -> tuple:
@@ -465,9 +471,9 @@ def get_knn_index_details(self) -> tuple:
         print(f"ef_construction set to: {ef_construction}\n")
 
         # Prompt for number of shards
-        shards_input = input("\nEnter number of shards (Press Enter for default value 2): ").strip()
+        shards_input = input("\nEnter number of shards (Press Enter for default value 1): ").strip()
         if shards_input == "":
-            number_of_shards = 2
+            number_of_shards = 1
         else:
             try:
                 number_of_shards = int(shards_input)
diff --git a/tests/rag/test_IAMRoleHelper.py b/tests/rag/test_IAMRoleHelper.py
index 035a752d..a58fd933 100644
--- a/tests/rag/test_IAMRoleHelper.py
+++ b/tests/rag/test_IAMRoleHelper.py
@@ -29,7 +29,7 @@
 import logging
 
 # Assuming IAMRoleHelper is defined in iam_role_helper.py
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper import IAMRoleHelper  # Replace with the actual module path if different
+from opensearch_py_ml.ml_commons.IAMRoleHelper import IAMRoleHelper  # Replace with the actual module path if different
 
 class TestIAMRoleHelper(unittest.TestCase):
 
diff --git a/tests/rag/test_SecretsHelper b/tests/rag/test_SecretsHelper.py
similarity index 98%
rename from tests/rag/test_SecretsHelper
rename to tests/rag/test_SecretsHelper.py
index 0c077d41..cde69492 100644
--- a/tests/rag/test_SecretsHelper
+++ b/tests/rag/test_SecretsHelper.py
@@ -28,7 +28,7 @@
 import json
 import logging
 # Adjust the import path as necessary
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper import SecretHelper
+from opensearch_py_ml.ml_commons.SecretsHelper import SecretHelper
 
 class TestSecretHelper(unittest.TestCase):
     @classmethod

From 39a188396211500cbed34141939ed8d29fe9b459 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 6 Dec 2024 05:42:48 -0800
Subject: [PATCH 32/42] Updated AIConnectorHelper to use existing methods, like
 get task, and creating a connector

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../rag_pipeline/rag/AIConnectorHelper.py     | 99 +++++++------------
 1 file changed, 33 insertions(+), 66 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
index 0a0be872..9d795c52 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
@@ -17,6 +17,8 @@
 from opensearch_py_ml.ml_commons.IAMRoleHelper import IAMRoleHelper
 from opensearch_py_ml.ml_commons.SecretsHelper import SecretHelper
 from opensearch_py_ml.ml_commons.model_access_control import ModelAccessControl
+from opensearch_py_ml.ml_commons.ml_commons_client import MLCommonClient
+from opensearch_py_ml.ml_commons.model_connector import Connector
 
 
 class AIConnectorHelper:
@@ -74,15 +76,14 @@ def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
         )
 
         self.secret_helper = SecretHelper(self.region)
+        
+        # Initialize MLCommonClient for reuse of get_task_info
+        self.ml_commons_client = MLCommonClient(self.opensearch_client)
 
     @staticmethod
     def get_opensearch_domain_info(region, domain_name):
         """
         Retrieve the OpenSearch domain endpoint and ARN based on the domain name and region.
-
-        :param region: AWS region.
-        :param domain_name: Name of the OpenSearch domain.
-        :return: Tuple containing domain endpoint and ARN.
         """
         try:
             opensearch_client = boto3.client('opensearch', region_name=region)
@@ -98,9 +99,6 @@ def get_opensearch_domain_info(region, domain_name):
     def get_ml_auth(self, create_connector_role_name):
         """
         Obtain AWS4Auth credentials for ML API calls using the specified IAM role.
-
-        :param create_connector_role_name: Name of the IAM role to assume.
-        :return: AWS4Auth object with temporary credentials.
         """
         create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
         if not create_connector_role_arn:
@@ -119,14 +117,12 @@ def get_ml_auth(self, create_connector_role_name):
     def create_connector(self, create_connector_role_name, payload):
         """
         Create a connector in OpenSearch using the specified role and payload.
-
-        :param create_connector_role_name: Name of the IAM role to assume.
-        :param payload: Payload data for creating the connector.
-        :return: ID of the created connector.
+        Reusing create_standalone_connector from Connector class.
         """
+        # Assume role and create a temporary authenticated OS client
         create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
         temp_credentials = self.iam_helper.assume_role(create_connector_role_arn)
-        awsauth = AWS4Auth(
+        temp_awsauth = AWS4Auth(
             temp_credentials["AccessKeyId"],
             temp_credentials["SecretAccessKey"],
             self.region,
@@ -134,32 +130,35 @@ def create_connector(self, create_connector_role_name, payload):
             session_token=temp_credentials["SessionToken"],
         )
 
-        path = '/_plugins/_ml/connectors/_create'
-        url = self.opensearch_domain_url + path
+        parsed_url = urlparse(self.opensearch_domain_url)
+        host = parsed_url.hostname
+        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)
 
-        headers = {"Content-Type": "application/json"}
+        temp_os_client = OpenSearch(
+            hosts=[{'host': host, 'port': port}],
+            http_auth=temp_awsauth,
+            use_ssl=(parsed_url.scheme == 'https'),
+            verify_certs=True,
+            connection_class=RequestsHttpConnection
+        )
+
+        temp_connector = Connector(temp_os_client)
+        response = temp_connector.create_standalone_connector(payload)
 
-        response = requests.post(url, auth=awsauth, json=payload, headers=headers)
-        print(response.text)
-        connector_id = json.loads(response.text).get('connector_id')
+        print(response)
+        connector_id = response.get('connector_id')
         return connector_id
 
     def get_task(self, task_id, create_connector_role_name):
         """
         Retrieve the status of a specific task using its ID.
-
-        :param task_id: ID of the task to retrieve.
-        :param create_connector_role_name: Name of the IAM role to assume.
-        :return: Response from the task retrieval request.
+        Reusing the get_task_info method from MLCommonClient.
         """
         try:
-            awsauth = self.get_ml_auth(create_connector_role_name)
-            response = requests.get(
-                f'{self.opensearch_domain_url}/_plugins/_ml/tasks/{task_id}',
-                auth=awsauth
-            )
-            print("Get Task Response:", response.text)
-            return response
+            # No need to authenticate here again, ml_commons_client uses self.opensearch_client
+            task_response = self.ml_commons_client.get_task_info(task_id)
+            print("Get Task Response:", json.dumps(task_response))
+            return task_response
         except Exception as e:
             print(f"Error in get_task: {e}")
             raise
@@ -167,13 +166,6 @@ def get_task(self, task_id, create_connector_role_name):
     def create_model(self, model_name, description, connector_id, create_connector_role_name, deploy=True):
         """
         Create a new model in OpenSearch and optionally deploy it.
-
-        :param model_name: Name of the model to create.
-        :param description: Description of the model.
-        :param connector_id: ID of the connector to associate with the model.
-        :param create_connector_role_name: Name of the IAM role to assume.
-        :param deploy: Boolean indicating whether to deploy the model immediately.
-        :return: ID of the created model.
         """
         try:
             # Use ModelAccessControl methods directly without wrapping
@@ -215,12 +207,11 @@ def create_model(self, model_name, description, connector_id, create_connector_r
                 # Handle asynchronous task
                 time.sleep(2)  # Wait for task to complete
                 task_response = self.get_task(response_data['task_id'], create_connector_role_name)
-                print("Task Response:", task_response.text)
-                task_result = json.loads(task_response.text)
-                if 'model_id' in task_result:
-                    return task_result['model_id']
+                print("Task Response:", json.dumps(task_response))
+                if 'model_id' in task_response:
+                    return task_response['model_id']
                 else:
-                    raise KeyError(f"'model_id' not found in task response: {task_result}")
+                    raise KeyError(f"'model_id' not found in task response: {task_response}")
             elif 'error' in response_data:
                 raise Exception(f"Error creating model: {response_data['error']}")
             else:
@@ -232,9 +223,6 @@ def create_model(self, model_name, description, connector_id, create_connector_r
     def deploy_model(self, model_id):
         """
         Deploy a specified model in OpenSearch.
-
-        :param model_id: ID of the model to deploy.
-        :return: Response from the deployment request.
         """
         headers = {"Content-Type": "application/json"}
         response = requests.post(
@@ -248,10 +236,6 @@ def deploy_model(self, model_id):
     def predict(self, model_id, payload):
         """
         Make a prediction using the specified model and input payload.
-
-        :param model_id: ID of the model to use for prediction.
-        :param payload: Input data for prediction.
-        :return: Response from the prediction request.
         """
         headers = {"Content-Type": "application/json"}
         response = requests.post(
@@ -267,14 +251,6 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
                                      create_connector_input, sleep_time_in_seconds=10):
         """
         Create a connector in OpenSearch using a secret for credentials.
-
-        :param secret_name: Name of the secret to create or use.
-        :param secret_value: Value of the secret.
-        :param connector_role_name: Name of the IAM role for the connector.
-        :param create_connector_role_name: Name of the IAM role to assume for creating the connector.
-        :param create_connector_input: Input payload for creating the connector.
-        :param sleep_time_in_seconds: Time to wait for IAM role propagation.
-        :return: ID of the created connector.
         """
         # Step 1: Create Secret
         print('Step1: Create Secret')
@@ -380,7 +356,6 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
 
         # Step 4: Create connector
         print('Step 4: Create connector in OpenSearch')
-        # Wait to ensure IAM role propagation
         time.sleep(sleep_time_in_seconds)
         payload = create_connector_input
         payload['credential'] = {
@@ -395,13 +370,6 @@ def create_connector_with_role(self, connector_role_inline_policy, connector_rol
                                    create_connector_input, sleep_time_in_seconds=10):
         """
         Create a connector in OpenSearch using an IAM role for credentials.
-
-        :param connector_role_inline_policy: Inline policy for the connector IAM role.
-        :param connector_role_name: Name of the IAM role for the connector.
-        :param create_connector_role_name: Name of the IAM role to assume for creating the connector.
-        :param create_connector_input: Input payload for creating the connector.
-        :param sleep_time_in_seconds: Time to wait for IAM role propagation.
-        :return: ID of the created connector.
         """
         # Step 1: Create IAM role configured in connector
         trust_policy = {
@@ -485,7 +453,6 @@ def create_connector_with_role(self, connector_role_inline_policy, connector_rol
 
         # Step 3: Create connector
         print('Step 3: Create connector in OpenSearch')
-        # Wait to ensure IAM role propagation
         time.sleep(sleep_time_in_seconds)
         payload = create_connector_input
         payload['credential'] = {
@@ -493,4 +460,4 @@ def create_connector_with_role(self, connector_role_inline_policy, connector_rol
         }
         connector_id = self.create_connector(create_connector_role_name, payload)
         print('----------')
-        return connector_id
\ No newline at end of file
+        return connector_id

From 2dfa609d46c7dc360f2821bcbafbeb41b1b9102b Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 6 Dec 2024 06:44:55 -0800
Subject: [PATCH 33/42] Updated License Headers

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/__init__.py         |  6 ++++++
 .../ml_commons/rag_pipeline/rag/__init__.py     |  6 ++++++
 .../rag_pipeline/rag/ml_models/BedrockModel.py  | 17 -----------------
 .../rag_pipeline/rag/ml_models/CohereModel.py   | 16 ----------------
 .../rag/ml_models/HuggingFaceModel.py           | 17 -----------------
 .../rag_pipeline/rag/ml_models/OpenAIModel.py   | 17 -----------------
 .../rag_pipeline/rag/ml_models/PyTorchModel.py  | 17 -----------------
 .../rag/ml_models/SageMakerModel.py             | 17 -----------------
 .../rag_pipeline/rag/ml_models/__init__.py      |  6 ++++++
 .../ml_commons/rag_pipeline/rag/rag_setup.py    |  5 ++---
 tests/rag/test_AiConnectorClass.py              | 17 -----------------
 tests/rag/test_IAMRoleHelper.py                 | 17 -----------------
 tests/rag/test_Model_Register.py                | 17 -----------------
 tests/rag/test_SecretsHelper.py                 | 17 -----------------
 tests/rag/test_ingest.py                        | 17 -----------------
 tests/rag/test_ml_models/test_BedrockModel.py   | 16 ----------------
 tests/rag/test_ml_models/test_CohereModel.py    | 17 -----------------
 tests/rag/test_ml_models/test_OpenAIModel.py    | 16 ----------------
 tests/rag/test_ml_models/test_PyTorchModel.py   | 17 -----------------
 tests/rag/test_ml_models/test_SageMakerModel.py | 17 -----------------
 tests/rag/test_opensearch_connector.py          | 17 -----------------
 tests/rag/test_query.py                         | 16 ----------------
 tests/rag/test_rag.py                           | 16 ----------------
 tests/rag/test_rag_setup.py                     | 17 -----------------
 tests/rag/test_serverless.py                    | 16 ----------------
 25 files changed, 20 insertions(+), 354 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py b/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py
index e69de29b..43d9d3f4 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py
@@ -0,0 +1,6 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py
index e69de29b..43d9d3f4 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py
@@ -0,0 +1,6 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
index 3215273c..4b1b4ba4 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import json
 from colorama import Fore, Style
 
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
index 01c2d1dd..41c58a44 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
@@ -5,22 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
 import json
 from colorama import Fore, Style
 import time
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
index b1bda520..3bee6c5e 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
@@ -4,23 +4,6 @@
 # compatible open source license.
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
-
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
 import json
 from colorama import Fore, Style
 import time
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
index ed72eaa2..951e0f50 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
@@ -4,23 +4,6 @@
 # compatible open source license.
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
-
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
 import json
 from colorama import Fore, Style
 import time
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/PyTorchModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/PyTorchModel.py
index f5163629..4485d2c0 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/PyTorchModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/PyTorchModel.py
@@ -4,23 +4,6 @@
 # compatible open source license.
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
-
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
 import json
 from colorama import Fore, Style
 import os
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
index 2f7975ed..60252e66 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
@@ -4,23 +4,6 @@
 # compatible open source license.
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
-
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
 import json
 from colorama import Fore, Style
 
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/__init__.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/__init__.py
index e69de29b..43d9d3f4 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/__init__.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/__init__.py
@@ -0,0 +1,6 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index f9207853..d499ff64 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -1,10 +1,9 @@
 # SPDX-License-Identifier: Apache-2.0
-
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
-# Any modifications Copyright OpenSearch Contributors.
-# See GitHub history for details.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
 
 import boto3
 import botocore
diff --git a/tests/rag/test_AiConnectorClass.py b/tests/rag/test_AiConnectorClass.py
index 5ee3f420..db5d73dd 100644
--- a/tests/rag/test_AiConnectorClass.py
+++ b/tests/rag/test_AiConnectorClass.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import unittest
 from unittest.mock import patch, MagicMock
 import json
diff --git a/tests/rag/test_IAMRoleHelper.py b/tests/rag/test_IAMRoleHelper.py
index a58fd933..d2b18eff 100644
--- a/tests/rag/test_IAMRoleHelper.py
+++ b/tests/rag/test_IAMRoleHelper.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import unittest
 from unittest.mock import patch, MagicMock
 from botocore.exceptions import ClientError
diff --git a/tests/rag/test_Model_Register.py b/tests/rag/test_Model_Register.py
index 530149df..57b82deb 100644
--- a/tests/rag/test_Model_Register.py
+++ b/tests/rag/test_Model_Register.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import unittest
 from unittest.mock import patch, MagicMock, Mock
 import sys
diff --git a/tests/rag/test_SecretsHelper.py b/tests/rag/test_SecretsHelper.py
index cde69492..e349b53b 100644
--- a/tests/rag/test_SecretsHelper.py
+++ b/tests/rag/test_SecretsHelper.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import unittest
 from unittest.mock import patch, MagicMock
 from botocore.exceptions import ClientError
diff --git a/tests/rag/test_ingest.py b/tests/rag/test_ingest.py
index ac4c9f10..d47f4b30 100644
--- a/tests/rag/test_ingest.py
+++ b/tests/rag/test_ingest.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import unittest
 from unittest.mock import patch, MagicMock, mock_open
 import os
diff --git a/tests/rag/test_ml_models/test_BedrockModel.py b/tests/rag/test_ml_models/test_BedrockModel.py
index dd32704c..71dc8a21 100644
--- a/tests/rag/test_ml_models/test_BedrockModel.py
+++ b/tests/rag/test_ml_models/test_BedrockModel.py
@@ -5,22 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
 import unittest
 from unittest.mock import Mock, patch, call
 import json
diff --git a/tests/rag/test_ml_models/test_CohereModel.py b/tests/rag/test_ml_models/test_CohereModel.py
index 79b9f662..4e499090 100644
--- a/tests/rag/test_ml_models/test_CohereModel.py
+++ b/tests/rag/test_ml_models/test_CohereModel.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import unittest
 from unittest.mock import Mock, patch, call
 import json
diff --git a/tests/rag/test_ml_models/test_OpenAIModel.py b/tests/rag/test_ml_models/test_OpenAIModel.py
index 1dc6f6f7..0d225e3c 100644
--- a/tests/rag/test_ml_models/test_OpenAIModel.py
+++ b/tests/rag/test_ml_models/test_OpenAIModel.py
@@ -5,22 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
 import unittest
 from unittest.mock import Mock, patch, call
 import json
diff --git a/tests/rag/test_ml_models/test_PyTorchModel.py b/tests/rag/test_ml_models/test_PyTorchModel.py
index 6733315d..301f6259 100644
--- a/tests/rag/test_ml_models/test_PyTorchModel.py
+++ b/tests/rag/test_ml_models/test_PyTorchModel.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import unittest
 from unittest.mock import Mock, patch, call, mock_open
 import json
diff --git a/tests/rag/test_ml_models/test_SageMakerModel.py b/tests/rag/test_ml_models/test_SageMakerModel.py
index 46c880ad..f6443f4a 100644
--- a/tests/rag/test_ml_models/test_SageMakerModel.py
+++ b/tests/rag/test_ml_models/test_SageMakerModel.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import unittest
 from unittest.mock import Mock, patch, call
 import json
diff --git a/tests/rag/test_opensearch_connector.py b/tests/rag/test_opensearch_connector.py
index 25f5364f..331372a7 100644
--- a/tests/rag/test_opensearch_connector.py
+++ b/tests/rag/test_opensearch_connector.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import unittest
 from unittest.mock import patch, MagicMock, Mock
 from opensearchpy import OpenSearch, AWSV4SignerAuth, exceptions as opensearch_exceptions
diff --git a/tests/rag/test_query.py b/tests/rag/test_query.py
index d2e0cf99..55d3bcb3 100644
--- a/tests/rag/test_query.py
+++ b/tests/rag/test_query.py
@@ -5,22 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
 import unittest
 from unittest.mock import patch, MagicMock
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.query import Query
diff --git a/tests/rag/test_rag.py b/tests/rag/test_rag.py
index cf4c54d1..3b96f010 100644
--- a/tests/rag/test_rag.py
+++ b/tests/rag/test_rag.py
@@ -5,22 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
 import unittest
 from unittest.mock import patch, MagicMock, Mock
 import sys
diff --git a/tests/rag/test_rag_setup.py b/tests/rag/test_rag_setup.py
index 1cdc6b85..7ee990f9 100644
--- a/tests/rag/test_rag_setup.py
+++ b/tests/rag/test_rag_setup.py
@@ -5,23 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
 import unittest
 from unittest.mock import patch, MagicMock
 import os
diff --git a/tests/rag/test_serverless.py b/tests/rag/test_serverless.py
index e6d89608..1792484a 100644
--- a/tests/rag/test_serverless.py
+++ b/tests/rag/test_serverless.py
@@ -5,22 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-#  Licensed to Elasticsearch B.V. under one or more contributor
-#  license agreements. See the NOTICE file distributed with
-#  this work for additional information regarding copyright
-#  ownership. Elasticsearch B.V. licenses this file to you under
-#  the Apache License, Version 2.0 (the "License"); you may
-#  not use this file except in compliance with the License.
-#  You may obtain a copy of the License at
-#
-# 	http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
 import unittest
 from unittest.mock import patch, MagicMock, Mock
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless import Serverless

From 2c40ce01e709fd9cba941a7455bebc4e91db43fc Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 6 Dec 2024 21:11:02 -0800
Subject: [PATCH 34/42] Fixed UT, Ran Lint nox, fixed code and unused
 enviroment variable issues.

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 opensearch_py_ml/ml_commons/IAMRoleHelper.py  | 149 +++--
 opensearch_py_ml/ml_commons/SecretsHelper.py  |  29 +-
 .../ml_commons/rag_pipeline/__init__.py       |   9 +-
 .../rag_pipeline/rag/AIConnectorHelper.py     | 357 ++++++-----
 .../ml_commons/rag_pipeline/rag/__init__.py   |   9 +-
 .../rag_pipeline/rag/embedding_client.py      |  25 +-
 .../ml_commons/rag_pipeline/rag/ingest.py     | 156 ++---
 .../rag/ml_models/BedrockModel.py             |  70 ++-
 .../rag_pipeline/rag/ml_models/CohereModel.py | 190 +++---
 .../rag/ml_models/HuggingFaceModel.py         | 103 +--
 .../rag_pipeline/rag/ml_models/OpenAIModel.py | 194 +++---
 .../rag/ml_models/PyTorchModel.py             | 144 +++--
 .../rag/ml_models/SageMakerModel.py           |  64 +-
 .../rag_pipeline/rag/ml_models/__init__.py    |   9 +-
 .../rag_pipeline/rag/model_register.py        | 208 +++---
 .../rag_pipeline/rag/opensearch_connector.py  | 160 +++--
 .../ml_commons/rag_pipeline/rag/query.py      | 207 +++---
 .../ml_commons/rag_pipeline/rag/rag.py        |  85 +--
 .../ml_commons/rag_pipeline/rag/rag_setup.py  | 594 +++++++++++-------
 .../ml_commons/rag_pipeline/rag/serverless.py | 208 ++++--
 setup.py                                      |   7 +-
 tests/rag/test_AiConnectorClass.py            | 537 +++++++---------
 tests/rag/test_IAMRoleHelper.py               | 233 +++----
 tests/rag/test_Model_Register.py              | 238 ++++---
 tests/rag/test_SecretsHelper.py               | 117 ++--
 tests/rag/test_embedding_client.py            | 103 +++
 tests/rag/test_ingest.py                      | 244 +++----
 tests/rag/test_ml_models/test_BedrockModel.py |  76 ++-
 tests/rag/test_ml_models/test_CohereModel.py  | 121 ++--
 tests/rag/test_ml_models/test_OpenAIModel.py  | 121 ++--
 tests/rag/test_ml_models/test_PyTorchModel.py | 167 +++--
 .../rag/test_ml_models/test_SageMakerModel.py | 124 ++--
 tests/rag/test_opensearch_connector.py        | 248 +++++---
 tests/rag/test_query.py                       | 289 ++++-----
 tests/rag/test_rag.py                         | 127 ++--
 tests/rag/test_rag_setup.py                   | 296 ++++-----
 tests/rag/test_serverless.py                  | 216 ++++---
 37 files changed, 3678 insertions(+), 2556 deletions(-)
 create mode 100644 tests/rag/test_embedding_client.py

diff --git a/opensearch_py_ml/ml_commons/IAMRoleHelper.py b/opensearch_py_ml/ml_commons/IAMRoleHelper.py
index b4b5de90..53feb1a8 100644
--- a/opensearch_py_ml/ml_commons/IAMRoleHelper.py
+++ b/opensearch_py_ml/ml_commons/IAMRoleHelper.py
@@ -5,10 +5,11 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-import boto3
 import json
-from botocore.exceptions import ClientError
+
+import boto3
 import requests
+from botocore.exceptions import ClientError
 
 
 class IAMRoleHelper:
@@ -16,11 +17,19 @@ class IAMRoleHelper:
     Helper class for managing IAM roles and their interactions with OpenSearch.
     """
 
-    def __init__(self, region, opensearch_domain_url=None, opensearch_domain_username=None,
-                 opensearch_domain_password=None, aws_user_name=None, aws_role_name=None, opensearch_domain_arn=None):
+    def __init__(
+        self,
+        region,
+        opensearch_domain_url=None,
+        opensearch_domain_username=None,
+        opensearch_domain_password=None,
+        aws_user_name=None,
+        aws_role_name=None,
+        opensearch_domain_arn=None,
+    ):
         """
         Initialize the IAMRoleHelper with AWS and OpenSearch configurations.
-        
+
         :param region: AWS region.
         :param opensearch_domain_url: URL of the OpenSearch domain.
         :param opensearch_domain_username: Username for OpenSearch domain authentication.
@@ -40,17 +49,17 @@ def __init__(self, region, opensearch_domain_url=None, opensearch_domain_usernam
     def role_exists(self, role_name):
         """
         Check if an IAM role exists.
-        
+
         :param role_name: Name of the IAM role.
         :return: True if the role exists, False otherwise.
         """
-        iam_client = boto3.client('iam')
+        iam_client = boto3.client("iam")
 
         try:
             iam_client.get_role(RoleName=role_name)
             return True
         except ClientError as e:
-            if e.response['Error']['Code'] == 'NoSuchEntity':
+            if e.response["Error"]["Code"] == "NoSuchEntity":
                 return False
             else:
                 print(f"An error occurred: {e}")
@@ -59,64 +68,72 @@ def role_exists(self, role_name):
     def delete_role(self, role_name):
         """
         Delete an IAM role along with its attached policies.
-        
+
         :param role_name: Name of the IAM role to delete.
         """
-        iam_client = boto3.client('iam')
+        iam_client = boto3.client("iam")
 
         try:
             # Detach managed policies from the role
-            policies = iam_client.list_attached_role_policies(RoleName=role_name)['AttachedPolicies']
+            policies = iam_client.list_attached_role_policies(RoleName=role_name)[
+                "AttachedPolicies"
+            ]
             for policy in policies:
-                iam_client.detach_role_policy(RoleName=role_name, PolicyArn=policy['PolicyArn'])
-            print(f'All managed policies detached from role {role_name}.')
+                iam_client.detach_role_policy(
+                    RoleName=role_name, PolicyArn=policy["PolicyArn"]
+                )
+            print(f"All managed policies detached from role {role_name}.")
 
             # Delete inline policies associated with the role
-            inline_policies = iam_client.list_role_policies(RoleName=role_name)['PolicyNames']
+            inline_policies = iam_client.list_role_policies(RoleName=role_name)[
+                "PolicyNames"
+            ]
             for policy_name in inline_policies:
-                iam_client.delete_role_policy(RoleName=role_name, PolicyName=policy_name)
-            print(f'All inline policies deleted from role {role_name}.')
+                iam_client.delete_role_policy(
+                    RoleName=role_name, PolicyName=policy_name
+                )
+            print(f"All inline policies deleted from role {role_name}.")
 
             # Finally, delete the IAM role
             iam_client.delete_role(RoleName=role_name)
-            print(f'Role {role_name} deleted.')
+            print(f"Role {role_name} deleted.")
 
         except ClientError as e:
-            if e.response['Error']['Code'] == 'NoSuchEntity':
-                print(f'Role {role_name} does not exist.')
+            if e.response["Error"]["Code"] == "NoSuchEntity":
+                print(f"Role {role_name} does not exist.")
             else:
                 print(f"An error occurred: {e}")
 
     def create_iam_role(self, role_name, trust_policy_json, inline_policy_json):
         """
         Create a new IAM role with specified trust and inline policies.
-        
+
         :param role_name: Name of the IAM role to create.
         :param trust_policy_json: Trust policy document in JSON format.
         :param inline_policy_json: Inline policy document in JSON format.
         :return: ARN of the created role or None if creation failed.
         """
-        iam_client = boto3.client('iam')
+        iam_client = boto3.client("iam")
 
         try:
             # Create the role with the provided trust policy
             create_role_response = iam_client.create_role(
                 RoleName=role_name,
                 AssumeRolePolicyDocument=json.dumps(trust_policy_json),
-                Description='Role with custom trust and inline policies',
+                Description="Role with custom trust and inline policies",
             )
 
             # Retrieve the ARN of the newly created role
-            role_arn = create_role_response['Role']['Arn']
+            role_arn = create_role_response["Role"]["Arn"]
 
             # Attach the inline policy to the role
             iam_client.put_role_policy(
                 RoleName=role_name,
-                PolicyName='InlinePolicy',  # Replace with preferred policy name if needed
-                PolicyDocument=json.dumps(inline_policy_json)
+                PolicyName="InlinePolicy",  # Replace with preferred policy name if needed
+                PolicyDocument=json.dumps(inline_policy_json),
             )
 
-            print(f'Created role: {role_name}')
+            print(f"Created role: {role_name}")
             return role_arn
 
         except ClientError as e:
@@ -126,18 +143,18 @@ def create_iam_role(self, role_name, trust_policy_json, inline_policy_json):
     def get_role_arn(self, role_name):
         """
         Retrieve the ARN of an IAM role.
-        
+
         :param role_name: Name of the IAM role.
         :return: ARN of the role or None if not found.
         """
         if not role_name:
             return None
-        iam_client = boto3.client('iam')
+        iam_client = boto3.client("iam")
         try:
             response = iam_client.get_role(RoleName=role_name)
-            return response['Role']['Arn']
+            return response["Role"]["Arn"]
         except ClientError as e:
-            if e.response['Error']['Code'] == 'NoSuchEntity':
+            if e.response["Error"]["Code"] == "NoSuchEntity":
                 print(f"The requested role {role_name} does not exist")
                 return None
             else:
@@ -147,54 +164,64 @@ def get_role_arn(self, role_name):
     def get_role_details(self, role_name):
         """
         Print detailed information about an IAM role.
-        
+
         :param role_name: Name of the IAM role.
         """
-        iam = boto3.client('iam')
+        iam = boto3.client("iam")
 
         try:
             response = iam.get_role(RoleName=role_name)
-            role = response['Role']
+            role = response["Role"]
 
             print(f"Role Name: {role['RoleName']}")
             print(f"Role ID: {role['RoleId']}")
             print(f"ARN: {role['Arn']}")
             print(f"Creation Date: {role['CreateDate']}")
             print("Assume Role Policy Document:")
-            print(json.dumps(role['AssumeRolePolicyDocument'], indent=4, sort_keys=True))
+            print(
+                json.dumps(role["AssumeRolePolicyDocument"], indent=4, sort_keys=True)
+            )
 
             # List and print all inline policies attached to the role
             list_role_policies_response = iam.list_role_policies(RoleName=role_name)
 
-            for policy_name in list_role_policies_response['PolicyNames']:
-                get_role_policy_response = iam.get_role_policy(RoleName=role_name, PolicyName=policy_name)
+            for policy_name in list_role_policies_response["PolicyNames"]:
+                get_role_policy_response = iam.get_role_policy(
+                    RoleName=role_name, PolicyName=policy_name
+                )
                 print(f"Role Policy Name: {get_role_policy_response['PolicyName']}")
                 print("Role Policy Document:")
-                print(json.dumps(get_role_policy_response['PolicyDocument'], indent=4, sort_keys=True))
+                print(
+                    json.dumps(
+                        get_role_policy_response["PolicyDocument"],
+                        indent=4,
+                        sort_keys=True,
+                    )
+                )
 
         except ClientError as e:
-            if e.response['Error']['Code'] == 'NoSuchEntity':
-                print(f'Role {role_name} does not exist.')
+            if e.response["Error"]["Code"] == "NoSuchEntity":
+                print(f"Role {role_name} does not exist.")
             else:
                 print(f"An error occurred: {e}")
 
     def get_user_arn(self, username):
         """
         Retrieve the ARN of an IAM user.
-        
+
         :param username: Name of the IAM user.
         :return: ARN of the user or None if not found.
         """
         if not username:
             return None
-        iam_client = boto3.client('iam')
+        iam_client = boto3.client("iam")
 
         try:
             response = iam_client.get_user(UserName=username)
-            user_arn = response['User']['Arn']
+            user_arn = response["User"]["Arn"]
             return user_arn
         except ClientError as e:
-            if e.response['Error']['Code'] == 'NoSuchEntity':
+            if e.response["Error"]["Code"] == "NoSuchEntity":
                 print(f"IAM user '{username}' not found.")
                 return None
             else:
@@ -204,12 +231,12 @@ def get_user_arn(self, username):
     def assume_role(self, role_arn, role_session_name="your_session_name"):
         """
         Assume an IAM role and obtain temporary security credentials.
-        
+
         :param role_arn: ARN of the IAM role to assume.
         :param role_session_name: Identifier for the assumed role session.
         :return: Temporary security credentials or None if the operation fails.
         """
-        sts_client = boto3.client('sts')
+        sts_client = boto3.client("sts")
 
         try:
             assumed_role_object = sts_client.assume_role(
@@ -228,16 +255,16 @@ def assume_role(self, role_arn, role_session_name="your_session_name"):
     def map_iam_role_to_backend_role(self, iam_role_arn):
         """
         Map an IAM role to an OpenSearch backend role for access control.
-        
+
         :param iam_role_arn: ARN of the IAM role to map.
         """
-        os_security_role = 'ml_full_access'  # Defines the OpenSearch security role to map to
-        url = f'{self.opensearch_domain_url}/_plugins/_security/api/rolesmapping/{os_security_role}'
+        os_security_role = (
+            "ml_full_access"  # Defines the OpenSearch security role to map to
+        )
+        url = f"{self.opensearch_domain_url}/_plugins/_security/api/rolesmapping/{os_security_role}"
 
-        payload = {
-            "backend_roles": [iam_role_arn]
-        }
-        headers = {'Content-Type': 'application/json'}
+        payload = {"backend_roles": [iam_role_arn]}
+        headers = {"Content-Type": "application/json"}
 
         try:
             response = requests.put(
@@ -245,13 +272,17 @@ def map_iam_role_to_backend_role(self, iam_role_arn):
                 auth=(self.opensearch_domain_username, self.opensearch_domain_password),
                 json=payload,
                 headers=headers,
-                verify=True
+                verify=True,
             )
 
             if response.status_code == 200:
-                print(f"Successfully mapped IAM role to OpenSearch role '{os_security_role}'.")
+                print(
+                    f"Successfully mapped IAM role to OpenSearch role '{os_security_role}'."
+                )
             else:
-                print(f"Failed to map IAM role to OpenSearch role '{os_security_role}'. Status code: {response.status_code}")
+                print(
+                    f"Failed to map IAM role to OpenSearch role '{os_security_role}'. Status code: {response.status_code}"
+                )
                 print(f"Response: {response.text}")
         except requests.exceptions.RequestException as e:
             print(f"HTTP request failed: {e}")
@@ -259,12 +290,12 @@ def map_iam_role_to_backend_role(self, iam_role_arn):
     def get_iam_user_name_from_arn(self, iam_principal_arn):
         """
         Extract the IAM user name from an IAM principal ARN.
-        
+
         :param iam_principal_arn: ARN of the IAM principal.
         :return: IAM user name or None if extraction fails.
         """
         # IAM user ARN format: arn:aws:iam::123456789012:user/user-name
-        if iam_principal_arn and ':user/' in iam_principal_arn:
-            return iam_principal_arn.split(':user/')[-1]
+        if iam_principal_arn and ":user/" in iam_principal_arn:
+            return iam_principal_arn.split(":user/")[-1]
         else:
-            return None
\ No newline at end of file
+            return None
diff --git a/opensearch_py_ml/ml_commons/SecretsHelper.py b/opensearch_py_ml/ml_commons/SecretsHelper.py
index c675c12c..bd3303e0 100644
--- a/opensearch_py_ml/ml_commons/SecretsHelper.py
+++ b/opensearch_py_ml/ml_commons/SecretsHelper.py
@@ -5,9 +5,10 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
+import json
 import logging
+
 import boto3
-import json
 from botocore.exceptions import ClientError
 
 # Configure the logger for this module
@@ -36,14 +37,14 @@ def secret_exists(self, secret_name: str) -> bool:
         :return: True if the secret exists, False otherwise.
         """
         # Initialize the Secrets Manager client
-        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+        secretsmanager = boto3.client("secretsmanager", region_name=self.region)
         try:
             # Attempt to retrieve the secret value
             secretsmanager.get_secret_value(SecretId=secret_name)
             return True
         except ClientError as e:
             # If the secret does not exist, return False
-            if e.response['Error']['Code'] == 'ResourceNotFoundException':
+            if e.response["Error"]["Code"] == "ResourceNotFoundException":
                 return False
             else:
                 # Log other client errors and return False
@@ -58,14 +59,14 @@ def get_secret_arn(self, secret_name: str) -> str:
         :return: ARN of the secret if found, None otherwise.
         """
         # Initialize the Secrets Manager client
-        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+        secretsmanager = boto3.client("secretsmanager", region_name=self.region)
         try:
             # Describe the secret to get its details
             response = secretsmanager.describe_secret(SecretId=secret_name)
-            return response['ARN']
+            return response["ARN"]
         except ClientError as e:
             # Handle the case where the secret does not exist
-            if e.response['Error']['Code'] == 'ResourceNotFoundException':
+            if e.response["Error"]["Code"] == "ResourceNotFoundException":
                 logger.warning(f"The requested secret {secret_name} was not found")
                 return None
             else:
@@ -81,14 +82,14 @@ def get_secret(self, secret_name: str) -> str:
         :return: Secret value as a string if found, None otherwise.
         """
         # Initialize the Secrets Manager client
-        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+        secretsmanager = boto3.client("secretsmanager", region_name=self.region)
         try:
             # Get the secret value
             response = secretsmanager.get_secret_value(SecretId=secret_name)
-            return response.get('SecretString')
+            return response.get("SecretString")
         except ClientError as e:
             # Handle the case where the secret does not exist
-            if e.response['Error']['Code'] == 'ResourceNotFoundException':
+            if e.response["Error"]["Code"] == "ResourceNotFoundException":
                 logger.warning("The requested secret was not found")
                 return None
             else:
@@ -105,7 +106,7 @@ def create_secret(self, secret_name: str, secret_value: dict) -> str:
         :return: ARN of the created secret if successful, None otherwise.
         """
         # Initialize the Secrets Manager client
-        secretsmanager = boto3.client('secretsmanager', region_name=self.region)
+        secretsmanager = boto3.client("secretsmanager", region_name=self.region)
         try:
             # Create the secret with the provided name and value
             response = secretsmanager.create_secret(
@@ -113,9 +114,9 @@ def create_secret(self, secret_name: str, secret_value: dict) -> str:
                 SecretString=json.dumps(secret_value),
             )
             # Log success and return the secret's ARN
-            logger.info(f'Secret {secret_name} created successfully.')
-            return response['ARN']
+            logger.info(f"Secret {secret_name} created successfully.")
+            return response["ARN"]
         except ClientError as e:
             # Log errors during secret creation and return None
-            logger.error(f'Error creating secret: {e}')
-            return None
\ No newline at end of file
+            logger.error(f"Error creating secret: {e}")
+            return None
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py b/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py
index 43d9d3f4..3a3fa0f8 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py
@@ -3,4 +3,11 @@
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
 # Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
\ No newline at end of file
+# GitHub history for details.
+
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
index 9d795c52..8d3d93de 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
@@ -5,20 +5,21 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-import boto3
 import json
+import time
+from urllib.parse import urlparse
+
+import boto3
 import requests
+from opensearchpy import OpenSearch, RequestsHttpConnection
 from requests.auth import HTTPBasicAuth
 from requests_aws4auth import AWS4Auth
-import time
-from opensearchpy import OpenSearch, RequestsHttpConnection
-from urllib.parse import urlparse
 
 from opensearch_py_ml.ml_commons.IAMRoleHelper import IAMRoleHelper
-from opensearch_py_ml.ml_commons.SecretsHelper import SecretHelper
-from opensearch_py_ml.ml_commons.model_access_control import ModelAccessControl
 from opensearch_py_ml.ml_commons.ml_commons_client import MLCommonClient
+from opensearch_py_ml.ml_commons.model_access_control import ModelAccessControl
 from opensearch_py_ml.ml_commons.model_connector import Connector
+from opensearch_py_ml.ml_commons.SecretsHelper import SecretHelper
 
 
 class AIConnectorHelper:
@@ -26,8 +27,16 @@ class AIConnectorHelper:
     Helper class for managing AI connectors and models in OpenSearch.
     """
 
-    def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
-                 opensearch_domain_password, aws_user_name, aws_role_name, opensearch_domain_url):
+    def __init__(
+        self,
+        region,
+        opensearch_domain_name,
+        opensearch_domain_username,
+        opensearch_domain_password,
+        aws_user_name,
+        aws_role_name,
+        opensearch_domain_url,
+    ):
         """
         Initialize the AIConnectorHelper with necessary AWS and OpenSearch configurations.
         """
@@ -40,7 +49,9 @@ def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
         self.opensearch_domain_url = opensearch_domain_url
 
         # Retrieve OpenSearch domain information
-        domain_endpoint, domain_arn = self.get_opensearch_domain_info(self.region, self.opensearch_domain_name)
+        domain_endpoint, domain_arn = self.get_opensearch_domain_info(
+            self.region, self.opensearch_domain_name
+        )
         if domain_arn:
             self.opensearch_domain_arn = domain_arn
         else:
@@ -50,15 +61,18 @@ def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
         # Parse the OpenSearch domain URL to extract host and port
         parsed_url = urlparse(self.opensearch_domain_url)
         host = parsed_url.hostname
-        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)
+        port = parsed_url.port or (443 if parsed_url.scheme == "https" else 9200)
 
         # Initialize OpenSearch client
         self.opensearch_client = OpenSearch(
-            hosts=[{'host': host, 'port': port}],
-            http_auth=(self.opensearch_domain_username, self.opensearch_domain_password),
-            use_ssl=(parsed_url.scheme == 'https'),
+            hosts=[{"host": host, "port": port}],
+            http_auth=(
+                self.opensearch_domain_username,
+                self.opensearch_domain_password,
+            ),
+            use_ssl=(parsed_url.scheme == "https"),
             verify_certs=True,
-            connection_class=RequestsHttpConnection
+            connection_class=RequestsHttpConnection,
         )
 
         # Initialize ModelAccessControl for managing model groups
@@ -72,11 +86,11 @@ def __init__(self, region, opensearch_domain_name, opensearch_domain_username,
             opensearch_domain_password=self.opensearch_domain_password,
             aws_user_name=self.aws_user_name,
             aws_role_name=self.aws_role_name,
-            opensearch_domain_arn=self.opensearch_domain_arn
+            opensearch_domain_arn=self.opensearch_domain_arn,
         )
 
         self.secret_helper = SecretHelper(self.region)
-        
+
         # Initialize MLCommonClient for reuse of get_task_info
         self.ml_commons_client = MLCommonClient(self.opensearch_client)
 
@@ -86,11 +100,11 @@ def get_opensearch_domain_info(region, domain_name):
         Retrieve the OpenSearch domain endpoint and ARN based on the domain name and region.
         """
         try:
-            opensearch_client = boto3.client('opensearch', region_name=region)
+            opensearch_client = boto3.client("opensearch", region_name=region)
             response = opensearch_client.describe_domain(DomainName=domain_name)
-            domain_status = response['DomainStatus']
-            domain_endpoint = domain_status.get('Endpoint')
-            domain_arn = domain_status['ARN']
+            domain_status = response["DomainStatus"]
+            domain_endpoint = domain_status.get("Endpoint")
+            domain_arn = domain_status["ARN"]
             return domain_endpoint, domain_arn
         except Exception as e:
             print(f"Error retrieving OpenSearch domain info: {e}")
@@ -100,7 +114,9 @@ def get_ml_auth(self, create_connector_role_name):
         """
         Obtain AWS4Auth credentials for ML API calls using the specified IAM role.
         """
-        create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
+        create_connector_role_arn = self.iam_helper.get_role_arn(
+            create_connector_role_name
+        )
         if not create_connector_role_arn:
             raise Exception(f"IAM role '{create_connector_role_name}' not found.")
 
@@ -109,7 +125,7 @@ def get_ml_auth(self, create_connector_role_name):
             temp_credentials["AccessKeyId"],
             temp_credentials["SecretAccessKey"],
             self.region,
-            'es',
+            "es",
             session_token=temp_credentials["SessionToken"],
         )
         return awsauth
@@ -120,33 +136,35 @@ def create_connector(self, create_connector_role_name, payload):
         Reusing create_standalone_connector from Connector class.
         """
         # Assume role and create a temporary authenticated OS client
-        create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
+        create_connector_role_arn = self.iam_helper.get_role_arn(
+            create_connector_role_name
+        )
         temp_credentials = self.iam_helper.assume_role(create_connector_role_arn)
         temp_awsauth = AWS4Auth(
             temp_credentials["AccessKeyId"],
             temp_credentials["SecretAccessKey"],
             self.region,
-            'es',
+            "es",
             session_token=temp_credentials["SessionToken"],
         )
 
         parsed_url = urlparse(self.opensearch_domain_url)
         host = parsed_url.hostname
-        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)
+        port = parsed_url.port or (443 if parsed_url.scheme == "https" else 9200)
 
         temp_os_client = OpenSearch(
-            hosts=[{'host': host, 'port': port}],
+            hosts=[{"host": host, "port": port}],
             http_auth=temp_awsauth,
-            use_ssl=(parsed_url.scheme == 'https'),
+            use_ssl=(parsed_url.scheme == "https"),
             verify_certs=True,
-            connection_class=RequestsHttpConnection
+            connection_class=RequestsHttpConnection,
         )
 
         temp_connector = Connector(temp_os_client)
         response = temp_connector.create_standalone_connector(payload)
 
         print(response)
-        connector_id = response.get('connector_id')
+        connector_id = response.get("connector_id")
         return connector_id
 
     def get_task(self, task_id, create_connector_role_name):
@@ -163,19 +181,29 @@ def get_task(self, task_id, create_connector_role_name):
             print(f"Error in get_task: {e}")
             raise
 
-    def create_model(self, model_name, description, connector_id, create_connector_role_name, deploy=True):
+    def create_model(
+        self,
+        model_name,
+        description,
+        connector_id,
+        create_connector_role_name,
+        deploy=True,
+    ):
         """
         Create a new model in OpenSearch and optionally deploy it.
         """
         try:
             # Use ModelAccessControl methods directly without wrapping
-            model_group_id = self.model_access_control.get_model_group_id_by_name(model_name)
+            model_group_id = self.model_access_control.get_model_group_id_by_name(
+                model_name
+            )
             if not model_group_id:
                 self.model_access_control.register_model_group(
-                    name=model_name,
-                    description=description
+                    name=model_name, description=description
+                )
+                model_group_id = self.model_access_control.get_model_group_id_by_name(
+                    model_name
                 )
-                model_group_id = self.model_access_control.get_model_group_id_by_name(model_name)
                 if not model_group_id:
                     raise Exception("Failed to create model group.")
 
@@ -184,7 +212,7 @@ def create_model(self, model_name, description, connector_id, create_connector_r
                 "function_name": "remote",
                 "description": description,
                 "model_group_id": model_group_id,
-                "connector_id": connector_id
+                "connector_id": connector_id,
             }
             headers = {"Content-Type": "application/json"}
             deploy_str = str(deploy).lower()
@@ -192,30 +220,36 @@ def create_model(self, model_name, description, connector_id, create_connector_r
             awsauth = self.get_ml_auth(create_connector_role_name)
 
             response = requests.post(
-                f'{self.opensearch_domain_url}/_plugins/_ml/models/_register?deploy={deploy_str}',
+                f"{self.opensearch_domain_url}/_plugins/_ml/models/_register?deploy={deploy_str}",
                 auth=awsauth,
                 json=payload,
-                headers=headers
+                headers=headers,
             )
 
             print("Create Model Response:", response.text)
             response_data = json.loads(response.text)
 
-            if 'model_id' in response_data:
-                return response_data['model_id']
-            elif 'task_id' in response_data:
+            if "model_id" in response_data:
+                return response_data["model_id"]
+            elif "task_id" in response_data:
                 # Handle asynchronous task
                 time.sleep(2)  # Wait for task to complete
-                task_response = self.get_task(response_data['task_id'], create_connector_role_name)
+                task_response = self.get_task(
+                    response_data["task_id"], create_connector_role_name
+                )
                 print("Task Response:", json.dumps(task_response))
-                if 'model_id' in task_response:
-                    return task_response['model_id']
+                if "model_id" in task_response:
+                    return task_response["model_id"]
                 else:
-                    raise KeyError(f"'model_id' not found in task response: {task_response}")
-            elif 'error' in response_data:
+                    raise KeyError(
+                        f"'model_id' not found in task response: {task_response}"
+                    )
+            elif "error" in response_data:
                 raise Exception(f"Error creating model: {response_data['error']}")
             else:
-                raise KeyError(f"The response does not contain 'model_id' or 'task_id'. Response content: {response_data}")
+                raise KeyError(
+                    f"The response does not contain 'model_id' or 'task_id'. Response content: {response_data}"
+                )
         except Exception as e:
             print(f"Error in create_model: {e}")
             raise
@@ -226,9 +260,11 @@ def deploy_model(self, model_id):
         """
         headers = {"Content-Type": "application/json"}
         response = requests.post(
-            f'{self.opensearch_domain_url}/_plugins/_ml/models/{model_id}/_deploy',
-            auth=HTTPBasicAuth(self.opensearch_domain_username, self.opensearch_domain_password),
-            headers=headers
+            f"{self.opensearch_domain_url}/_plugins/_ml/models/{model_id}/_deploy",
+            auth=HTTPBasicAuth(
+                self.opensearch_domain_username, self.opensearch_domain_password
+            ),
+            headers=headers,
         )
         print(f"Deploy Model Response: {response.text}")
         return response
@@ -239,27 +275,36 @@ def predict(self, model_id, payload):
         """
         headers = {"Content-Type": "application/json"}
         response = requests.post(
-            f'{self.opensearch_domain_url}/_plugins/_ml/models/{model_id}/_predict',
-            auth=HTTPBasicAuth(self.opensearch_domain_username, self.opensearch_domain_password),
+            f"{self.opensearch_domain_url}/_plugins/_ml/models/{model_id}/_predict",
+            auth=HTTPBasicAuth(
+                self.opensearch_domain_username, self.opensearch_domain_password
+            ),
             json=payload,
-            headers=headers
+            headers=headers,
         )
         print("Predict Response:", response.text)
         return response
 
-    def create_connector_with_secret(self, secret_name, secret_value, connector_role_name, create_connector_role_name,
-                                     create_connector_input, sleep_time_in_seconds=10):
+    def create_connector_with_secret(
+        self,
+        secret_name,
+        secret_value,
+        connector_role_name,
+        create_connector_role_name,
+        create_connector_input,
+        sleep_time_in_seconds=10,
+    ):
         """
         Create a connector in OpenSearch using a secret for credentials.
         """
         # Step 1: Create Secret
-        print('Step1: Create Secret')
+        print("Step1: Create Secret")
         if not self.secret_helper.secret_exists(secret_name):
             secret_arn = self.secret_helper.create_secret(secret_name, secret_value)
         else:
-            print('Secret exists, skipping creation.')
+            print("Secret exists, skipping creation.")
             secret_arn = self.secret_helper.get_secret_arn(secret_name)
-        print('----------')
+        print("----------")
 
         # Step 2: Create IAM role configured in connector
         trust_policy = {
@@ -267,12 +312,10 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
             "Statement": [
                 {
                     "Effect": "Allow",
-                    "Principal": {
-                        "Service": "es.amazonaws.com"
-                    },
-                    "Action": "sts:AssumeRole"
+                    "Principal": {"Service": "es.amazonaws.com"},
+                    "Action": "sts:AssumeRole",
                 }
-            ]
+            ],
         }
 
         inline_policy = {
@@ -281,21 +324,23 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
                 {
                     "Action": [
                         "secretsmanager:GetSecretValue",
-                        "secretsmanager:DescribeSecret"
+                        "secretsmanager:DescribeSecret",
                     ],
                     "Effect": "Allow",
-                    "Resource": secret_arn
+                    "Resource": secret_arn,
                 }
-            ]
+            ],
         }
 
-        print('Step2: Create IAM role configured in connector')
+        print("Step2: Create IAM role configured in connector")
         if not self.iam_helper.role_exists(connector_role_name):
-            connector_role_arn = self.iam_helper.create_iam_role(connector_role_name, trust_policy, inline_policy)
+            connector_role_arn = self.iam_helper.create_iam_role(
+                connector_role_name, trust_policy, inline_policy
+            )
         else:
-            print('Role exists, skipping creation.')
+            print("Role exists, skipping creation.")
             connector_role_arn = self.iam_helper.get_role_arn(connector_role_name)
-        print('----------')
+        print("----------")
 
         # Step 3: Configure IAM role in OpenSearch
         # 3.1 Create IAM role for signing create connector request
@@ -303,25 +348,22 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
         role_arn = self.iam_helper.get_role_arn(self.aws_role_name)
         statements = []
         if user_arn:
-            statements.append({
-                "Effect": "Allow",
-                "Principal": {
-                    "AWS": user_arn
-                },
-                "Action": "sts:AssumeRole"
-            })
+            statements.append(
+                {
+                    "Effect": "Allow",
+                    "Principal": {"AWS": user_arn},
+                    "Action": "sts:AssumeRole",
+                }
+            )
         if role_arn:
-            statements.append({
-                "Effect": "Allow",
-                "Principal": {
-                    "AWS": role_arn
-                },
-                "Action": "sts:AssumeRole"
-            })
-        trust_policy = {
-            "Version": "2012-10-17",
-            "Statement": statements
-        }
+            statements.append(
+                {
+                    "Effect": "Allow",
+                    "Principal": {"AWS": role_arn},
+                    "Action": "sts:AssumeRole",
+                }
+            )
+        trust_policy = {"Version": "2012-10-17", "Statement": statements}
 
         inline_policy = {
             "Version": "2012-10-17",
@@ -329,45 +371,53 @@ def create_connector_with_secret(self, secret_name, secret_value, connector_role
                 {
                     "Effect": "Allow",
                     "Action": "iam:PassRole",
-                    "Resource": connector_role_arn
+                    "Resource": connector_role_arn,
                 },
                 {
                     "Effect": "Allow",
                     "Action": "es:ESHttpPost",
-                    "Resource": self.opensearch_domain_arn
-                }
-            ]
+                    "Resource": self.opensearch_domain_arn,
+                },
+            ],
         }
 
-        print('Step 3: Configure IAM role in OpenSearch')
-        print('Step 3.1: Create IAM role for Signing create connector request')
+        print("Step 3: Configure IAM role in OpenSearch")
+        print("Step 3.1: Create IAM role for Signing create connector request")
         if not self.iam_helper.role_exists(create_connector_role_name):
-            create_connector_role_arn = self.iam_helper.create_iam_role(create_connector_role_name, trust_policy,
-                                                                       inline_policy)
+            create_connector_role_arn = self.iam_helper.create_iam_role(
+                create_connector_role_name, trust_policy, inline_policy
+            )
         else:
-            print('Role exists, skipping creation.')
-            create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
-        print('----------')
+            print("Role exists, skipping creation.")
+            create_connector_role_arn = self.iam_helper.get_role_arn(
+                create_connector_role_name
+            )
+        print("----------")
 
         # 3.2 Map IAM role to backend role in OpenSearch
-        print(f'Step 3.2: Map IAM role {create_connector_role_name} to OpenSearch permission role')
+        print(
+            f"Step 3.2: Map IAM role {create_connector_role_name} to OpenSearch permission role"
+        )
         self.iam_helper.map_iam_role_to_backend_role(create_connector_role_arn)
-        print('----------')
+        print("----------")
 
         # Step 4: Create connector
-        print('Step 4: Create connector in OpenSearch')
+        print("Step 4: Create connector in OpenSearch")
         time.sleep(sleep_time_in_seconds)
         payload = create_connector_input
-        payload['credential'] = {
-            "secretArn": secret_arn,
-            "roleArn": connector_role_arn
-        }
+        payload["credential"] = {"secretArn": secret_arn, "roleArn": connector_role_arn}
         connector_id = self.create_connector(create_connector_role_name, payload)
-        print('----------')
+        print("----------")
         return connector_id
 
-    def create_connector_with_role(self, connector_role_inline_policy, connector_role_name, create_connector_role_name,
-                                   create_connector_input, sleep_time_in_seconds=10):
+    def create_connector_with_role(
+        self,
+        connector_role_inline_policy,
+        connector_role_name,
+        create_connector_role_name,
+        create_connector_input,
+        sleep_time_in_seconds=10,
+    ):
         """
         Create a connector in OpenSearch using an IAM role for credentials.
         """
@@ -377,22 +427,21 @@ def create_connector_with_role(self, connector_role_inline_policy, connector_rol
             "Statement": [
                 {
                     "Effect": "Allow",
-                    "Principal": {
-                        "Service": "es.amazonaws.com"
-                    },
-                    "Action": "sts:AssumeRole"
+                    "Principal": {"Service": "es.amazonaws.com"},
+                    "Action": "sts:AssumeRole",
                 }
-            ]
+            ],
         }
 
-        print('Step1: Create IAM role configured in connector')
+        print("Step1: Create IAM role configured in connector")
         if not self.iam_helper.role_exists(connector_role_name):
-            connector_role_arn = self.iam_helper.create_iam_role(connector_role_name, trust_policy,
-                                                                 connector_role_inline_policy)
+            connector_role_arn = self.iam_helper.create_iam_role(
+                connector_role_name, trust_policy, connector_role_inline_policy
+            )
         else:
-            print('Role exists, skipping creation.')
+            print("Role exists, skipping creation.")
             connector_role_arn = self.iam_helper.get_role_arn(connector_role_name)
-        print('----------')
+        print("----------")
 
         # Step 2: Configure IAM role in OpenSearch
         # 2.1 Create IAM role for signing create connector request
@@ -400,25 +449,22 @@ def create_connector_with_role(self, connector_role_inline_policy, connector_rol
         role_arn = self.iam_helper.get_role_arn(self.aws_role_name)
         statements = []
         if user_arn:
-            statements.append({
-                "Effect": "Allow",
-                "Principal": {
-                    "AWS": user_arn
-                },
-                "Action": "sts:AssumeRole"
-            })
+            statements.append(
+                {
+                    "Effect": "Allow",
+                    "Principal": {"AWS": user_arn},
+                    "Action": "sts:AssumeRole",
+                }
+            )
         if role_arn:
-            statements.append({
-                "Effect": "Allow",
-                "Principal": {
-                    "AWS": role_arn
-                },
-                "Action": "sts:AssumeRole"
-            })
-        trust_policy = {
-            "Version": "2012-10-17",
-            "Statement": statements
-        }
+            statements.append(
+                {
+                    "Effect": "Allow",
+                    "Principal": {"AWS": role_arn},
+                    "Action": "sts:AssumeRole",
+                }
+            )
+        trust_policy = {"Version": "2012-10-17", "Statement": statements}
 
         inline_policy = {
             "Version": "2012-10-17",
@@ -426,38 +472,41 @@ def create_connector_with_role(self, connector_role_inline_policy, connector_rol
                 {
                     "Effect": "Allow",
                     "Action": "iam:PassRole",
-                    "Resource": connector_role_arn
+                    "Resource": connector_role_arn,
                 },
                 {
                     "Effect": "Allow",
                     "Action": "es:ESHttpPost",
-                    "Resource": self.opensearch_domain_arn
-                }
-            ]
+                    "Resource": self.opensearch_domain_arn,
+                },
+            ],
         }
 
-        print('Step 2: Configure IAM role in OpenSearch')
-        print('Step 2.1: Create IAM role for Signing create connector request')
+        print("Step 2: Configure IAM role in OpenSearch")
+        print("Step 2.1: Create IAM role for Signing create connector request")
         if not self.iam_helper.role_exists(create_connector_role_name):
-            create_connector_role_arn = self.iam_helper.create_iam_role(create_connector_role_name, trust_policy,
-                                                                       inline_policy)
+            create_connector_role_arn = self.iam_helper.create_iam_role(
+                create_connector_role_name, trust_policy, inline_policy
+            )
         else:
-            print('Role exists, skipping creation.')
-            create_connector_role_arn = self.iam_helper.get_role_arn(create_connector_role_name)
-        print('----------')
+            print("Role exists, skipping creation.")
+            create_connector_role_arn = self.iam_helper.get_role_arn(
+                create_connector_role_name
+            )
+        print("----------")
 
         # 2.2 Map IAM role to backend role in OpenSearch
-        print(f'Step 2.2: Map IAM role {create_connector_role_name} to OpenSearch permission role')
+        print(
+            f"Step 2.2: Map IAM role {create_connector_role_name} to OpenSearch permission role"
+        )
         self.iam_helper.map_iam_role_to_backend_role(create_connector_role_arn)
-        print('----------')
+        print("----------")
 
         # Step 3: Create connector
-        print('Step 3: Create connector in OpenSearch')
+        print("Step 3: Create connector in OpenSearch")
         time.sleep(sleep_time_in_seconds)
         payload = create_connector_input
-        payload['credential'] = {
-            "roleArn": connector_role_arn
-        }
+        payload["credential"] = {"roleArn": connector_role_arn}
         connector_id = self.create_connector(create_connector_role_name, payload)
-        print('----------')
+        print("----------")
         return connector_id
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py
index 43d9d3f4..3a3fa0f8 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py
@@ -3,4 +3,11 @@
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
 # Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
\ No newline at end of file
+# GitHub history for details.
+
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/embedding_client.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/embedding_client.py
index acfe6a45..5b0065a4 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/embedding_client.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/embedding_client.py
@@ -7,12 +7,15 @@
 
 import time
 
+
 class EmbeddingClient:
     def __init__(self, opensearch_client, embedding_model_id):
         self.opensearch_client = opensearch_client
         self.embedding_model_id = embedding_model_id
 
-    def get_text_embedding(self, text, max_retries=5, initial_delay=1, backoff_factor=2):
+    def get_text_embedding(
+        self, text, max_retries=5, initial_delay=1, backoff_factor=2
+    ):
         """
         Generate a text embedding using OpenSearch's ML API with retry logic.
 
@@ -25,30 +28,28 @@ def get_text_embedding(self, text, max_retries=5, initial_delay=1, backoff_facto
         delay = initial_delay
         for attempt in range(max_retries):
             try:
-                payload = {
-                    "text_docs": [text]
-                }
+                payload = {"text_docs": [text]}
                 response = self.opensearch_client.transport.perform_request(
                     method="POST",
                     url=f"/_plugins/_ml/_predict/text_embedding/{self.embedding_model_id}",
-                    body=payload
+                    body=payload,
                 )
-                inference_results = response.get('inference_results', [])
+                inference_results = response.get("inference_results", [])
                 if not inference_results:
                     print(f"No inference results returned for text: {text}")
                     return None
-                output = inference_results[0].get('output')
+                output = inference_results[0].get("output")
 
                 # Adjust the extraction of embedding data
                 if isinstance(output, list) and len(output) > 0:
                     embedding_dict = output[0]
-                    if isinstance(embedding_dict, dict) and 'data' in embedding_dict:
-                        embedding = embedding_dict['data']
+                    if isinstance(embedding_dict, dict) and "data" in embedding_dict:
+                        embedding = embedding_dict["data"]
                     else:
                         print(f"Unexpected embedding output format: {output}")
                         return None
-                elif isinstance(output, dict) and 'data' in output:
-                    embedding = output['data']
+                elif isinstance(output, dict) and "data" in output:
+                    embedding = output["data"]
                 else:
                     print(f"Unexpected embedding output format: {output}")
                     return None
@@ -60,4 +61,4 @@ def get_text_embedding(self, text, max_retries=5, initial_delay=1, backoff_facto
                     raise
                 time.sleep(delay)
                 delay *= backoff_factor
-        return None
\ No newline at end of file
+        return None
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
index dc0f186a..2544a226 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ingest.py
@@ -5,22 +5,22 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-import os
-import glob
-import json
-import tiktoken
-from tqdm import tqdm
-from colorama import Fore, Style, init
-from typing import List, Dict
 import csv
+import json
+import os
+from typing import Dict, List
+
 import PyPDF2
-import boto3
-import botocore
-import time
-import random
+from colorama import Fore, Style, init
 from opensearchpy import exceptions as opensearch_exceptions
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.embedding_client import EmbeddingClient
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import OpenSearchConnector
+from tqdm import tqdm
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.embedding_client import (
+    EmbeddingClient,
+)
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import (
+    OpenSearchConnector,
+)
 
 # Initialize colorama for colored terminal output
 init(autoreset=True)  # Initialize colorama
@@ -38,13 +38,17 @@ def __init__(self, config):
         :param config: Configuration dictionary containing necessary parameters.
         """
         self.config = config
-        self.aws_region = config.get('region')
-        self.index_name = config.get('index_name')
+        self.aws_region = config.get("region")
+        self.index_name = config.get("index_name")
         self.bedrock_client = None
         self.opensearch = OpenSearchConnector(config)
-        self.embedding_model_id = config.get('embedding_model_id')
-        self.embedding_client = None  # Will be initialized after OpenSearch client is ready
-        self.pipeline_name = config.get('ingest_pipeline_name', 'text-chunking-ingest-pipeline')
+        self.embedding_model_id = config.get("embedding_model_id")
+        self.embedding_client = (
+            None  # Will be initialized after OpenSearch client is ready
+        )
+        self.pipeline_name = config.get(
+            "ingest_pipeline_name", "text-chunking-ingest-pipeline"
+        )
 
     def initialize_clients(self) -> bool:
         """
@@ -60,12 +64,14 @@ def initialize_clients(self) -> bool:
                 print("Embedding model ID is not set. Please run setup first.")
                 return False
 
-            self.embedding_client = EmbeddingClient(self.opensearch.opensearch_client, self.embedding_model_id)
+            self.embedding_client = EmbeddingClient(
+                self.opensearch.opensearch_client, self.embedding_model_id
+            )
             return True
         else:
             print("Failed to initialize OpenSearch client.")
             return False
-        
+
     def ingest_command(self, paths: List[str]):
         """
         Main ingestion command that processes and ingests all valid files from the provided paths.
@@ -84,15 +90,21 @@ def ingest_command(self, paths: List[str]):
                 print(f"{Fore.YELLOW}Invalid path: {path}{Style.RESET_ALL}")
 
         # Define supported file extensions
-        supported_extensions = ['.csv', '.txt', '.pdf']
-        valid_files = [f for f in all_files if any(f.lower().endswith(ext) for ext in supported_extensions)]
+        supported_extensions = [".csv", ".txt", ".pdf"]
+        valid_files = [
+            f
+            for f in all_files
+            if any(f.lower().endswith(ext) for ext in supported_extensions)
+        ]
 
         # Check if there are valid files to ingest
         if not valid_files:
             print(f"{Fore.RED}No valid files found for ingestion.{Style.RESET_ALL}")
             return
 
-        print(f"{Fore.GREEN}Found {len(valid_files)} valid files for ingestion.{Style.RESET_ALL}")
+        print(
+            f"{Fore.GREEN}Found {len(valid_files)} valid files for ingestion.{Style.RESET_ALL}"
+        )
 
         # Process and ingest data from valid files
         self.process_and_ingest_data(valid_files)
@@ -110,9 +122,9 @@ def process_and_ingest_data(self, file_paths: List[str]):
         self.create_ingest_pipeline(self.pipeline_name)
 
         # Retrieve field names from the config
-        passage_text_field = self.config.get('passage_text_field', 'passage_text')
-        passage_chunk_field = self.config.get('passage_chunk_field', 'passage_chunk')
-        embedding_field = self.config.get('embedding_field', 'passage_embedding')
+        passage_text_field = self.config.get("passage_text_field", "passage_text")
+        self.config.get("passage_chunk_field", "passage_chunk")
+        embedding_field = self.config.get("embedding_field", "passage_embedding")
 
         all_documents = []
         for file_path in file_paths:
@@ -128,53 +140,65 @@ def process_and_ingest_data(self, file_paths: List[str]):
         error_count = 0
 
         # Progress bar for embedding generation
-        with tqdm(total=total_documents, bar_format='{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}]') as pbar:
+        with tqdm(
+            total=total_documents,
+            bar_format="{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}]",
+        ) as pbar:
             for doc in all_documents:
                 try:
-                    embedding = self.embedding_client.get_text_embedding(doc['text'])
+                    embedding = self.embedding_client.get_text_embedding(doc["text"])
                     if embedding is not None:
-                        doc['embedding'] = embedding
+                        doc["embedding"] = embedding
                         success_count += 1
                     else:
                         error_count += 1
-                        print(f"{Fore.RED}Error generating embedding for document: {doc['text'][:50]}...{Style.RESET_ALL}")
+                        print(
+                            f"{Fore.RED}Error generating embedding for document: {doc['text'][:50]}...{Style.RESET_ALL}"
+                        )
                 except Exception as e:
                     error_count += 1
-                    print(f"{Fore.RED}Error processing document: {str(e)}{Style.RESET_ALL}")
+                    print(
+                        f"{Fore.RED}Error processing document: {str(e)}{Style.RESET_ALL}"
+                    )
                 pbar.update(1)
-                pbar.set_postfix({'Success': success_count, 'Errors': error_count})
+                pbar.set_postfix({"Success": success_count, "Errors": error_count})
 
-        print(f"\n{Fore.GREEN}Documents with successful embeddings: {success_count}{Style.RESET_ALL}")
-        print(f"{Fore.RED}Documents with failed embeddings: {error_count}{Style.RESET_ALL}")
+        print(
+            f"\n{Fore.GREEN}Documents with successful embeddings: {success_count}{Style.RESET_ALL}"
+        )
+        print(
+            f"{Fore.RED}Documents with failed embeddings: {error_count}{Style.RESET_ALL}"
+        )
 
         # Check if there are documents to ingest
         if success_count == 0:
-            print(f"{Fore.RED}No documents to ingest. Aborting ingestion.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}No documents to ingest. Aborting ingestion.{Style.RESET_ALL}"
+            )
             return
 
         print(f"\n{Fore.YELLOW}Ingesting data into OpenSearch...{Style.RESET_ALL}")
         actions = []
         for doc in all_documents:
-            if 'embedding' in doc and doc['embedding'] is not None:
+            if "embedding" in doc and doc["embedding"] is not None:
                 action = {
                     "_op_type": "index",
                     "_index": self.index_name,
                     "_source": {
-                        passage_text_field: doc['text'],
-                        embedding_field: {
-                            "knn": doc['embedding']
-                        }
+                        passage_text_field: doc["text"],
+                        embedding_field: {"knn": doc["embedding"]},
                     },
-                    "pipeline": self.pipeline_name
+                    "pipeline": self.pipeline_name,
                 }
                 actions.append(action)
 
         # Bulk index the documents into OpenSearch
         success, failed = self.opensearch.bulk_index(actions)
-        print(f"\n{Fore.GREEN}Successfully ingested {success} documents.{Style.RESET_ALL}")
+        print(
+            f"\n{Fore.GREEN}Successfully ingested {success} documents.{Style.RESET_ALL}"
+        )
         print(f"{Fore.RED}Failed to ingest {failed} documents.{Style.RESET_ALL}")
 
-
     def create_ingest_pipeline(self, pipeline_id: str):
         """
         Creates an ingest pipeline in OpenSearch if it does not already exist.
@@ -186,14 +210,9 @@ def create_ingest_pipeline(self, pipeline_id: str):
             print(f"\nIngest pipeline '{pipeline_id}' already exists.")
         except opensearch_exceptions.NotFoundError:
             # Pipeline does not exist, create it
-            embedding_dimension = int(self.config.get('embedding_dimension', 768))
-            # Calculate token_limit based on embedding dimension if not set
-            token_limit = int(self.config.get('token_limit', int(embedding_dimension * 0.75)))
-            tokenizer = self.config.get('tokenizer', 'standard')
-            overlap_rate = float(self.config.get('overlap_rate', 0.2))
-            source_field = self.config.get('passage_text_field', 'passage_text')
-            target_field = self.config.get('passage_chunk_field', 'passage_chunk')
-            embedding_field = self.config.get('embedding_field', 'passage_embedding')
+            source_field = self.config.get("passage_text_field", "passage_text")
+            target_field = self.config.get("passage_chunk_field", "passage_chunk")
+            embedding_field = self.config.get("embedding_field", "passage_embedding")
             model_id = self.embedding_model_id
 
             pipeline_body = {
@@ -201,28 +220,22 @@ def create_ingest_pipeline(self, pipeline_id: str):
                 "processors": [
                     {
                         "text_chunking": {
-                            "algorithm": {
-                                "delimiter": {
-                                    "delimiter": "."
-                                }
-                            },
-                            "field_map": {
-                                source_field: target_field
-                            }
+                            "algorithm": {"delimiter": {"delimiter": "."}},
+                            "field_map": {source_field: target_field},
                         }
                     },
                     {
                         "text_embedding": {
                             "model_id": model_id,
-                            "field_map": {
-                                target_field: embedding_field
-                            }
+                            "field_map": {target_field: embedding_field},
                         }
-                    }
-                ]
+                    },
+                ],
             }
             # Create the ingest pipeline
-            self.opensearch.opensearch_client.ingest.put_pipeline(id=pipeline_id, body=pipeline_body)
+            self.opensearch.opensearch_client.ingest.put_pipeline(
+                id=pipeline_id, body=pipeline_body
+            )
             print(f"\nIngest pipeline '{pipeline_id}' created successfully.")
         except Exception as e:
             print(f"\nError checking or creating ingest pipeline: {e}")
@@ -236,11 +249,11 @@ def process_file(self, file_path: str) -> List[Dict[str, str]]:
         """
         _, file_extension = os.path.splitext(file_path)
 
-        if file_extension.lower() == '.csv':
+        if file_extension.lower() == ".csv":
             return self.process_csv(file_path)
-        elif file_extension.lower() == '.txt':
+        elif file_extension.lower() == ".txt":
             return self.process_txt(file_path)
-        elif file_extension.lower() == '.pdf':
+        elif file_extension.lower() == ".pdf":
             return self.process_pdf(file_path)
         else:
             print(f"Unsupported file type: {file_extension}")
@@ -254,7 +267,7 @@ def process_csv(self, file_path: str) -> List[Dict[str, str]]:
         :return: List of dictionaries with extracted text.
         """
         documents = []
-        with open(file_path, 'r', newline='', encoding='utf-8') as csvfile:
+        with open(file_path, "r", newline="", encoding="utf-8") as csvfile:
             reader = csv.DictReader(csvfile)
             for row in reader:
                 documents.append({"text": json.dumps(row)})
@@ -267,7 +280,7 @@ def process_txt(self, file_path: str) -> List[Dict[str, str]]:
         :param file_path: Path to the TXT file.
         :return: List containing a single dictionary with the file content.
         """
-        with open(file_path, 'r') as txtfile:
+        with open(file_path, "r") as txtfile:
             content = txtfile.read()
         return [{"text": content}]
 
@@ -279,11 +292,10 @@ def process_pdf(self, file_path: str) -> List[Dict[str, str]]:
         :return: List of dictionaries, each containing text from a page.
         """
         documents = []
-        with open(file_path, 'rb') as pdffile:
+        with open(file_path, "rb") as pdffile:
             pdf_reader = PyPDF2.PdfReader(pdffile)
             for page in pdf_reader.pages:
                 extracted_text = page.extract_text()
                 if extracted_text:  # Ensure that text was extracted
                     documents.append({"text": extracted_text})
         return documents
-
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
index 4b1b4ba4..c80ccc31 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/BedrockModel.py
@@ -6,13 +6,22 @@
 # GitHub history for details.
 
 import json
+
 from colorama import Fore, Style
 
+
 class BedrockModel:
-    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+    def __init__(
+        self,
+        aws_region,
+        opensearch_domain_name,
+        opensearch_username,
+        opensearch_password,
+        iam_role_helper,
+    ):
         """
         Initializes the BedrockModel with necessary configurations.
-        
+
         Args:
             aws_region (str): AWS region.
             opensearch_domain_name (str): OpenSearch domain name.
@@ -36,7 +45,9 @@ def register_bedrock_model(self, helper, config, save_config_method):
             save_config_method (function): Method to save the configuration.
         """
         # Prompt for necessary inputs
-        bedrock_region = input(f"Enter your Bedrock region [{self.aws_region}]: ") or self.aws_region
+        bedrock_region = (
+            input(f"Enter your Bedrock region [{self.aws_region}]: ") or self.aws_region
+        )
         connector_role_name = "my_test_bedrock_connector_role"
         create_connector_role_name = "my_test_create_bedrock_connector_role"
 
@@ -47,9 +58,9 @@ def register_bedrock_model(self, helper, config, save_config_method):
                 {
                     "Action": ["bedrock:InvokeModel"],
                     "Effect": "Allow",
-                    "Resource": "arn:aws:bedrock:*::foundation-model/amazon.titan-embed-text-v1"
+                    "Resource": "arn:aws:bedrock:*::foundation-model/amazon.titan-embed-text-v1",
                 }
-            ]
+            ],
         }
 
         # Default connector input
@@ -58,10 +69,7 @@ def register_bedrock_model(self, helper, config, save_config_method):
             "description": "The connector to Bedrock Titan embedding model",
             "version": 1,
             "protocol": "aws_sigv4",
-            "parameters": {
-                "region": bedrock_region,
-                "service_name": "bedrock"
-            },
+            "parameters": {"region": bedrock_region, "service_name": "bedrock"},
             "actions": [
                 {
                     "action_type": "predict",
@@ -69,13 +77,13 @@ def register_bedrock_model(self, helper, config, save_config_method):
                     "url": f"https://bedrock-runtime.{bedrock_region}.amazonaws.com/model/amazon.titan-embed-text-v1/invoke",
                     "headers": {
                         "content-type": "application/json",
-                        "x-amz-content-sha256": "required"
+                        "x-amz-content-sha256": "required",
                     },
-                    "request_body": "{ \"inputText\": \"${parameters.inputText}\" }",
-                    "pre_process_function": "\n    StringBuilder builder = new StringBuilder();\n    builder.append(\"\\\"\");\n    String first = params.text_docs[0];\n    builder.append(first);\n    builder.append(\"\\\"\");\n    def parameters = \"{\" +\"\\\"inputText\\\":\" + builder + \"}\";\n    return  \"{\" +\"\\\"parameters\\\":\" + parameters + \"}\";",
-                    "post_process_function": "\n      def name = \"sentence_embedding\";\n      def dataType = \"FLOAT32\";\n      if (params.embedding == null || params.embedding.length == 0) {\n        return params.message;\n      }\n      def shape = [params.embedding.length];\n      def json = \"{\" +\n                 \"\\\"name\\\":\\\"\" + name + \"\\\",\" +\n                 \"\\\"data_type\\\":\\\"\" + dataType + \"\\\",\" +\n                 \"\\\"shape\\\":\" + shape + \",\" +\n                 \"\\\"data\\\":\" + params.embedding +\n                 \"}\";\n      return json;\n    "
+                    "request_body": '{ "inputText": "${parameters.inputText}" }',
+                    "pre_process_function": '\n    StringBuilder builder = new StringBuilder();\n    builder.append("\\"");\n    String first = params.text_docs[0];\n    builder.append(first);\n    builder.append("\\"");\n    def parameters = "{" +"\\"inputText\\":" + builder + "}";\n    return  "{" +"\\"parameters\\":" + parameters + "}";',
+                    "post_process_function": '\n      def name = "sentence_embedding";\n      def dataType = "FLOAT32";\n      if (params.embedding == null || params.embedding.length == 0) {\n        return params.message;\n      }\n      def shape = [params.embedding.length];\n      def json = "{" +\n                 "\\"name\\":\\"" + name + "\\"," +\n                 "\\"data_type\\":\\"" + dataType + "\\"," +\n                 "\\"shape\\":" + shape + "," +\n                 "\\"data\\":" + params.embedding +\n                 "}";\n      return json;\n    ',
                 }
-            ]
+            ],
         }
 
         # Get model details from user
@@ -90,26 +98,36 @@ def register_bedrock_model(self, helper, config, save_config_method):
             connector_role_name,
             create_connector_role_name,
             create_connector_input,
-            sleep_time_in_seconds=10
+            sleep_time_in_seconds=10,
         )
 
         if not connector_id:
-            print(f"{Fore.RED}Failed to create Bedrock connector. Aborting.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Failed to create Bedrock connector. Aborting.{Style.RESET_ALL}"
+            )
             return
 
         # Register model
         print("Registering Bedrock model...")
-        model_name = create_connector_input.get('name', 'Bedrock embedding model')
-        description = create_connector_input.get('description', 'Bedrock embedding model for semantic search')
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+        model_name = create_connector_input.get("name", "Bedrock embedding model")
+        description = create_connector_input.get(
+            "description", "Bedrock embedding model for semantic search"
+        )
+        model_id = helper.create_model(
+            model_name, description, connector_id, create_connector_role_name
+        )
 
         if not model_id:
-            print(f"{Fore.RED}Failed to create Bedrock model. Aborting.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Failed to create Bedrock model. Aborting.{Style.RESET_ALL}"
+            )
             return
 
         # Save model_id to config
         self.save_model_id(config, save_config_method, model_id)
-        print(f"{Fore.GREEN}Bedrock model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
+        print(
+            f"{Fore.GREEN}Bedrock model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}"
+        )
 
     def save_model_id(self, config, save_config_method, model_id):
         """
@@ -120,18 +138,20 @@ def save_model_id(self, config, save_config_method, model_id):
             save_config_method (function): Method to save the configuration.
             model_id (str): The model ID to save.
         """
-        config['embedding_model_id'] = model_id
+        config["embedding_model_id"] = model_id
         save_config_method(config)
 
     def get_custom_model_details(self, default_input):
-        print("\nDo you want to use the default configuration or provide custom model settings?")
+        print(
+            "\nDo you want to use the default configuration or provide custom model settings?"
+        )
         print("1. Use default configuration")
         print("2. Provide custom model settings")
         choice = input("Enter your choice (1-2): ").strip()
 
-        if choice == '1':
+        if choice == "1":
             return default_input
-        elif choice == '2':
+        elif choice == "2":
             print("Please enter your model details as a JSON object.")
             print("Example:")
             print(json.dumps(default_input, indent=2))
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
index 41c58a44..a7941eb0 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/CohereModel.py
@@ -6,13 +6,23 @@
 # GitHub history for details.
 
 import json
-from colorama import Fore, Style
 import time
+
+from colorama import Fore, Style
+
+
 class CohereModel:
-    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+    def __init__(
+        self,
+        aws_region,
+        opensearch_domain_name,
+        opensearch_username,
+        opensearch_password,
+        iam_role_helper,
+    ):
         """
         Initializes the CohereModel with necessary configurations.
-        
+
         Args:
             aws_region (str): AWS region.
             opensearch_domain_name (str): OpenSearch domain name.
@@ -37,7 +47,7 @@ def register_cohere_model(self, helper, config, save_config_method):
         """
         # Prompt for necessary inputs
         secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
-        secret_key = 'cohere_api_key'
+        secret_key = "cohere_api_key"
         cohere_api_key = input("Enter your Cohere API key: ")
         secret_value = {secret_key: cohere_api_key}
 
@@ -53,7 +63,7 @@ def register_cohere_model(self, helper, config, save_config_method):
             "parameters": {
                 "model": "embed-english-v3.0",
                 "input_type": "search_document",
-                "truncate": "END"
+                "truncate": "END",
             },
             "actions": [
                 {
@@ -62,13 +72,13 @@ def register_cohere_model(self, helper, config, save_config_method):
                     "url": "https://api.cohere.ai/v1/embed",
                     "headers": {
                         "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
-                        "Request-Source": "unspecified:opensearch"
+                        "Request-Source": "unspecified:opensearch",
                     },
-                    "request_body": "{ \"texts\": ${parameters.texts}, \"truncate\": \"${parameters.truncate}\", \"model\": \"${parameters.model}\", \"input_type\": \"${parameters.input_type}\" }",
+                    "request_body": '{ "texts": ${parameters.texts}, "truncate": "${parameters.truncate}", "model": "${parameters.model}", "input_type": "${parameters.input_type}" }',
                     "pre_process_function": "connector.pre_process.cohere.embedding",
-                    "post_process_function": "connector.post_process.cohere.embedding"
+                    "post_process_function": "connector.post_process.cohere.embedding",
                 }
-            ]
+            ],
         }
 
         # Get model details from user
@@ -83,7 +93,7 @@ def register_cohere_model(self, helper, config, save_config_method):
             connector_role_name,
             create_connector_role_name,
             create_connector_input,
-            sleep_time_in_seconds=10
+            sleep_time_in_seconds=10,
         )
 
         if not connector_id:
@@ -91,20 +101,28 @@ def register_cohere_model(self, helper, config, save_config_method):
             return
 
         # Register model
-        model_name = create_connector_input.get('name', 'Cohere embedding model')
-        description = create_connector_input.get('description', 'Cohere embedding model for semantic search')
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+        model_name = create_connector_input.get("name", "Cohere embedding model")
+        description = create_connector_input.get(
+            "description", "Cohere embedding model for semantic search"
+        )
+        model_id = helper.create_model(
+            model_name, description, connector_id, create_connector_role_name
+        )
 
         if not model_id:
             print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
             return
 
         # Save model_id to config
-        config['embedding_model_id'] = model_id
+        config["embedding_model_id"] = model_id
         save_config_method(config)
-        print(f"{Fore.GREEN}Cohere model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
+        print(
+            f"{Fore.GREEN}Cohere model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}"
+        )
 
-    def register_cohere_model_opensource(self, opensearch_client, config, save_config_method):
+    def register_cohere_model_opensource(
+        self, opensearch_client, config, save_config_method
+    ):
         """
         Register a Cohere embedding model in open-source OpenSearch.
 
@@ -118,12 +136,14 @@ def register_cohere_model_opensource(self, opensearch_client, config, save_confi
             print(f"{Fore.RED}API key is required. Aborting.{Style.RESET_ALL}")
             return
 
-        print("\nDo you want to use the default configuration or provide custom settings?")
+        print(
+            "\nDo you want to use the default configuration or provide custom settings?"
+        )
         print("1. Use default configuration")
         print("2. Provide custom settings")
         config_choice = input("Enter your choice (1-2): ").strip()
 
-        if config_choice == '1':
+        if config_choice == "1":
             # Use default configurations
             connector_payload = {
                 "name": "Cohere Embedding Connector",
@@ -133,11 +153,9 @@ def register_cohere_model_opensource(self, opensearch_client, config, save_confi
                 "parameters": {
                     "model": "embed-english-v3.0",
                     "input_type": "search_document",
-                    "truncate": "END"
-                },
-                "credential": {
-                    "cohere_key": cohere_api_key
+                    "truncate": "END",
                 },
+                "credential": {"cohere_key": cohere_api_key},
                 "actions": [
                     {
                         "action_type": "predict",
@@ -145,19 +163,19 @@ def register_cohere_model_opensource(self, opensearch_client, config, save_confi
                         "url": "https://api.cohere.ai/v1/embed",
                         "headers": {
                             "Authorization": "Bearer ${credential.cohere_key}",
-                            "Request-Source": "unspecified:opensearch"
+                            "Request-Source": "unspecified:opensearch",
                         },
-                        "request_body": "{ \"texts\": ${parameters.texts}, \"truncate\": \"${parameters.truncate}\", \"model\": \"${parameters.model}\", \"input_type\": \"${parameters.input_type}\" }",
+                        "request_body": '{ "texts": ${parameters.texts}, "truncate": "${parameters.truncate}", "model": "${parameters.model}", "input_type": "${parameters.input_type}" }',
                         "pre_process_function": "connector.pre_process.cohere.embedding",
-                        "post_process_function": "connector.post_process.cohere.embedding"
+                        "post_process_function": "connector.post_process.cohere.embedding",
                     }
-                ]
+                ],
             }
             model_group_payload = {
                 "name": f"cohere_model_group_{int(time.time())}",
-                "description": "Model group for Cohere models"
+                "description": "Model group for Cohere models",
             }
-        elif config_choice == '2':
+        elif config_choice == "2":
             # Get custom configurations
             print("\nPlease enter your connector details as a JSON object.")
             connector_payload = self.get_custom_json_input()
@@ -169,7 +187,9 @@ def register_cohere_model_opensource(self, opensearch_client, config, save_confi
             if not model_group_payload:
                 return
         else:
-            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}"
+            )
             return
 
         # Register the connector
@@ -177,13 +197,17 @@ def register_cohere_model_opensource(self, opensearch_client, config, save_confi
             connector_response = opensearch_client.transport.perform_request(
                 method="POST",
                 url="/_plugins/_ml/connectors/_create",
-                body=connector_payload
+                body=connector_payload,
             )
-            connector_id = connector_response.get('connector_id')
+            connector_id = connector_response.get("connector_id")
             if not connector_id:
-                print(f"{Fore.RED}Failed to register connector. Response: {connector_response}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Failed to register connector. Response: {connector_response}{Style.RESET_ALL}"
+                )
                 return
-            print(f"{Fore.GREEN}Connector registered successfully. Connector ID: {connector_id}{Style.RESET_ALL}")
+            print(
+                f"{Fore.GREEN}Connector registered successfully. Connector ID: {connector_id}{Style.RESET_ALL}"
+            )
         except Exception as ex:
             print(f"{Fore.RED}Error registering connector: {ex}{Style.RESET_ALL}")
             return
@@ -193,55 +217,70 @@ def register_cohere_model_opensource(self, opensearch_client, config, save_confi
             model_group_response = opensearch_client.transport.perform_request(
                 method="POST",
                 url="/_plugins/_ml/model_groups/_register",
-                body=model_group_payload
+                body=model_group_payload,
             )
-            model_group_id = model_group_response.get('model_group_id')
+            model_group_id = model_group_response.get("model_group_id")
             if not model_group_id:
-                print(f"{Fore.RED}Failed to create model group. Response: {model_group_response}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Failed to create model group. Response: {model_group_response}{Style.RESET_ALL}"
+                )
                 return
-            print(f"{Fore.GREEN}Model group created successfully. Model Group ID: {model_group_id}{Style.RESET_ALL}")
+            print(
+                f"{Fore.GREEN}Model group created successfully. Model Group ID: {model_group_id}{Style.RESET_ALL}"
+            )
         except Exception as ex:
             print(f"{Fore.RED}Error creating model group: {ex}{Style.RESET_ALL}")
-            if 'illegal_argument_exception' in str(ex) and 'already being used' in str(ex):
-                print(f"{Fore.YELLOW}A model group with this name already exists. Using the existing group.{Style.RESET_ALL}")
-                model_group_id = str(ex).split('ID: ')[-1].strip("'.")
+            if "illegal_argument_exception" in str(ex) and "already being used" in str(
+                ex
+            ):
+                print(
+                    f"{Fore.YELLOW}A model group with this name already exists. Using the existing group.{Style.RESET_ALL}"
+                )
+                model_group_id = str(ex).split("ID: ")[-1].strip("'.")
             else:
                 return
 
         # Create model payload
         model_payload = {
-            "name": connector_payload.get('name', 'Cohere embedding model'),
+            "name": connector_payload.get("name", "Cohere embedding model"),
             "function_name": "REMOTE",
             "model_group_id": model_group_id,
-            "description": connector_payload.get('description', 'Cohere embedding model for semantic search'),
-            "connector_id": connector_id
+            "description": connector_payload.get(
+                "description", "Cohere embedding model for semantic search"
+            ),
+            "connector_id": connector_id,
         }
 
         # Register the model
         try:
             response = opensearch_client.transport.perform_request(
-                method="POST",
-                url="/_plugins/_ml/models/_register",
-                body=model_payload
+                method="POST", url="/_plugins/_ml/models/_register", body=model_payload
             )
-            task_id = response.get('task_id')
+            task_id = response.get("task_id")
             if task_id:
-                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}"
+                )
                 # Wait for the task to complete and retrieve the model_id
                 model_id = self.wait_for_model_registration(opensearch_client, task_id)
                 if model_id:
                     # Deploy the model
-                    deploy_response = opensearch_client.transport.perform_request(
-                        method="POST",
-                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    opensearch_client.transport.perform_request(
+                        method="POST", url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    )
+                    print(
+                        f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}"
                     )
-                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
-                    config['embedding_model_id'] = model_id
+                    config["embedding_model_id"] = model_id
                     save_config_method(config)
                 else:
-                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+                    print(
+                        f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}"
+                    )
             else:
-                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}"
+                )
         except Exception as ex:
             print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
 
@@ -256,14 +295,16 @@ def get_custom_model_details(self, default_input):
         Returns:
             dict or None: Custom or default model configuration, or None if invalid input.
         """
-        print("\nDo you want to use the default configuration or provide custom model settings?")
+        print(
+            "\nDo you want to use the default configuration or provide custom model settings?"
+        )
         print("1. Use default configuration")
         print("2. Provide custom model settings")
         choice = input("Enter your choice (1-2): ").strip()
 
-        if choice == '1':
+        if choice == "1":
             return default_input
-        elif choice == '2':
+        elif choice == "2":
             print("Please enter your model details as a JSON object.")
             print("Example:")
             print(json.dumps(default_input, indent=2))
@@ -275,7 +316,9 @@ def get_custom_model_details(self, default_input):
                 print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
                 return None
         else:
-            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}"
+            )
             return None
 
     def get_custom_json_input(self):
@@ -287,7 +330,9 @@ def get_custom_json_input(self):
             print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
             return None
 
-    def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, interval=10):
+    def wait_for_model_registration(
+        self, opensearch_client, task_id, timeout=600, interval=10
+    ):
         """
         Wait for the model registration task to complete and return the model_id.
 
@@ -304,21 +349,26 @@ def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, i
         while time.time() < end_time:
             try:
                 response = opensearch_client.transport.perform_request(
-                    method="GET",
-                    url=f"/_plugins/_ml/tasks/{task_id}"
+                    method="GET", url=f"/_plugins/_ml/tasks/{task_id}"
                 )
-                state = response.get('state')
-                if state == 'COMPLETED':
-                    model_id = response.get('model_id')
+                state = response.get("state")
+                if state == "COMPLETED":
+                    model_id = response.get("model_id")
                     return model_id
-                elif state in ['FAILED', 'STOPPED']:
-                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
+                elif state in ["FAILED", "STOPPED"]:
+                    print(
+                        f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}"
+                    )
                     return None
                 else:
-                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
+                    print(
+                        f"Model registration task {task_id} is in state: {state}. Waiting..."
+                    )
                     time.sleep(interval)
             except Exception as ex:
                 print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
                 time.sleep(interval)
-        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
-        return None
\ No newline at end of file
+        print(
+            f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}"
+        )
+        return None
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
index 3bee6c5e..2dc048c0 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/HuggingFaceModel.py
@@ -5,14 +5,23 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 import json
-from colorama import Fore, Style
 import time
 
+from colorama import Fore, Style
+
+
 class HuggingFaceModel:
-    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+    def __init__(
+        self,
+        aws_region,
+        opensearch_domain_name,
+        opensearch_username,
+        opensearch_password,
+        iam_role_helper,
+    ):
         """
         Initializes the HuggingFaceModel with necessary configurations.
-        
+
         Args:
             aws_region (str): AWS region.
             opensearch_domain_name (str): OpenSearch domain name.
@@ -35,28 +44,32 @@ def register_huggingface_model(self, opensearch_client, config, save_config_meth
             config (dict): Configuration dictionary.
             save_config_method (function): Method to save the configuration.
         """
-        print("\nDo you want to use the default configuration or provide custom settings?")
+        print(
+            "\nDo you want to use the default configuration or provide custom settings?"
+        )
         print("1. Use default configuration")
         print("2. Provide custom settings")
         config_choice = input("Enter your choice (1-2): ").strip()
 
-        if config_choice == '1':
+        if config_choice == "1":
             # Use default configurations
             model_name = "sentence-transformers/all-MiniLM-L6-v2"
             model_payload = {
                 "name": f"huggingface_{model_name.split('/')[-1]}",
                 "model_format": "TORCH_SCRIPT",
                 "model_config": {
-                    "embedding_dimension": config.get('embedding_dimension', 768),
+                    "embedding_dimension": config.get("embedding_dimension", 768),
                     "framework_type": "SENTENCE_TRANSFORMERS",
                     "model_type": "bert",
-                    "embedding_model": model_name
+                    "embedding_model": model_name,
                 },
-                "description": f"Hugging Face Transformers model: {model_name}"
+                "description": f"Hugging Face Transformers model: {model_name}",
             }
-        elif config_choice == '2':
+        elif config_choice == "2":
             # Get custom configurations
-            model_name = input("Enter the Hugging Face model ID (e.g., 'sentence-transformers/all-MiniLM-L6-v2'): ").strip()
+            model_name = input(
+                "Enter the Hugging Face model ID (e.g., 'sentence-transformers/all-MiniLM-L6-v2'): "
+            ).strip()
             if not model_name:
                 print(f"{Fore.RED}Model ID is required. Aborting.{Style.RESET_ALL}")
                 return
@@ -67,47 +80,54 @@ def register_huggingface_model(self, opensearch_client, config, save_config_meth
                 "name": f"huggingface_{model_name.split('/')[-1]}",
                 "model_format": "TORCH_SCRIPT",
                 "model_config": {
-                    "embedding_dimension": config.get('embedding_dimension', 768),
+                    "embedding_dimension": config.get("embedding_dimension", 768),
                     "framework_type": "SENTENCE_TRANSFORMERS",
                     "model_type": "bert",
-                    "embedding_model": model_name
+                    "embedding_model": model_name,
                 },
-                "description": f"Hugging Face Transformers model: {model_name}"
+                "description": f"Hugging Face Transformers model: {model_name}",
             }
             print(json.dumps(example_payload, indent=2))
-            
+
             model_payload = self.get_custom_json_input()
             if not model_payload:
                 return
         else:
-            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}"
+            )
             return
 
         # Register the model
         try:
             response = opensearch_client.transport.perform_request(
-                method="POST",
-                url="/_plugins/_ml/models/_register",
-                body=model_payload
+                method="POST", url="/_plugins/_ml/models/_register", body=model_payload
             )
-            task_id = response.get('task_id')
+            task_id = response.get("task_id")
             if task_id:
-                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}"
+                )
                 # Wait for the task to complete and retrieve the model_id
                 model_id = self.wait_for_model_registration(opensearch_client, task_id)
                 if model_id:
                     # Deploy the model
-                    deploy_response = opensearch_client.transport.perform_request(
-                        method="POST",
-                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    opensearch_client.transport.perform_request(
+                        method="POST", url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    )
+                    print(
+                        f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}"
                     )
-                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
-                    config['embedding_model_id'] = model_id
+                    config["embedding_model_id"] = model_id
                     save_config_method(config)
                 else:
-                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+                    print(
+                        f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}"
+                    )
             else:
-                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}"
+                )
         except Exception as ex:
             print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
 
@@ -120,7 +140,9 @@ def get_custom_json_input(self):
             print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
             return None
 
-    def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, interval=10):
+    def wait_for_model_registration(
+        self, opensearch_client, task_id, timeout=600, interval=10
+    ):
         """
         Wait for the model registration task to complete and return the model_id.
 
@@ -137,21 +159,26 @@ def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, i
         while time.time() < end_time:
             try:
                 response = opensearch_client.transport.perform_request(
-                    method="GET",
-                    url=f"/_plugins/_ml/tasks/{task_id}"
+                    method="GET", url=f"/_plugins/_ml/tasks/{task_id}"
                 )
-                state = response.get('state')
-                if state == 'COMPLETED':
-                    model_id = response.get('model_id')
+                state = response.get("state")
+                if state == "COMPLETED":
+                    model_id = response.get("model_id")
                     return model_id
-                elif state in ['FAILED', 'STOPPED']:
-                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
+                elif state in ["FAILED", "STOPPED"]:
+                    print(
+                        f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}"
+                    )
                     return None
                 else:
-                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
+                    print(
+                        f"Model registration task {task_id} is in state: {state}. Waiting..."
+                    )
                     time.sleep(interval)
             except Exception as ex:
                 print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
                 time.sleep(interval)
-        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
-        return None
\ No newline at end of file
+        print(
+            f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}"
+        )
+        return None
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
index 951e0f50..41707a29 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/OpenAIModel.py
@@ -4,15 +4,25 @@
 # compatible open source license.
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
+
 import json
-from colorama import Fore, Style
 import time
 
+from colorama import Fore, Style
+
+
 class OpenAIModel:
-    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+    def __init__(
+        self,
+        aws_region,
+        opensearch_domain_name,
+        opensearch_username,
+        opensearch_password,
+        iam_role_helper,
+    ):
         """
         Initializes the OpenAIModel with necessary configurations.
-        
+
         Args:
             aws_region (str): AWS region.
             opensearch_domain_name (str): OpenSearch domain name.
@@ -37,7 +47,7 @@ def register_openai_model(self, helper, config, save_config_method):
         """
         # Prompt for necessary inputs
         secret_name = input("Enter a name for the AWS Secrets Manager secret: ")
-        secret_key = 'openai_api_key'
+        secret_key = "openai_api_key"
         openai_api_key = input("Enter your OpenAI API key: ")
         secret_value = {secret_key: openai_api_key}
 
@@ -50,9 +60,7 @@ def register_openai_model(self, helper, config, save_config_method):
             "description": "Connector for OpenAI embedding model",
             "version": "1.0",
             "protocol": "http",
-            "parameters": {
-                "model": "text-embedding-ada-002"
-            },
+            "parameters": {"model": "text-embedding-ada-002"},
             "actions": [
                 {
                     "action_type": "predict",
@@ -60,13 +68,13 @@ def register_openai_model(self, helper, config, save_config_method):
                     "url": "https://api.openai.com/v1/embeddings",
                     "headers": {
                         "Authorization": f"Bearer ${{credential.secretArn.{secret_key}}}",
-                        "Content-Type": "application/json"
+                        "Content-Type": "application/json",
                     },
-                    "request_body": "{ \"input\": ${parameters.input}, \"model\": \"${parameters.model}\" }",
+                    "request_body": '{ "input": ${parameters.input}, "model": "${parameters.model}" }',
                     "pre_process_function": "connector.pre_process.openai.embedding",
-                    "post_process_function": "connector.post_process.openai.embedding"
+                    "post_process_function": "connector.post_process.openai.embedding",
                 }
-            ]
+            ],
         }
 
         # Get model details from user
@@ -81,7 +89,7 @@ def register_openai_model(self, helper, config, save_config_method):
             connector_role_name,
             create_connector_role_name,
             create_connector_input,
-            sleep_time_in_seconds=10
+            sleep_time_in_seconds=10,
         )
 
         if not connector_id:
@@ -89,20 +97,28 @@ def register_openai_model(self, helper, config, save_config_method):
             return
 
         # Register model
-        model_name = create_connector_input.get('name', 'OpenAI embedding model')
-        description = create_connector_input.get('description', 'OpenAI embedding model for semantic search')
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+        model_name = create_connector_input.get("name", "OpenAI embedding model")
+        description = create_connector_input.get(
+            "description", "OpenAI embedding model for semantic search"
+        )
+        model_id = helper.create_model(
+            model_name, description, connector_id, create_connector_role_name
+        )
 
         if not model_id:
             print(f"{Fore.RED}Failed to create model. Aborting.{Style.RESET_ALL}")
             return
 
         # Save model_id to config
-        config['embedding_model_id'] = model_id
+        config["embedding_model_id"] = model_id
         save_config_method(config)
-        print(f"{Fore.GREEN}OpenAI model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
+        print(
+            f"{Fore.GREEN}OpenAI model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}"
+        )
 
-    def register_openai_model_opensource(self, opensearch_client, config, save_config_method):
+    def register_openai_model_opensource(
+        self, opensearch_client, config, save_config_method
+    ):
         """
         Register an OpenAI embedding model in open-source OpenSearch.
 
@@ -116,24 +132,22 @@ def register_openai_model_opensource(self, opensearch_client, config, save_confi
             print(f"{Fore.RED}API key is required. Aborting.{Style.RESET_ALL}")
             return
 
-        print("\nDo you want to use the default configuration or provide custom settings?")
+        print(
+            "\nDo you want to use the default configuration or provide custom settings?"
+        )
         print("1. Use default configuration")
         print("2. Provide custom settings")
         config_choice = input("Enter your choice (1-2): ").strip()
 
-        if config_choice == '1':
+        if config_choice == "1":
             # Use default configurations
             connector_payload = {
                 "name": "OpenAI Embedding Connector",
                 "description": "Connector for OpenAI embedding model",
                 "version": "1",
                 "protocol": "http",
-                "parameters": {
-                    "model": "text-embedding-ada-002"
-                },
-                "credential": {
-                    "openAI_key": openai_api_key
-                },
+                "parameters": {"model": "text-embedding-ada-002"},
+                "credential": {"openAI_key": openai_api_key},
                 "actions": [
                     {
                         "action_type": "predict",
@@ -141,19 +155,19 @@ def register_openai_model_opensource(self, opensearch_client, config, save_confi
                         "url": "https://api.openai.com/v1/embeddings",
                         "headers": {
                             "Authorization": "Bearer ${credential.openAI_key}",
-                            "Content-Type": "application/json"
+                            "Content-Type": "application/json",
                         },
-                        "request_body": "{ \"input\": ${parameters.input}, \"model\": \"${parameters.model}\" }",
+                        "request_body": '{ "input": ${parameters.input}, "model": "${parameters.model}" }',
                         "pre_process_function": "connector.pre_process.openai.embedding",
-                        "post_process_function": "connector.post_process.openai.embedding"
+                        "post_process_function": "connector.post_process.openai.embedding",
                     }
-                ]
+                ],
             }
             model_group_payload = {
                 "name": f"openai_model_group_{int(time.time())}",
-                "description": "Model group for OpenAI models"
+                "description": "Model group for OpenAI models",
             }
-        elif config_choice == '2':
+        elif config_choice == "2":
             # Get custom configurations
             print("\nPlease enter your connector details as a JSON object.")
             connector_payload = self.get_custom_json_input()
@@ -165,7 +179,9 @@ def register_openai_model_opensource(self, opensearch_client, config, save_confi
             if not model_group_payload:
                 return
         else:
-            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}"
+            )
             return
 
         # Register the connector
@@ -173,13 +189,17 @@ def register_openai_model_opensource(self, opensearch_client, config, save_confi
             connector_response = opensearch_client.transport.perform_request(
                 method="POST",
                 url="/_plugins/_ml/connectors/_create",
-                body=connector_payload
+                body=connector_payload,
             )
-            connector_id = connector_response.get('connector_id')
+            connector_id = connector_response.get("connector_id")
             if not connector_id:
-                print(f"{Fore.RED}Failed to register connector. Response: {connector_response}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Failed to register connector. Response: {connector_response}{Style.RESET_ALL}"
+                )
                 return
-            print(f"{Fore.GREEN}Connector registered successfully. Connector ID: {connector_id}{Style.RESET_ALL}")
+            print(
+                f"{Fore.GREEN}Connector registered successfully. Connector ID: {connector_id}{Style.RESET_ALL}"
+            )
         except Exception as ex:
             print(f"{Fore.RED}Error registering connector: {ex}{Style.RESET_ALL}")
             return
@@ -189,55 +209,70 @@ def register_openai_model_opensource(self, opensearch_client, config, save_confi
             model_group_response = opensearch_client.transport.perform_request(
                 method="POST",
                 url="/_plugins/_ml/model_groups/_register",
-                body=model_group_payload
+                body=model_group_payload,
             )
-            model_group_id = model_group_response.get('model_group_id')
+            model_group_id = model_group_response.get("model_group_id")
             if not model_group_id:
-                print(f"{Fore.RED}Failed to create model group. Response: {model_group_response}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Failed to create model group. Response: {model_group_response}{Style.RESET_ALL}"
+                )
                 return
-            print(f"{Fore.GREEN}Model group created successfully. Model Group ID: {model_group_id}{Style.RESET_ALL}")
+            print(
+                f"{Fore.GREEN}Model group created successfully. Model Group ID: {model_group_id}{Style.RESET_ALL}"
+            )
         except Exception as ex:
             print(f"{Fore.RED}Error creating model group: {ex}{Style.RESET_ALL}")
-            if 'illegal_argument_exception' in str(ex) and 'already being used' in str(ex):
-                print(f"{Fore.YELLOW}A model group with this name already exists. Using the existing group.{Style.RESET_ALL}")
-                model_group_id = str(ex).split('ID: ')[-1].strip("'.")
+            if "illegal_argument_exception" in str(ex) and "already being used" in str(
+                ex
+            ):
+                print(
+                    f"{Fore.YELLOW}A model group with this name already exists. Using the existing group.{Style.RESET_ALL}"
+                )
+                model_group_id = str(ex).split("ID: ")[-1].strip("'.")
             else:
                 return
 
         # Create model payload
         model_payload = {
-            "name": connector_payload.get('name', 'OpenAI embedding model'),
+            "name": connector_payload.get("name", "OpenAI embedding model"),
             "function_name": "REMOTE",
             "model_group_id": model_group_id,
-            "description": connector_payload.get('description', 'OpenAI embedding model for semantic search'),
-            "connector_id": connector_id
+            "description": connector_payload.get(
+                "description", "OpenAI embedding model for semantic search"
+            ),
+            "connector_id": connector_id,
         }
 
         # Register the model
         try:
             response = opensearch_client.transport.perform_request(
-                method="POST",
-                url="/_plugins/_ml/models/_register",
-                body=model_payload
+                method="POST", url="/_plugins/_ml/models/_register", body=model_payload
             )
-            task_id = response.get('task_id')
+            task_id = response.get("task_id")
             if task_id:
-                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}"
+                )
                 # Wait for the task to complete and retrieve the model_id
                 model_id = self.wait_for_model_registration(opensearch_client, task_id)
                 if model_id:
                     # Deploy the model
-                    deploy_response = opensearch_client.transport.perform_request(
-                        method="POST",
-                        url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    opensearch_client.transport.perform_request(
+                        method="POST", url=f"/_plugins/_ml/models/{model_id}/_deploy"
+                    )
+                    print(
+                        f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}"
                     )
-                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {model_id}{Style.RESET_ALL}")
-                    config['embedding_model_id'] = model_id
+                    config["embedding_model_id"] = model_id
                     save_config_method(config)
                 else:
-                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+                    print(
+                        f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}"
+                    )
             else:
-                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}"
+                )
         except Exception as ex:
             print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
 
@@ -252,14 +287,16 @@ def get_custom_model_details(self, default_input):
         Returns:
             dict or None: Custom or default model configuration, or None if invalid input.
         """
-        print("\nDo you want to use the default configuration or provide custom model settings?")
+        print(
+            "\nDo you want to use the default configuration or provide custom model settings?"
+        )
         print("1. Use default configuration")
         print("2. Provide custom model settings")
         choice = input("Enter your choice (1-2): ").strip()
 
-        if choice == '1':
+        if choice == "1":
             return default_input
-        elif choice == '2':
+        elif choice == "2":
             print("Please enter your model details as a JSON object.")
             print("Example:")
             print(json.dumps(default_input, indent=2))
@@ -271,7 +308,9 @@ def get_custom_model_details(self, default_input):
                 print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
                 return None
         else:
-            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}"
+            )
             return None
 
     def get_custom_json_input(self):
@@ -283,7 +322,9 @@ def get_custom_json_input(self):
             print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
             return None
 
-    def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, interval=10):
+    def wait_for_model_registration(
+        self, opensearch_client, task_id, timeout=600, interval=10
+    ):
         """
         Wait for the model registration task to complete and return the model_id.
 
@@ -300,21 +341,26 @@ def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, i
         while time.time() < end_time:
             try:
                 response = opensearch_client.transport.perform_request(
-                    method="GET",
-                    url=f"/_plugins/_ml/tasks/{task_id}"
+                    method="GET", url=f"/_plugins/_ml/tasks/{task_id}"
                 )
-                state = response.get('state')
-                if state == 'COMPLETED':
-                    model_id = response.get('model_id')
+                state = response.get("state")
+                if state == "COMPLETED":
+                    model_id = response.get("model_id")
                     return model_id
-                elif state in ['FAILED', 'STOPPED']:
-                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
+                elif state in ["FAILED", "STOPPED"]:
+                    print(
+                        f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}"
+                    )
                     return None
                 else:
-                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
+                    print(
+                        f"Model registration task {task_id} is in state: {state}. Waiting..."
+                    )
                     time.sleep(interval)
             except Exception as ex:
                 print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
                 time.sleep(interval)
-        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
-        return None
\ No newline at end of file
+        print(
+            f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}"
+        )
+        return None
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/PyTorchModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/PyTorchModel.py
index 4485d2c0..98c1278f 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/PyTorchModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/PyTorchModel.py
@@ -5,15 +5,24 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 import json
-from colorama import Fore, Style
 import os
 import time
 
+from colorama import Fore, Style
+
+
 class CustomPyTorchModel:
-    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+    def __init__(
+        self,
+        aws_region,
+        opensearch_domain_name,
+        opensearch_username,
+        opensearch_password,
+        iam_role_helper,
+    ):
         """
         Initializes the CustomPyTorchModel with necessary configurations.
-        
+
         Args:
             aws_region (str): AWS region.
             opensearch_domain_name (str): OpenSearch domain name.
@@ -27,7 +36,9 @@ def __init__(self, aws_region, opensearch_domain_name, opensearch_username, open
         self.opensearch_password = opensearch_password
         self.iam_role_helper = iam_role_helper
 
-    def register_custom_pytorch_model(self, opensearch_client, config, save_config_method):
+    def register_custom_pytorch_model(
+        self, opensearch_client, config, save_config_method
+    ):
         """
         Register a custom PyTorch embedding model in open-source OpenSearch.
 
@@ -36,34 +47,44 @@ def register_custom_pytorch_model(self, opensearch_client, config, save_config_m
             config (dict): Configuration dictionary.
             save_config_method (function): Method to save the configuration.
         """
-        print("\nDo you want to use the default configuration or provide custom settings?")
+        print(
+            "\nDo you want to use the default configuration or provide custom settings?"
+        )
         print("1. Use default configuration")
         print("2. Provide custom settings")
         config_choice = input("Enter your choice (1-2): ").strip()
 
-        if config_choice == '1':
+        if config_choice == "1":
             # Use default configurations
-            model_path = input("Enter the path to your PyTorch model file (.pt or .pth): ").strip()
+            model_path = input(
+                "Enter the path to your PyTorch model file (.pt or .pth): "
+            ).strip()
             if not os.path.isfile(model_path):
-                print(f"{Fore.RED}Model file not found at '{model_path}'. Aborting.{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Model file not found at '{model_path}'. Aborting.{Style.RESET_ALL}"
+                )
                 return
 
-            model_name = os.path.basename(model_path).split('.')[0]
+            model_name = os.path.basename(model_path).split(".")[0]
             model_payload = {
                 "name": f"custom_pytorch_{model_name}",
                 "model_format": "TORCH_SCRIPT",
                 "model_config": {
-                    "embedding_dimension": config.get('embedding_dimension', 768),
+                    "embedding_dimension": config.get("embedding_dimension", 768),
                     "framework_type": "CUSTOM",
-                    "model_type": "bert"
+                    "model_type": "bert",
                 },
-                "description": f"Custom PyTorch model: {model_name}"
+                "description": f"Custom PyTorch model: {model_name}",
             }
-        elif config_choice == '2':
+        elif config_choice == "2":
             # Get custom configurations
-            model_path = input("Enter the path to your PyTorch model file (.pt or .pth): ").strip()
+            model_path = input(
+                "Enter the path to your PyTorch model file (.pt or .pth): "
+            ).strip()
             if not os.path.isfile(model_path):
-                print(f"{Fore.RED}Model file not found at '{model_path}'. Aborting.{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Model file not found at '{model_path}'. Aborting.{Style.RESET_ALL}"
+                )
                 return
 
             print("\nPlease enter your model details as a JSON object.")
@@ -72,71 +93,85 @@ def register_custom_pytorch_model(self, opensearch_client, config, save_config_m
                 "name": "custom_pytorch_model",
                 "model_format": "TORCH_SCRIPT",
                 "model_config": {
-                    "embedding_dimension": config.get('embedding_dimension', 768),
+                    "embedding_dimension": config.get("embedding_dimension", 768),
                     "framework_type": "CUSTOM",
-                    "model_type": "bert"
+                    "model_type": "bert",
                 },
-                "description": "Custom PyTorch model for semantic search"
+                "description": "Custom PyTorch model for semantic search",
             }
             print(json.dumps(example_payload, indent=2))
-            
+
             model_payload = self.get_custom_json_input()
             if not model_payload:
                 return
         else:
-            print(f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Invalid choice. Aborting model registration.{Style.RESET_ALL}"
+            )
             return
 
         # Upload the model file to OpenSearch
         try:
-            with open(model_path, 'rb') as f:
+            with open(model_path, "rb") as f:
                 model_content = f.read()
 
             # Use the ML plugin's model upload API
             upload_response = opensearch_client.transport.perform_request(
                 method="POST",
                 url="/_plugins/_ml/models/_upload",
-                params={"model_name": model_payload['name']},
+                params={"model_name": model_payload["name"]},
                 body=model_content,
-                headers={'Content-Type': 'application/octet-stream'}
+                headers={"Content-Type": "application/octet-stream"},
             )
-            if 'model_id' not in upload_response:
-                print(f"{Fore.RED}Failed to upload model. Response: {upload_response}{Style.RESET_ALL}")
+            if "model_id" not in upload_response:
+                print(
+                    f"{Fore.RED}Failed to upload model. Response: {upload_response}{Style.RESET_ALL}"
+                )
                 return
-            model_id = upload_response['model_id']
-            print(f"{Fore.GREEN}Model uploaded successfully. Model ID: {model_id}{Style.RESET_ALL}")
+            model_id = upload_response["model_id"]
+            print(
+                f"{Fore.GREEN}Model uploaded successfully. Model ID: {model_id}{Style.RESET_ALL}"
+            )
         except Exception as ex:
             print(f"{Fore.RED}Error uploading model: {ex}{Style.RESET_ALL}")
             return
 
         # Add the model_id to the payload
-        model_payload['model_id'] = model_id
+        model_payload["model_id"] = model_id
 
         # Register the model
         try:
             response = opensearch_client.transport.perform_request(
-                method="POST",
-                url="/_plugins/_ml/models/_register",
-                body=model_payload
+                method="POST", url="/_plugins/_ml/models/_register", body=model_payload
             )
-            task_id = response.get('task_id')
+            task_id = response.get("task_id")
             if task_id:
-                print(f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.GREEN}Model registration initiated. Task ID: {task_id}{Style.RESET_ALL}"
+                )
                 # Wait for the task to complete and retrieve the model_id
-                registered_model_id = self.wait_for_model_registration(opensearch_client, task_id)
+                registered_model_id = self.wait_for_model_registration(
+                    opensearch_client, task_id
+                )
                 if registered_model_id:
                     # Deploy the model
-                    deploy_response = opensearch_client.transport.perform_request(
+                    opensearch_client.transport.perform_request(
                         method="POST",
-                        url=f"/_plugins/_ml/models/{registered_model_id}/_deploy"
+                        url=f"/_plugins/_ml/models/{registered_model_id}/_deploy",
+                    )
+                    print(
+                        f"{Fore.GREEN}Model deployed successfully. Model ID: {registered_model_id}{Style.RESET_ALL}"
                     )
-                    print(f"{Fore.GREEN}Model deployed successfully. Model ID: {registered_model_id}{Style.RESET_ALL}")
-                    config['embedding_model_id'] = registered_model_id
+                    config["embedding_model_id"] = registered_model_id
                     save_config_method(config)
                 else:
-                    print(f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}")
+                    print(
+                        f"{Fore.RED}Model registration failed or timed out.{Style.RESET_ALL}"
+                    )
             else:
-                print(f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Failed to initiate model registration. Response: {response}{Style.RESET_ALL}"
+                )
         except Exception as ex:
             print(f"{Fore.RED}Error registering model: {ex}{Style.RESET_ALL}")
 
@@ -149,7 +184,9 @@ def get_custom_json_input(self):
             print(f"{Fore.RED}Invalid JSON input: {e}{Style.RESET_ALL}")
             return None
 
-    def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, interval=10):
+    def wait_for_model_registration(
+        self, opensearch_client, task_id, timeout=600, interval=10
+    ):
         """
         Wait for the model registration task to complete and return the model_id.
 
@@ -166,21 +203,26 @@ def wait_for_model_registration(self, opensearch_client, task_id, timeout=600, i
         while time.time() < end_time:
             try:
                 response = opensearch_client.transport.perform_request(
-                    method="GET",
-                    url=f"/_plugins/_ml/tasks/{task_id}"
+                    method="GET", url=f"/_plugins/_ml/tasks/{task_id}"
                 )
-                state = response.get('state')
-                if state == 'COMPLETED':
-                    model_id = response.get('model_id')
+                state = response.get("state")
+                if state == "COMPLETED":
+                    model_id = response.get("model_id")
                     return model_id
-                elif state in ['FAILED', 'STOPPED']:
-                    print(f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}")
+                elif state in ["FAILED", "STOPPED"]:
+                    print(
+                        f"{Fore.RED}Model registration task {task_id} failed with state: {state}{Style.RESET_ALL}"
+                    )
                     return None
                 else:
-                    print(f"Model registration task {task_id} is in state: {state}. Waiting...")
+                    print(
+                        f"Model registration task {task_id} is in state: {state}. Waiting..."
+                    )
                     time.sleep(interval)
             except Exception as ex:
                 print(f"{Fore.RED}Error checking task status: {ex}{Style.RESET_ALL}")
                 time.sleep(interval)
-        print(f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}")
-        return None
\ No newline at end of file
+        print(
+            f"{Fore.RED}Timed out waiting for model registration to complete.{Style.RESET_ALL}"
+        )
+        return None
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
index 60252e66..353e4567 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/SageMakerModel.py
@@ -4,14 +4,22 @@
 # compatible open source license.
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
-import json
+
 from colorama import Fore, Style
 
+
 class SageMakerModel:
-    def __init__(self, aws_region, opensearch_domain_name, opensearch_username, opensearch_password, iam_role_helper):
+    def __init__(
+        self,
+        aws_region,
+        opensearch_domain_name,
+        opensearch_username,
+        opensearch_password,
+        iam_role_helper,
+    ):
         """
         Initializes the SageMakerModel with necessary configurations.
-        
+
         Args:
             aws_region (str): AWS region.
             opensearch_domain_name (str): OpenSearch domain name.
@@ -35,9 +43,16 @@ def register_sagemaker_model(self, helper, config, save_config_method):
             save_config_method (function): Method to save the configuration.
         """
         # Prompt for necessary inputs
-        sagemaker_endpoint_arn = input("Enter your SageMaker inference endpoint ARN: ").strip()
-        sagemaker_endpoint_url = input("Enter your SageMaker inference endpoint URL: ").strip()
-        sagemaker_region = input(f"Enter your SageMaker region [{self.aws_region}]: ").strip() or self.aws_region
+        sagemaker_endpoint_arn = input(
+            "Enter your SageMaker inference endpoint ARN: "
+        ).strip()
+        sagemaker_endpoint_url = input(
+            "Enter your SageMaker inference endpoint URL: "
+        ).strip()
+        sagemaker_region = (
+            input(f"Enter your SageMaker region [{self.aws_region}]: ").strip()
+            or self.aws_region
+        )
         connector_role_name = "my_test_sagemaker_connector_role"
         create_connector_role_name = "my_test_create_sagemaker_connector_role"
 
@@ -48,9 +63,9 @@ def register_sagemaker_model(self, helper, config, save_config_method):
                 {
                     "Action": ["sagemaker:InvokeEndpoint"],
                     "Effect": "Allow",
-                    "Resource": sagemaker_endpoint_arn
+                    "Resource": sagemaker_endpoint_arn,
                 }
-            ]
+            ],
         }
 
         # Create connector input
@@ -59,23 +74,18 @@ def register_sagemaker_model(self, helper, config, save_config_method):
             "description": "Connector for SageMaker embedding model",
             "version": "1.0",
             "protocol": "aws_sigv4",
-            "parameters": {
-                "region": sagemaker_region,
-                "service_name": "sagemaker"
-            },
+            "parameters": {"region": sagemaker_region, "service_name": "sagemaker"},
             "actions": [
                 {
                     "action_type": "predict",
                     "method": "POST",
-                    "headers": {
-                        "Content-Type": "application/json"
-                    },
+                    "headers": {"Content-Type": "application/json"},
                     "url": sagemaker_endpoint_url,
                     "request_body": "${parameters.input}",
                     "pre_process_function": "connector.pre_process.default.embedding",
-                    "post_process_function": "connector.post_process.default.embedding"
+                    "post_process_function": "connector.post_process.default.embedding",
                 }
-            ]
+            ],
         }
 
         # Create connector
@@ -84,23 +94,31 @@ def register_sagemaker_model(self, helper, config, save_config_method):
             connector_role_name,
             create_connector_role_name,
             create_connector_input,
-            sleep_time_in_seconds=10
+            sleep_time_in_seconds=10,
         )
 
         if not connector_id:
-            print(f"{Fore.RED}Failed to create SageMaker connector. Aborting.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Failed to create SageMaker connector. Aborting.{Style.RESET_ALL}"
+            )
             return
 
         # Register model
         model_name = "SageMaker Embedding Model"
         description = "SageMaker embedding model for semantic search"
-        model_id = helper.create_model(model_name, description, connector_id, create_connector_role_name)
+        model_id = helper.create_model(
+            model_name, description, connector_id, create_connector_role_name
+        )
 
         if not model_id:
-            print(f"{Fore.RED}Failed to create SageMaker model. Aborting.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Failed to create SageMaker model. Aborting.{Style.RESET_ALL}"
+            )
             return
 
         # Save model_id to config
-        config['embedding_model_id'] = model_id
+        config["embedding_model_id"] = model_id
         save_config_method(config)
-        print(f"{Fore.GREEN}SageMaker model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}")
\ No newline at end of file
+        print(
+            f"{Fore.GREEN}SageMaker model registered successfully. Model ID '{model_id}' saved in configuration.{Style.RESET_ALL}"
+        )
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/__init__.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/__init__.py
index 43d9d3f4..3a3fa0f8 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/__init__.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/ml_models/__init__.py
@@ -3,4 +3,11 @@
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
 # Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
\ No newline at end of file
+# GitHub history for details.
+
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
index c442e98b..02fae550 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/model_register.py
@@ -6,20 +6,31 @@
 # GitHub history for details.
 
 
-import os
-import json
+import sys
 import time
+
 import boto3
-from urllib.parse import urlparse
 from colorama import Fore, Style, init
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import AIConnectorHelper
+
 from opensearch_py_ml.ml_commons.IAMRoleHelper import IAMRoleHelper
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.BedrockModel import BedrockModel
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.OpenAIModel import OpenAIModel
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.CohereModel import CohereModel
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.HuggingFaceModel import HuggingFaceModel
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.PyTorchModel import CustomPyTorchModel
-import sys
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import (
+    AIConnectorHelper,
+)
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.BedrockModel import (
+    BedrockModel,
+)
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.CohereModel import (
+    CohereModel,
+)
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.HuggingFaceModel import (
+    HuggingFaceModel,
+)
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.OpenAIModel import (
+    OpenAIModel,
+)
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.PyTorchModel import (
+    CustomPyTorchModel,
+)
 
 # Initialize colorama for colored terminal output
 init(autoreset=True)
@@ -40,15 +51,15 @@ def __init__(self, config, opensearch_client, opensearch_domain_name):
         :param opensearch_domain_name: Name of the OpenSearch domain.
         """
         self.config = config
-        self.aws_region = config.get('region')
+        self.aws_region = config.get("region")
         self.opensearch_client = opensearch_client
         self.opensearch_domain_name = opensearch_domain_name
-        self.opensearch_endpoint = config.get('opensearch_endpoint')
-        self.opensearch_username = config.get('opensearch_username')
-        self.opensearch_password = config.get('opensearch_password')
-        self.iam_principal = config.get('iam_principal')
-        self.embedding_dimension = int(config.get('embedding_dimension', 768))
-        self.service_type = config.get('service_type', 'managed')
+        self.opensearch_endpoint = config.get("opensearch_endpoint")
+        self.opensearch_username = config.get("opensearch_username")
+        self.opensearch_password = config.get("opensearch_password")
+        self.iam_principal = config.get("iam_principal")
+        self.embedding_dimension = int(config.get("embedding_dimension", 768))
+        self.service_type = config.get("service_type", "managed")
 
         # Initialize IAMRoleHelper with necessary parameters
         self.iam_role_helper = IAMRoleHelper(
@@ -56,11 +67,11 @@ def __init__(self, config, opensearch_client, opensearch_domain_name):
             self.opensearch_domain_name,
             self.opensearch_username,
             self.opensearch_password,
-            self.iam_principal
+            self.iam_principal,
         )
 
         # Initialize AWS clients if the service type is not open-source
-        if self.service_type != 'open-source':
+        if self.service_type != "open-source":
             self.initialize_clients()
 
         # Initialize instances of different model providers
@@ -69,35 +80,35 @@ def __init__(self, config, opensearch_client, opensearch_domain_name):
             opensearch_domain_name=self.opensearch_domain_name,
             opensearch_username=self.opensearch_username,
             opensearch_password=self.opensearch_password,
-            iam_role_helper=self.iam_role_helper
+            iam_role_helper=self.iam_role_helper,
         )
         self.openai_model = OpenAIModel(
             aws_region=self.aws_region,
             opensearch_domain_name=self.opensearch_domain_name,
             opensearch_username=self.opensearch_username,
             opensearch_password=self.opensearch_password,
-            iam_role_helper=self.iam_role_helper
+            iam_role_helper=self.iam_role_helper,
         )
         self.cohere_model = CohereModel(
             aws_region=self.aws_region,
             opensearch_domain_name=self.opensearch_domain_name,
             opensearch_username=self.opensearch_username,
             opensearch_password=self.opensearch_password,
-            iam_role_helper=self.iam_role_helper
+            iam_role_helper=self.iam_role_helper,
         )
         self.huggingface_model = HuggingFaceModel(
             aws_region=self.aws_region,
             opensearch_domain_name=self.opensearch_domain_name,
             opensearch_username=self.opensearch_username,
             opensearch_password=self.opensearch_password,
-            iam_role_helper=self.iam_role_helper
+            iam_role_helper=self.iam_role_helper,
         )
         self.custom_pytorch_model = CustomPyTorchModel(
             aws_region=self.aws_region,
             opensearch_domain_name=self.opensearch_domain_name,
             opensearch_username=self.opensearch_username,
             opensearch_password=self.opensearch_password,
-            iam_role_helper=self.iam_role_helper
+            iam_role_helper=self.iam_role_helper,
         )
 
     def initialize_clients(self) -> bool:
@@ -106,10 +117,12 @@ def initialize_clients(self) -> bool:
 
         :return: True if clients are initialized successfully, False otherwise.
         """
-        if self.service_type in ['managed', 'serverless']:
+        if self.service_type in ["managed", "serverless"]:
             try:
                 # Initialize Bedrock client for managed services
-                self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
+                self.bedrock_client = boto3.client(
+                    "bedrock-runtime", region_name=self.aws_region
+                )
                 # Add any other clients initialization if needed
                 time.sleep(7)  # Wait for client initialization
                 print("AWS clients initialized successfully.")
@@ -130,19 +143,25 @@ def prompt_model_registration(self):
         print("2. Use an existing embedding model ID")
         choice = input("Enter your choice (1-2): ").strip()
 
-        if choice == '1':
+        if choice == "1":
             self.register_model_interactive()
-        elif choice == '2':
+        elif choice == "2":
             model_id = input("Please enter your existing embedding model ID: ").strip()
             if model_id:
-                self.config['embedding_model_id'] = model_id
+                self.config["embedding_model_id"] = model_id
                 self.save_config(self.config)
-                print(f"{Fore.GREEN}Model ID '{model_id}' saved successfully in configuration.{Style.RESET_ALL}")
+                print(
+                    f"{Fore.GREEN}Model ID '{model_id}' saved successfully in configuration.{Style.RESET_ALL}"
+                )
             else:
-                print(f"{Fore.RED}No model ID provided. Cannot proceed without an embedding model.{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}No model ID provided. Cannot proceed without an embedding model.{Style.RESET_ALL}"
+                )
                 sys.exit(1)  # Exit the setup as we cannot proceed without a model ID
         else:
-            print(f"{Fore.RED}Invalid choice. Please run setup again and select a valid option.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Invalid choice. Please run setup again and select a valid option.{Style.RESET_ALL}"
+            )
             sys.exit(1)  # Exit the setup as we cannot proceed without a valid choice
 
     def save_config(self, config):
@@ -152,9 +171,10 @@ def save_config(self, config):
         :param config: Configuration dictionary to save.
         """
         import configparser
+
         parser = configparser.ConfigParser()
-        parser['DEFAULT'] = config
-        with open('config.ini', 'w') as f:
+        parser["DEFAULT"] = config
+        with open("config.ini", "w") as f:
             parser.write(f)
 
     def register_model_interactive(self):
@@ -163,16 +183,22 @@ def register_model_interactive(self):
         """
         # Initialize clients
         if not self.initialize_clients():
-            print(f"{Fore.RED}Failed to initialize AWS clients. Cannot proceed.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Failed to initialize AWS clients. Cannot proceed.{Style.RESET_ALL}"
+            )
             return
 
         # Ensure opensearch_endpoint is set
-        if not self.config.get('opensearch_endpoint'):
-            print(f"{Fore.RED}OpenSearch endpoint not set. Please run 'setup' command first.{Style.RESET_ALL}")
+        if not self.config.get("opensearch_endpoint"):
+            print(
+                f"{Fore.RED}OpenSearch endpoint not set. Please run 'setup' command first.{Style.RESET_ALL}"
+            )
             return
 
         # Extract the IAM user name from the IAM principal ARN
-        aws_user_name = self.iam_role_helper.get_iam_user_name_from_arn(self.iam_principal)
+        aws_user_name = self.iam_role_helper.get_iam_user_name_from_arn(
+            self.iam_principal
+        )
 
         if not aws_user_name:
             print("Could not extract IAM user name from IAM principal ARN.")
@@ -187,7 +213,7 @@ def register_model_interactive(self):
             opensearch_domain_password=self.opensearch_password,
             aws_user_name=aws_user_name,
             aws_role_name=None,  # Set to None or provide if applicable
-            opensearch_domain_url=self.opensearch_endpoint  # Pass the endpoint from config
+            opensearch_domain_url=self.opensearch_endpoint,  # Pass the endpoint from config
         )
 
         # Prompt user to select a model
@@ -200,30 +226,50 @@ def register_model_interactive(self):
         model_choice = input("Enter your choice (1-5): ")
 
         # Call the appropriate method based on the user's choice
-        if model_choice == '1':
-            self.bedrock_model.register_bedrock_model(helper, self.config, self.save_config)
-        elif model_choice == '2':
-            if self.service_type != 'open-source':
-                self.openai_model.register_openai_model(helper, self.config, self.save_config)
+        if model_choice == "1":
+            self.bedrock_model.register_bedrock_model(
+                helper, self.config, self.save_config
+            )
+        elif model_choice == "2":
+            if self.service_type != "open-source":
+                self.openai_model.register_openai_model(
+                    helper, self.config, self.save_config
+                )
             else:
-                self.openai_model.register_openai_model_opensource(self.opensearch_client, self.config, self.save_config)
-        elif model_choice == '3':
-            if self.service_type != 'open-source':
-                self.cohere_model.register_cohere_model(helper, self.config, self.save_config)
+                self.openai_model.register_openai_model_opensource(
+                    self.opensearch_client, self.config, self.save_config
+                )
+        elif model_choice == "3":
+            if self.service_type != "open-source":
+                self.cohere_model.register_cohere_model(
+                    helper, self.config, self.save_config
+                )
             else:
-                self.cohere_model.register_cohere_model_opensource(self.opensearch_client, self.config, self.save_config)
-        elif model_choice == '4':
-            if self.service_type != 'open-source':
-                print(f"{Fore.RED}Hugging Face Transformers models are only supported in open-source OpenSearch.{Style.RESET_ALL}")
+                self.cohere_model.register_cohere_model_opensource(
+                    self.opensearch_client, self.config, self.save_config
+                )
+        elif model_choice == "4":
+            if self.service_type != "open-source":
+                print(
+                    f"{Fore.RED}Hugging Face Transformers models are only supported in open-source OpenSearch.{Style.RESET_ALL}"
+                )
             else:
-                self.huggingface_model.register_huggingface_model(self.opensearch_client, self.config, self.save_config)
-        elif model_choice == '5':
-            if self.service_type != 'open-source':
-                print(f"{Fore.RED}Custom PyTorch models are only supported in open-source OpenSearch.{Style.RESET_ALL}")
+                self.huggingface_model.register_huggingface_model(
+                    self.opensearch_client, self.config, self.save_config
+                )
+        elif model_choice == "5":
+            if self.service_type != "open-source":
+                print(
+                    f"{Fore.RED}Custom PyTorch models are only supported in open-source OpenSearch.{Style.RESET_ALL}"
+                )
             else:
-                self.custom_pytorch_model.register_custom_pytorch_model(self.opensearch_client, self.config, self.save_config)
+                self.custom_pytorch_model.register_custom_pytorch_model(
+                    self.opensearch_client, self.config, self.save_config
+                )
         else:
-            print(f"{Fore.RED}Invalid choice. Exiting model registration.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Invalid choice. Exiting model registration.{Style.RESET_ALL}"
+            )
             return
 
     def prompt_opensource_model_registration(self):
@@ -235,12 +281,16 @@ def prompt_opensource_model_registration(self):
         print("2. No, I will register the model later")
         choice = input("Enter your choice (1-2): ").strip()
 
-        if choice == '1':
+        if choice == "1":
             self.register_model_opensource_interactive()
-        elif choice == '2':
-            print("Skipping model registration. You can register models later using the appropriate commands.")
+        elif choice == "2":
+            print(
+                "Skipping model registration. You can register models later using the appropriate commands."
+            )
         else:
-            print(f"{Fore.RED}Invalid choice. Skipping model registration.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Invalid choice. Skipping model registration.{Style.RESET_ALL}"
+            )
 
     def register_model_opensource_interactive(self):
         """
@@ -248,7 +298,9 @@ def register_model_opensource_interactive(self):
         """
         # Ensure OpenSearch client is initialized
         if not self.opensearch_client:
-            print(f"{Fore.RED}OpenSearch client is not initialized. Please run setup again.{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}OpenSearch client is not initialized. Please run setup again.{Style.RESET_ALL}"
+            )
             return
 
         # Prompt user to select a model
@@ -259,14 +311,24 @@ def register_model_opensource_interactive(self):
         print("4. Custom PyTorch Model")
         model_choice = input("Enter your choice (1-4): ")
 
-        if model_choice == '1':
-            self.openai_model.register_openai_model_opensource(self.opensearch_client, self.config, self.save_config)
-        elif model_choice == '2':
-            self.cohere_model.register_cohere_model_opensource(self.opensearch_client, self.config, self.save_config)
-        elif model_choice == '3':
-            self.huggingface_model.register_huggingface_model(self.opensearch_client, self.config, self.save_config)
-        elif model_choice == '4':
-            self.custom_pytorch_model.register_custom_pytorch_model(self.opensearch_client, self.config, self.save_config)
+        if model_choice == "1":
+            self.openai_model.register_openai_model_opensource(
+                self.opensearch_client, self.config, self.save_config
+            )
+        elif model_choice == "2":
+            self.cohere_model.register_cohere_model_opensource(
+                self.opensearch_client, self.config, self.save_config
+            )
+        elif model_choice == "3":
+            self.huggingface_model.register_huggingface_model(
+                self.opensearch_client, self.config, self.save_config
+            )
+        elif model_choice == "4":
+            self.custom_pytorch_model.register_custom_pytorch_model(
+                self.opensearch_client, self.config, self.save_config
+            )
         else:
-            print(f"{Fore.RED}Invalid choice. Exiting model registration.{Style.RESET_ALL}")
-            return
\ No newline at end of file
+            print(
+                f"{Fore.RED}Invalid choice. Exiting model registration.{Style.RESET_ALL}"
+            )
+            return
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
index 912720e5..20399b4d 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/opensearch_connector.py
@@ -5,9 +5,11 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth, exceptions as opensearch_exceptions
-import boto3
 from urllib.parse import urlparse
+
+import boto3
+from opensearchpy import AWSV4SignerAuth, OpenSearch, RequestsHttpConnection
+from opensearchpy import exceptions as opensearch_exceptions
 from opensearchpy import helpers as opensearch_helpers
 
 
@@ -26,13 +28,13 @@ def __init__(self, config):
         # Store the configuration
         self.config = config
         self.opensearch_client = None
-        self.aws_region = config.get('region')
-        self.index_name = config.get('index_name')
-        self.is_serverless = config.get('is_serverless', 'False') == 'True'
-        self.opensearch_endpoint = config.get('opensearch_endpoint')
-        self.opensearch_username = config.get('opensearch_username')
-        self.opensearch_password = config.get('opensearch_password')
-        self.service_type = config.get('service_type')
+        self.aws_region = config.get("region")
+        self.index_name = config.get("index_name")
+        self.is_serverless = config.get("is_serverless", "False") == "True"
+        self.opensearch_endpoint = config.get("opensearch_endpoint")
+        self.opensearch_username = config.get("opensearch_username")
+        self.opensearch_password = config.get("opensearch_password")
+        self.service_type = config.get("service_type")
 
     def initialize_opensearch_client(self) -> bool:
         """
@@ -48,20 +50,24 @@ def initialize_opensearch_client(self) -> bool:
         # Parse the OpenSearch endpoint URL
         parsed_url = urlparse(self.opensearch_endpoint)
         host = parsed_url.hostname
-        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200)  # Default ports
+        port = parsed_url.port or (
+            443 if parsed_url.scheme == "https" else 9200
+        )  # Default ports
 
         # Determine the authentication method based on the service type
-        if self.service_type == 'serverless':
+        if self.service_type == "serverless":
             # Use AWS V4 Signer Authentication for serverless
             credentials = boto3.Session().get_credentials()
-            auth = AWSV4SignerAuth(credentials, self.aws_region, 'aoss')
-        elif self.service_type == 'managed':
+            auth = AWSV4SignerAuth(credentials, self.aws_region, "aoss")
+        elif self.service_type == "managed":
             # Use basic authentication for managed services
             if not self.opensearch_username or not self.opensearch_password:
-                print("OpenSearch username or password not set. Please run setup first.")
+                print(
+                    "OpenSearch username or password not set. Please run setup first."
+                )
                 return False
             auth = (self.opensearch_username, self.opensearch_password)
-        elif self.service_type == 'open-source':
+        elif self.service_type == "open-source":
             # Use basic authentication if credentials are provided, else no authentication
             if self.opensearch_username and self.opensearch_password:
                 auth = (self.opensearch_username, self.opensearch_password)
@@ -73,20 +79,22 @@ def initialize_opensearch_client(self) -> bool:
             return False
 
         # Determine SSL settings based on the endpoint scheme
-        use_ssl = parsed_url.scheme == 'https'
-        verify_certs = True  # Always verify certificates unless you have a specific reason not to
+        use_ssl = parsed_url.scheme == "https"
+        verify_certs = (
+            True  # Always verify certificates unless you have a specific reason not to
+        )
 
         try:
             # Initialize the OpenSearch client
             self.opensearch_client = OpenSearch(
-                hosts=[{'host': host, 'port': port}],
+                hosts=[{"host": host, "port": port}],
                 http_auth=auth,
                 use_ssl=use_ssl,
                 verify_certs=verify_certs,
-                ssl_show_warn=False,          # Suppress SSL warnings
+                ssl_show_warn=False,  # Suppress SSL warnings
                 # ssl_context=ssl_context,      # Not needed unless you have custom certificates
                 connection_class=RequestsHttpConnection,
-                pool_maxsize=20
+                pool_maxsize=20,
             )
             print(f"Initialized OpenSearch client with host: {host} and port: {port}")
             return True
@@ -95,19 +103,26 @@ def initialize_opensearch_client(self) -> bool:
             print(f"Error initializing OpenSearch client: {ex}")
             return False
 
-
-    def create_index(self, embedding_dimension: int, space_type: str, ef_construction: int,
-                    number_of_shards: int, number_of_replicas: int,
-                    passage_text_field: str, passage_chunk_field: str, embedding_field: str):
+    def create_index(
+        self,
+        embedding_dimension: int,
+        space_type: str,
+        ef_construction: int,
+        number_of_shards: int,
+        number_of_replicas: int,
+        passage_text_field: str,
+        passage_chunk_field: str,
+        embedding_field: str,
+    ):
         """
-            Create a KNN index in OpenSearch with the specified parameters.
+        Create a KNN index in OpenSearch with the specified parameters.
 
-            :param embedding_dimension: The dimension of the embedding vectors.
-            :param space_type: The space type for the KNN algorithm (e.g., 'cosinesimil', 'l2').
-            :param ef_construction: ef_construction parameter for KNN
-            :param number_of_shards: Number of shards for the index
-            :param number_of_replicas: Number of replicas for the index
-            :param nominee_text_field: Field name for nominee text
+        :param embedding_dimension: The dimension of the embedding vectors.
+        :param space_type: The space type for the KNN algorithm (e.g., 'cosinesimil', 'l2').
+        :param ef_construction: ef_construction parameter for KNN
+        :param number_of_shards: Number of shards for the index
+        :param number_of_replicas: Number of replicas for the index
+        :param nominee_text_field: Field name for nominee text
         """
         # Define the index mapping and settings
         index_body = {
@@ -120,10 +135,10 @@ def create_index(self, embedding_dimension: int, space_type: str, ef_constructio
                         "properties": {
                             "knn": {
                                 "type": "knn_vector",
-                                "dimension": embedding_dimension
+                                "dimension": embedding_dimension,
                             }
-                        }
-                    }
+                        },
+                    },
                 }
             },
             "settings": {
@@ -138,8 +153,12 @@ def create_index(self, embedding_dimension: int, space_type: str, ef_constructio
 
         try:
             # Attempt to create the index
-            self.opensearch_client.indices.create(index=self.index_name, body=index_body)
-            print(f"KNN index '{self.index_name}' created successfully with the following settings:")
+            self.opensearch_client.indices.create(
+                index=self.index_name, body=index_body
+            )
+            print(
+                f"KNN index '{self.index_name}' created successfully with the following settings:"
+            )
             print(f"Embedding Dimension: {embedding_dimension}")
             print(f"Space Type: {space_type}")
             print(f"ef_construction: {ef_construction}")
@@ -150,15 +169,23 @@ def create_index(self, embedding_dimension: int, space_type: str, ef_constructio
             print(f"Embedding Field: '{embedding_field}'")
         except opensearch_exceptions.RequestError as e:
             # Handle cases where the index already exists
-            if 'resource_already_exists_exception' in str(e).lower():
+            if "resource_already_exists_exception" in str(e).lower():
                 print(f"Index '{self.index_name}' already exists.")
             else:
                 # Handle other index creation errors
                 print(f"Error creating index '{self.index_name}': {e}")
 
-    def verify_and_create_index(self, embedding_dimension: int, space_type: str, ef_construction: int,
-                                number_of_shards: int, number_of_replicas: int,
-                                passage_text_field: str, passage_chunk_field: str, embedding_field: str) -> bool:
+    def verify_and_create_index(
+        self,
+        embedding_dimension: int,
+        space_type: str,
+        ef_construction: int,
+        number_of_shards: int,
+        number_of_replicas: int,
+        passage_text_field: str,
+        passage_chunk_field: str,
+        embedding_field: str,
+    ) -> bool:
         """
         Verify if the index exists; if not, create it.
 
@@ -177,8 +204,16 @@ def verify_and_create_index(self, embedding_dimension: int, space_type: str, ef_
                 print(f"KNN index '{self.index_name}' already exists.")
             else:
                 # Create the index if it doesn't exist
-                self.create_index(embedding_dimension, space_type, ef_construction,
-                                number_of_shards, number_of_replicas, passage_text_field, passage_chunk_field, embedding_field)
+                self.create_index(
+                    embedding_dimension,
+                    space_type,
+                    ef_construction,
+                    number_of_shards,
+                    number_of_replicas,
+                    passage_text_field,
+                    passage_chunk_field,
+                    embedding_field,
+                )
             return True
         except Exception as ex:
             # Handle errors during verification or creation
@@ -194,9 +229,13 @@ def bulk_index(self, actions: list) -> tuple:
         """
         try:
             # Execute bulk indexing using OpenSearch helpers
-            success_count, error_info = opensearch_helpers.bulk(self.opensearch_client, actions)
+            success_count, error_info = opensearch_helpers.bulk(
+                self.opensearch_client, actions
+            )
             error_count = len(error_info)
-            print(f"Indexed {success_count} documents successfully. Failed to index {error_count} documents.")
+            print(
+                f"Indexed {success_count} documents successfully. Failed to index {error_count} documents."
+            )
             return success_count, error_count
         except Exception as e:
             # Handle bulk indexing errors
@@ -207,7 +246,7 @@ def search(self, query_text: str, model_id: str, k: int = 5) -> list:
         """
         Perform a neural search based on the query text and model ID.
         """
-        embedding_field = self.config.get('embedding_field', 'passage_embedding')
+        embedding_field = self.config.get("embedding_field", "passage_embedding")
 
         try:
             # Execute the search query using nested query
@@ -225,15 +264,15 @@ def search(self, query_text: str, model_id: str, k: int = 5) -> list:
                                     f"{embedding_field}.knn": {
                                         "query_text": query_text,
                                         "model_id": model_id,
-                                        "k": k
+                                        "k": k,
                                     }
                                 }
-                            }
+                            },
                         }
-                    }
-                }
+                    },
+                },
             )
-            return response['hits']['hits']
+            return response["hits"]["hits"]
         except Exception as e:
             # Handle search errors
             print(f"Error during search: {e}")
@@ -263,9 +302,9 @@ def search_by_vector(self, vector: list, k: int = 5) -> list:
         :return: A list of search hits.
         """
         # Retrieve field names from the config
-        embedding_field = self.config.get('embedding_field', 'passage_embedding')
-        passage_text_field = self.config.get('passage_text_field', 'passage_text')
-        passage_chunk_field = self.config.get('passage_chunk_field', 'passage_chunk')
+        embedding_field = self.config.get("embedding_field", "passage_embedding")
+        passage_text_field = self.config.get("passage_text_field", "passage_text")
+        passage_chunk_field = self.config.get("passage_chunk_field", "passage_chunk")
 
         try:
             # Execute the KNN search query using the correct field name
@@ -279,18 +318,15 @@ def search_by_vector(self, vector: list, k: int = 5) -> list:
                             "path": embedding_field,
                             "query": {
                                 "knn": {
-                                    f"{embedding_field}.knn": {
-                                        "vector": vector,
-                                        "k": k
-                                    }
+                                    f"{embedding_field}.knn": {"vector": vector, "k": k}
                                 }
-                            }
+                            },
                         }
-                    }
-                }
+                    },
+                },
             )
-            return response['hits']['hits']
+            return response["hits"]["hits"]
         except Exception as e:
             # Handle search errors
             print(f"Error during search: {e}")
-            return []
\ No newline at end of file
+            return []
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
index 1a899785..b6fd242d 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/query.py
@@ -6,16 +6,19 @@
 # GitHub history for details.
 
 import json
-from colorama import Fore, Style, init
 from typing import List
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import OpenSearchConnector
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.embedding_client import EmbeddingClient
-import requests
-import os
-import urllib3
+
 import boto3
-import time
 import tiktoken
+import urllib3
+from colorama import Fore, Style, init
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.embedding_client import (
+    EmbeddingClient,
+)
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import (
+    OpenSearchConnector,
+)
 
 # Disable insecure request warnings
 urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
@@ -38,24 +41,32 @@ def __init__(self, config):
         """
         # Store the configuration
         self.config = config
-        self.index_name = config.get('index_name')
+        self.index_name = config.get("index_name")
         self.opensearch = OpenSearchConnector(config)
-        self.embedding_model_id = config.get('embedding_model_id')
-        self.llm_model_id = config.get('llm_model_id')  # Get the LLM model ID from config
-        self.aws_region = config.get('region')
+        self.embedding_model_id = config.get("embedding_model_id")
+        self.llm_model_id = config.get(
+            "llm_model_id"
+        )  # Get the LLM model ID from config
+        self.aws_region = config.get("region")
         self.bedrock_client = None
-        self.embedding_client = None  # Will be initialized after OpenSearch client is ready
+        self.embedding_client = (
+            None  # Will be initialized after OpenSearch client is ready
+        )
 
         # Load LLM configurations from config
         self.llm_config = {
-            "maxTokenCount": int(config.get('llm_max_token_count', '1000')),
-            "temperature": float(config.get('llm_temperature', '0.7')),
-            "topP": float(config.get('llm_top_p', '0.9')),
-            "stopSequences": [s.strip() for s in config.get('llm_stop_sequences', '').split(',') if s.strip()]
+            "maxTokenCount": int(config.get("llm_max_token_count", "1000")),
+            "temperature": float(config.get("llm_temperature", "0.7")),
+            "topP": float(config.get("llm_top_p", "0.9")),
+            "stopSequences": [
+                s.strip()
+                for s in config.get("llm_stop_sequences", "").split(",")
+                if s.strip()
+            ],
         }
 
         # Set the default search method
-        self.default_search_method = self.config.get('default_search_method', 'neural')
+        self.default_search_method = self.config.get("default_search_method", "neural")
 
         # Initialize clients
         if not self.initialize_clients():
@@ -82,15 +93,21 @@ def initialize_clients(self) -> bool:
                 print("Embedding model ID is not set. Please run setup first.")
                 return False
 
-            self.embedding_client = EmbeddingClient(self.opensearch.opensearch_client, self.embedding_model_id)
+            self.embedding_client = EmbeddingClient(
+                self.opensearch.opensearch_client, self.embedding_model_id
+            )
 
             # Initialize Bedrock client only if LLM model ID is provided
             if self.llm_model_id:
                 try:
-                    self.bedrock_client = boto3.client('bedrock-runtime', region_name=self.aws_region)
+                    self.bedrock_client = boto3.client(
+                        "bedrock-runtime", region_name=self.aws_region
+                    )
                     print("Bedrock client initialized successfully.")
                 except Exception as e:
-                    print(f"{Fore.RED}Failed to initialize Bedrock client: {e}{Style.RESET_ALL}")
+                    print(
+                        f"{Fore.RED}Failed to initialize Bedrock client: {e}{Style.RESET_ALL}"
+                    )
                     return False
             return True
         else:
@@ -106,12 +123,15 @@ def extract_relevant_sentences(self, query: str, text: str) -> List[str]:
         :return: A list of relevant sentences.
         """
         # Lowercase and remove punctuation from query
-        query_processed = ''.join(c.lower() if c.isalnum() or c.isspace() else ' ' for c in query)
+        query_processed = "".join(
+            c.lower() if c.isalnum() or c.isspace() else " " for c in query
+        )
         query_words = set(query_processed.split())
 
         # Split text into sentences based on punctuation and newlines
         import re
-        sentences = re.split(r'[\n.!?]+', text)
+
+        sentences = re.split(r"[\n.!?]+", text)
 
         sentence_scores = []
         for sentence in sentences:
@@ -119,7 +139,9 @@ def extract_relevant_sentences(self, query: str, text: str) -> List[str]:
             if not sentence:
                 continue
             # Lowercase and remove punctuation from sentence
-            sentence_processed = ''.join(c.lower() if c.isalnum() or c.isspace() else ' ' for c in sentence)
+            sentence_processed = "".join(
+                c.lower() if c.isalnum() or c.isspace() else " " for c in sentence
+            )
             sentence_words = set(sentence_processed.split())
             common_words = query_words.intersection(sentence_words)
             score = len(common_words) / (len(query_words) + 1e-6)  # Normalized score
@@ -150,31 +172,30 @@ def bulk_query_neural(self, queries: List[str], k: int = 5) -> List[dict]:
                     # Collect the content from the retrieved documents
                     documents = []
                     for hit in hits:
-                        source = hit['_source']
-                        document = {
-                            'score': hit['_score'],
-                            'source': source
-                        }
+                        source = hit["_source"]
+                        document = {"score": hit["_score"], "source": source}
                         documents.append(document)
                     num_results = len(hits)
                 else:
                     documents = []
                     num_results = 0
-                    print(f"{Fore.YELLOW}Warning: No hits found for query '{query_text}'.{Style.RESET_ALL}")
-
-                results.append({
-                    'query': query_text,
-                    'documents': documents,
-                    'num_results': num_results
-                })
+                    print(
+                        f"{Fore.YELLOW}Warning: No hits found for query '{query_text}'.{Style.RESET_ALL}"
+                    )
+
+                results.append(
+                    {
+                        "query": query_text,
+                        "documents": documents,
+                        "num_results": num_results,
+                    }
+                )
             except Exception as ex:
                 # Handle search errors
-                print(f"{Fore.RED}Error performing search for query '{query_text}': {str(ex)}{Style.RESET_ALL}")
-                results.append({
-                    'query': query_text,
-                    'documents': [],
-                    'num_results': 0
-                })
+                print(
+                    f"{Fore.RED}Error performing search for query '{query_text}': {str(ex)}{Style.RESET_ALL}"
+                )
+                results.append({"query": query_text, "documents": [], "num_results": 0})
 
         return results
 
@@ -194,42 +215,39 @@ def bulk_query_semantic(self, queries: List[str], k: int = 5) -> List[dict]:
             if embedding:
                 query_vectors.append(embedding)
             else:
-                print(f"{Fore.RED}Failed to generate embedding for query: {query}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Failed to generate embedding for query: {query}{Style.RESET_ALL}"
+                )
                 query_vectors.append(None)
 
         results = []
         for i, vector in enumerate(query_vectors):
             if vector is None:
                 # Handle cases where embedding generation failed
-                results.append({
-                    'query': queries[i],
-                    'context': "",
-                    'num_results': 0
-                })
+                results.append({"query": queries[i], "context": "", "num_results": 0})
                 continue
             try:
                 # Perform vector-based search
                 hits = self.opensearch.search_by_vector(vector, k)
                 # Concatenate the retrieved passages as context
-                context = '\n'.join(
-                    [chunk for hit in hits for chunk in hit['_source'].get('passage_chunk', [])]
+                context = "\n".join(
+                    [
+                        chunk
+                        for hit in hits
+                        for chunk in hit["_source"].get("passage_chunk", [])
+                    ]
+                )
+                results.append(
+                    {"query": queries[i], "context": context, "num_results": len(hits)}
                 )
-                results.append({
-                    'query': queries[i],
-                    'context': context,
-                    'num_results': len(hits)
-                })
             except Exception as ex:
                 # Handle search errors
-                print(f"{Fore.RED}Error performing search for query '{queries[i]}': {ex}{Style.RESET_ALL}")
-                results.append({
-                    'query': queries[i],
-                    'context': "",
-                    'num_results': 0
-                })
+                print(
+                    f"{Fore.RED}Error performing search for query '{queries[i]}': {ex}{Style.RESET_ALL}"
+                )
+                results.append({"query": queries[i], "context": "", "num_results": 0})
         return results
 
-
     def generate_answer(self, prompt: str, llm_config: dict) -> str:
         """
         Generate an answer using the configured Large Language Model (LLM).
@@ -240,7 +258,7 @@ def generate_answer(self, prompt: str, llm_config: dict) -> str:
         """
         try:
             max_input_tokens = 8192  # Max tokens for the model
-            expected_output_tokens = llm_config.get('maxTokenCount', 1000)
+            expected_output_tokens = llm_config.get("maxTokenCount", 1000)
             # Adjust the encoding based on the model
             encoding = tiktoken.get_encoding("cl100k_base")  # Use appropriate encoding
 
@@ -252,30 +270,33 @@ def generate_answer(self, prompt: str, llm_config: dict) -> str:
                 # Truncate the prompt to fit within the model's token limit
                 prompt_tokens = prompt_tokens[:allowable_input_tokens]
                 prompt = encoding.decode(prompt_tokens)
-                print(f"{Fore.YELLOW}Prompt truncated to {allowable_input_tokens} tokens.{Style.RESET_ALL}")
+                print(
+                    f"{Fore.YELLOW}Prompt truncated to {allowable_input_tokens} tokens.{Style.RESET_ALL}"
+                )
 
             # Simplified LLM config with only supported parameters
             llm_config_simplified = {
-                'maxTokenCount': expected_output_tokens,
-                'temperature': llm_config.get('temperature', 0.7),
-                'topP': llm_config.get('topP', 1.0),
-                'stopSequences': llm_config.get('stopSequences', [])
+                "maxTokenCount": expected_output_tokens,
+                "temperature": llm_config.get("temperature", 0.7),
+                "topP": llm_config.get("topP", 1.0),
+                "stopSequences": llm_config.get("stopSequences", []),
             }
 
             # Prepare the body for the LLM inference request
-            body = json.dumps({
-                'inputText': prompt,
-                'textGenerationConfig': llm_config_simplified
-            })
+            body = json.dumps(
+                {"inputText": prompt, "textGenerationConfig": llm_config_simplified}
+            )
 
             # Invoke the LLM model using Bedrock client
-            response = self.bedrock_client.invoke_model(modelId=self.llm_model_id, body=body)
-            response_body = json.loads(response['body'].read())
-            results = response_body.get('results', [])
+            response = self.bedrock_client.invoke_model(
+                modelId=self.llm_model_id, body=body
+            )
+            response_body = json.loads(response["body"].read())
+            results = response_body.get("results", [])
             if not results:
                 print(f"{Fore.YELLOW}No results returned from LLM.{Style.RESET_ALL}")
                 return None
-            answer = results[0].get('outputText', '').strip()
+            answer = results[0].get("outputText", "").strip()
             return answer
         except Exception as ex:
             # Handle errors during answer generation
@@ -298,42 +319,50 @@ def query_command(self, queries: List[str], num_results: int = 5):
         while True:
             if not queries:
                 # Prompt the user for a new query
-                query_text = input("\nEnter a query (or type 'exit' to finish): ").strip()
-                if not query_text or query_text.lower() == 'exit':
+                query_text = input(
+                    "\nEnter a query (or type 'exit' to finish): "
+                ).strip()
+                if not query_text or query_text.lower() == "exit":
                     print("\nExiting query session.")
                     break
                 queries = [query_text]
 
-            if search_method == 'semantic_no_llm':
+            if search_method == "semantic_no_llm":
                 # Proceed with neural search
                 results = self.bulk_query_neural(queries, k=num_results)
 
                 for result in results:
                     print(f"\nQuery: {result['query']}")
-                    if result['documents']:
+                    if result["documents"]:
                         all_relevant_sentences = []
-                        for doc in result['documents']:
-                            passage_chunks = doc['source'].get('passage_chunk', [])
+                        for doc in result["documents"]:
+                            passage_chunks = doc["source"].get("passage_chunk", [])
                             if not passage_chunks:
                                 continue
                             for passage in passage_chunks:
                                 # Extract relevant sentences from each passage
-                                relevant_sentences = self.extract_relevant_sentences(result['query'], passage)
+                                relevant_sentences = self.extract_relevant_sentences(
+                                    result["query"], passage
+                                )
                                 all_relevant_sentences.extend(relevant_sentences)
 
                         if all_relevant_sentences:
                             # Output the top relevant sentences
                             print("\nAnswer:")
-                            for sentence in all_relevant_sentences[:1]:  # Display the top sentence
+                            for sentence in all_relevant_sentences[
+                                :1
+                            ]:  # Display the top sentence
                                 print(sentence)
                         else:
                             print("\nNo relevant sentences found.")
                     else:
                         print("\nNo documents found for this query.")
-            elif search_method == 'semantic_with_llm':
+            elif search_method == "semantic_with_llm":
                 # Proceed with semantic search
                 if not self.bedrock_client or not self.llm_model_id:
-                    print(f"\n{Fore.RED}LLM model is not configured. Please run setup to select an LLM model.{Style.RESET_ALL}")
+                    print(
+                        f"\n{Fore.RED}LLM model is not configured. Please run setup to select an LLM model.{Style.RESET_ALL}"
+                    )
                     return
 
                 # Use the LLM configurations from setup
@@ -345,8 +374,10 @@ def query_command(self, queries: List[str], num_results: int = 5):
                 for result in results:
                     print(f"\nQuery: {result['query']}")
 
-                    if not result['context']:
-                        print(f"\n{Fore.RED}No context available for this query.{Style.RESET_ALL}")
+                    if not result["context"]:
+                        print(
+                            f"\n{Fore.RED}No context available for this query.{Style.RESET_ALL}"
+                        )
                         continue
 
                     # Prepare the augmented prompt with context
@@ -369,4 +400,4 @@ def query_command(self, queries: List[str], num_results: int = 5):
                         print("\nFailed to generate an answer.")
 
             # After processing, reset queries to allow for the next input
-            queries = []
\ No newline at end of file
+            queries = []
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
index 35b7fb2b..c13df93e 100755
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag.py
@@ -1,4 +1,4 @@
-#!/usr/bin/env python3  # SPDX-License-Identifier: Apache-2.0
+# SPDX-License-Identifier: Apache-2.0
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
@@ -12,12 +12,14 @@
 import argparse
 import configparser
 import sys
+
 from colorama import Fore, Style, init
 from rich.console import Console
 from rich.prompt import Prompt
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.rag_setup import Setup
+
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest import Ingest
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.query import Query
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.rag_setup import Setup
 
 # Initialize colorama for colored terminal output
 init(autoreset=True)
@@ -26,7 +28,7 @@
 console = Console()
 
 # Configuration file name
-CONFIG_FILE = 'config.ini'
+CONFIG_FILE = "config.ini"
 
 
 def load_config() -> dict:
@@ -37,10 +39,12 @@ def load_config() -> dict:
     """
     config = configparser.ConfigParser()
     config.read(CONFIG_FILE)
-    if 'DEFAULT' not in config:
-        console.print(f"[{Fore.RED}ERROR{Style.RESET_ALL}] 'DEFAULT' section missing in {CONFIG_FILE}. Please run the setup command first.")
+    if "DEFAULT" not in config:
+        console.print(
+            f"[{Fore.RED}ERROR{Style.RESET_ALL}] 'DEFAULT' section missing in {CONFIG_FILE}. Please run the setup command first."
+        )
         sys.exit(1)
-    return config['DEFAULT']
+    return config["DEFAULT"]
 
 
 def save_config(config: dict):
@@ -50,13 +54,17 @@ def save_config(config: dict):
     :param config: Dictionary of configuration parameters.
     """
     parser = configparser.ConfigParser()
-    parser['DEFAULT'] = config
+    parser["DEFAULT"] = config
     try:
-        with open(CONFIG_FILE, 'w') as f:
+        with open(CONFIG_FILE, "w") as f:
             parser.write(f)
-        console.print(f"[{Fore.GREEN}SUCCESS{Style.RESET_ALL}] Configuration saved to {CONFIG_FILE}.")
+        console.print(
+            f"[{Fore.GREEN}SUCCESS{Style.RESET_ALL}] Configuration saved to {CONFIG_FILE}."
+        )
     except Exception as e:
-        console.print(f"[{Fore.RED}ERROR{Style.RESET_ALL}] Failed to save configuration: {e}")
+        console.print(
+            f"[{Fore.RED}ERROR{Style.RESET_ALL}] Failed to save configuration: {e}"
+        )
 
 
 def main():
@@ -80,42 +88,33 @@ def main():
 
 Execute queries with a specified number of results:
   rag query --queries "What is OpenSearch?" --num_results 3
-"""
+""",
     )
     subparsers = parser.add_subparsers(title="Available Commands", dest="command")
 
     # Setup command
-    setup_parser = subparsers.add_parser(
-        'setup',
-        help='Initialize and configure the RAG pipeline.'
-    )
+    subparsers.add_parser("setup", help="Initialize and configure the RAG pipeline.")
 
     # Ingest command
     ingest_parser = subparsers.add_parser(
-        'ingest',
-        help='Ingest documents into OpenSearch.'
+        "ingest", help="Ingest documents into OpenSearch."
     )
     ingest_parser.add_argument(
-        '--paths',
-        nargs='+',
-        help='Paths to files or directories for ingestion.'
+        "--paths", nargs="+", help="Paths to files or directories for ingestion."
     )
 
     # Query command
     query_parser = subparsers.add_parser(
-        'query',
-        help='Execute queries and generate answers.'
+        "query", help="Execute queries and generate answers."
     )
     query_parser.add_argument(
-        '--queries',
-        nargs='+',
-        help='Query texts for search and answer generation.'
+        "--queries", nargs="+", help="Query texts for search and answer generation."
     )
     query_parser.add_argument(
-        '--num_results',
+        "--num_results",
         type=int,
         default=5,
-        help='Number of top results to retrieve for each query. (default: 5)'
+        help="Number of top results to retrieve for each query. (default: 5)",
     )
 
     # Parse arguments
@@ -124,52 +123,66 @@ def main():
     # Only display the banner if no command is executed
     if not args.command:
         console.print("[bold cyan]Welcome to the RAG Pipeline[/bold cyan]")
-        console.print("Use [bold blue]rag setup[/bold blue], [bold blue]rag ingest[/bold blue], or [bold blue]rag query[/bold blue] to begin.\n")
+        console.print(
+            "Use [bold blue]rag setup[/bold blue], [bold blue]rag ingest[/bold blue], or [bold blue]rag query[/bold blue] to begin.\n"
+        )
 
     # Load existing configuration if not running setup
-    if args.command != 'setup' and args.command:
+    if args.command != "setup" and args.command:
         config = load_config()
     else:
         config = None  # Setup may create the config
 
     # Handle commands
-    if args.command == 'setup':
+    if args.command == "setup":
         # Run setup process
         setup = Setup()
         console.print("[bold blue]Starting setup process...[/bold blue]")
         setup.setup_command()
         save_config(setup.config)
-    elif args.command == 'ingest':
+    elif args.command == "ingest":
         # Handle ingestion command
         if not args.paths:
             # If no paths provided as arguments, prompt user for input
             paths = []
             while True:
-                path = Prompt.ask("Enter a file or directory path (or press Enter to finish)", default="", show_default=False)
+                path = Prompt.ask(
+                    "Enter a file or directory path (or press Enter to finish)",
+                    default="",
+                    show_default=False,
+                )
                 if not path:
                     break
                 paths.append(path)
         else:
             paths = args.paths
         if not paths:
-            console.print(f"[{Fore.RED}ERROR{Style.RESET_ALL}] No paths provided for ingestion. Aborting.")
+            console.print(
+                f"[{Fore.RED}ERROR{Style.RESET_ALL}] No paths provided for ingestion. Aborting."
+            )
             sys.exit(1)
         ingest = Ingest(config)
         ingest.ingest_command(paths)
-    elif args.command == 'query':
+    elif args.command == "query":
         # Handle query command
         if not args.queries:
             # If no queries provided as arguments, prompt user for input
             queries = []
             while True:
-                query = Prompt.ask("Enter a query (or press Enter to finish)", default="", show_default=False)
+                query = Prompt.ask(
+                    "Enter a query (or press Enter to finish)",
+                    default="",
+                    show_default=False,
+                )
                 if not query:
                     break
                 queries.append(query)
         else:
             queries = args.queries
         if not queries:
-            console.print(f"[{Fore.RED}ERROR{Style.RESET_ALL}] No queries provided. Aborting.")
+            console.print(
+                f"[{Fore.RED}ERROR{Style.RESET_ALL}] No queries provided. Aborting."
+            )
             sys.exit(1)
         query = Query(config)
         query.query_command(queries, num_results=args.num_results)
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index d499ff64..906abdf1 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -5,24 +5,24 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-import boto3
-import botocore
-from botocore.config import Config
 import configparser
-import subprocess
 import os
-import json
-import time
+import subprocess
+import sys
 import termios
+import time
 import tty
-import sys
 from urllib.parse import urlparse
-from opensearchpy import OpenSearch, RequestsHttpConnection, AWSV4SignerAuth
+
+import boto3
+from botocore.config import Config
 from colorama import Fore, Style, init
+from opensearchpy import OpenSearch, RequestsHttpConnection
 
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import OpenSearchConnector
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import AIConnectorHelper
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register import ModelRegister
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import (
+    OpenSearchConnector,
+)
 
 # Initialize colorama for colored terminal output
 init(autoreset=True)
@@ -34,9 +34,9 @@ class Setup:
     Manages AWS credentials (if managed), OpenSearch client initialization, index creation,
     and model registration.
     """
-    
-    CONFIG_FILE = 'config.ini'
-    SERVICE_BEDROCK = 'bedrock-runtime'
+
+    CONFIG_FILE = "config.ini"
+    SERVICE_BEDROCK = "bedrock-runtime"
 
     def __init__(self):
         """
@@ -44,13 +44,13 @@ def __init__(self):
         """
         # Load existing configuration
         self.config = self.load_config()
-        self.aws_region = self.config.get('region', 'us-west-2')
-        self.iam_principal = self.config.get('iam_principal', '')
-        self.collection_name = self.config.get('collection_name', '')
-        self.opensearch_endpoint = self.config.get('opensearch_endpoint', '')
-        self.service_type = self.config.get('service_type', 'managed')
-        self.opensearch_username = self.config.get('opensearch_username', '')
-        self.opensearch_password = self.config.get('opensearch_password', '')
+        self.aws_region = self.config.get("region", "us-west-2")
+        self.iam_principal = self.config.get("iam_principal", "")
+        self.collection_name = self.config.get("collection_name", "")
+        self.opensearch_endpoint = self.config.get("opensearch_endpoint", "")
+        self.service_type = self.config.get("service_type", "managed")
+        self.opensearch_username = self.config.get("opensearch_username", "")
+        self.opensearch_password = self.config.get("opensearch_password", "")
         self.bedrock_client = None
         self.opensearch_client = None
         self.opensearch_domain_name = self.get_opensearch_domain_name()
@@ -65,15 +65,19 @@ def check_and_configure_aws(self):
             credentials = session.get_credentials()
 
             if credentials is None:
-                print(f"{Fore.YELLOW}AWS credentials are not configured.{Style.RESET_ALL}")
+                print(
+                    f"{Fore.YELLOW}AWS credentials are not configured.{Style.RESET_ALL}"
+                )
                 self.configure_aws()
             else:
                 print("AWS credentials are already configured.")
                 reconfigure = input("Do you want to reconfigure? (yes/no): ").lower()
-                if reconfigure == 'yes':
+                if reconfigure == "yes":
                     self.configure_aws()
         except Exception as e:
-            print(f"{Fore.RED}An error occurred while checking AWS credentials: {e}{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}An error occurred while checking AWS credentials: {e}{Style.RESET_ALL}"
+            )
             self.configure_aws()
 
     def configure_aws(self):
@@ -83,29 +87,43 @@ def configure_aws(self):
         print("Let's configure your AWS credentials.")
 
         aws_access_key_id = input("Enter your AWS Access Key ID: ").strip()
-        aws_secret_access_key = self.get_password_with_asterisks("Enter your AWS Secret Access Key: ")
-        aws_region_input = input(f"Enter your preferred AWS region [{self.aws_region}]: ").strip() or self.aws_region
+        aws_secret_access_key = self.get_password_with_asterisks(
+            "Enter your AWS Secret Access Key: "
+        )
+        aws_region_input = (
+            input(f"Enter your preferred AWS region [{self.aws_region}]: ").strip()
+            or self.aws_region
+        )
 
         try:
             # Configure AWS credentials using subprocess to call AWS CLI
-            subprocess.run([
-                'aws', 'configure', 'set', 
-                'aws_access_key_id', aws_access_key_id
-            ], check=True)
-            
-            subprocess.run([
-                'aws', 'configure', 'set', 
-                'aws_secret_access_key', aws_secret_access_key
-            ], check=True)
-            
-            subprocess.run([
-                'aws', 'configure', 'set', 
-                'region', aws_region_input
-            ], check=True)
-            
-            print(f"{Fore.GREEN}AWS credentials have been successfully configured.{Style.RESET_ALL}")
+            subprocess.run(
+                ["aws", "configure", "set", "aws_access_key_id", aws_access_key_id],
+                check=True,
+            )
+
+            subprocess.run(
+                [
+                    "aws",
+                    "configure",
+                    "set",
+                    "aws_secret_access_key",
+                    aws_secret_access_key,
+                ],
+                check=True,
+            )
+
+            subprocess.run(
+                ["aws", "configure", "set", "region", aws_region_input], check=True
+            )
+
+            print(
+                f"{Fore.GREEN}AWS credentials have been successfully configured.{Style.RESET_ALL}"
+            )
         except subprocess.CalledProcessError as e:
-            print(f"{Fore.RED}An error occurred while configuring AWS credentials: {e}{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}An error occurred while configuring AWS credentials: {e}{Style.RESET_ALL}"
+            )
         except Exception as e:
             print(f"{Fore.RED}An unexpected error occurred: {e}{Style.RESET_ALL}")
 
@@ -116,32 +134,33 @@ def load_config(self) -> dict:
         config = configparser.ConfigParser()
         if os.path.exists(self.CONFIG_FILE):
             config.read(self.CONFIG_FILE)
-            return dict(config['DEFAULT'])
+            return dict(config["DEFAULT"])
         return {}
 
     def get_password_with_asterisks(self, prompt="Enter password: ") -> str:
         """
         Get password input from user, masking it with asterisks.
         """
-        if sys.platform == 'win32':
+        if sys.platform == "win32":
             import msvcrt
-            print(prompt, end='', flush=True)
+
+            print(prompt, end="", flush=True)
             password = ""
             while True:
                 key = msvcrt.getch()
-                if key == b'\r':  # Enter key
-                    sys.stdout.write('\n')
+                if key == b"\r":  # Enter key
+                    sys.stdout.write("\n")
                     return password
-                elif key == b'\x08':  # Backspace key
+                elif key == b"\x08":  # Backspace key
                     if len(password) > 0:
                         password = password[:-1]
-                        sys.stdout.write('\b \b')  # Erase the last asterisk
+                        sys.stdout.write("\b \b")  # Erase the last asterisk
                         sys.stdout.flush()
                 else:
                     try:
-                        char = key.decode('utf-8')
+                        char = key.decode("utf-8")
                         password += char
-                        sys.stdout.write('*')  # Mask input with '*'
+                        sys.stdout.write("*")  # Mask input with '*'
                         sys.stdout.flush()
                     except UnicodeDecodeError:
                         continue
@@ -155,17 +174,17 @@ def get_password_with_asterisks(self, prompt="Enter password: ") -> str:
                 password = ""
                 while True:
                     ch = sys.stdin.read(1)
-                    if ch in ('\r', '\n'):  # Enter key
-                        sys.stdout.write('\n')
+                    if ch in ("\r", "\n"):  # Enter key
+                        sys.stdout.write("\n")
                         return password
-                    elif ch == '\x7f':  # Backspace key
+                    elif ch == "\x7f":  # Backspace key
                         if len(password) > 0:
                             password = password[:-1]
-                            sys.stdout.write('\b \b')  # Erase the last asterisk
+                            sys.stdout.write("\b \b")  # Erase the last asterisk
                             sys.stdout.flush()
                     else:
                         password += ch
-                        sys.stdout.write('*')  # Mask input with '*'
+                        sys.stdout.write("*")  # Mask input with '*'
                         sys.stdout.flush()
             finally:
                 termios.tcsetattr(fd, termios.TCSADRAIN, old_settings)
@@ -174,7 +193,7 @@ def setup_configuration(self):
         """
         Set up the configuration by prompting the user for various settings.
         """
-        config = self.load_config()
+        self.load_config()
 
         # Prompt for service type
         print("\nChoose OpenSearch service type:")
@@ -182,49 +201,82 @@ def setup_configuration(self):
         print("2. Open-source")
         service_choice = input("Enter your choice (1-2): ").strip()
 
-        if service_choice == '1':
-            self.service_type = 'managed'
-        elif service_choice == '2':
-            self.service_type = 'open-source'
+        if service_choice == "1":
+            self.service_type = "managed"
+        elif service_choice == "2":
+            self.service_type = "open-source"
         else:
-            print(f"\n{Fore.YELLOW}Invalid choice. Defaulting to 'managed'.{Style.RESET_ALL}")
-            self.service_type = 'managed'
+            print(
+                f"\n{Fore.YELLOW}Invalid choice. Defaulting to 'managed'.{Style.RESET_ALL}"
+            )
+            self.service_type = "managed"
 
         # Based on service type, prompt for different configurations
-        if self.service_type == 'managed':
+        if self.service_type == "managed":
             self.check_and_configure_aws()
-            self.aws_region = input(f"\nEnter your AWS Region [{self.aws_region}]: ").strip() or self.aws_region
-            self.iam_principal = input(f"Enter your IAM Principal ARN [{self.iam_principal}]: ").strip() or self.iam_principal
-            self.opensearch_endpoint = input("\nEnter your OpenSearch domain endpoint: ").strip()
+            self.aws_region = (
+                input(f"\nEnter your AWS Region [{self.aws_region}]: ").strip()
+                or self.aws_region
+            )
+            self.iam_principal = (
+                input(f"Enter your IAM Principal ARN [{self.iam_principal}]: ").strip()
+                or self.iam_principal
+            )
+            self.opensearch_endpoint = input(
+                "\nEnter your OpenSearch domain endpoint: "
+            ).strip()
             self.opensearch_username = input("Enter your OpenSearch username: ").strip()
-            self.opensearch_password = self.get_password_with_asterisks("Enter your OpenSearch password: ")
-            self.collection_name = ''
-        elif self.service_type == 'open-source':
+            self.opensearch_password = self.get_password_with_asterisks(
+                "Enter your OpenSearch password: "
+            )
+            self.collection_name = ""
+        elif self.service_type == "open-source":
             # For open-source, skip AWS configurations
             print("\n--- Open-source OpenSearch Setup ---")
-            default_endpoint = 'https://localhost:9200'
-            self.opensearch_endpoint = input(f"\nPress Enter to use the default endpoint (or type your custom endpoint) [{default_endpoint}]: ").strip() or default_endpoint
-            auth_required = input("Does your OpenSearch instance require authentication? (yes/no): ").strip().lower()
-            if auth_required == 'yes':
-                self.opensearch_username = input("Enter your OpenSearch username: ").strip()
-                self.opensearch_password = self.get_password_with_asterisks("Enter your OpenSearch password: ")
+            default_endpoint = "https://localhost:9200"
+            self.opensearch_endpoint = (
+                input(
+                    f"\nPress Enter to use the default endpoint (or type your custom endpoint) [{default_endpoint}]: "
+                ).strip()
+                or default_endpoint
+            )
+            auth_required = (
+                input(
+                    "Does your OpenSearch instance require authentication? (yes/no): "
+                )
+                .strip()
+                .lower()
+            )
+            if auth_required == "yes":
+                self.opensearch_username = input(
+                    "Enter your OpenSearch username: "
+                ).strip()
+                self.opensearch_password = self.get_password_with_asterisks(
+                    "Enter your OpenSearch password: "
+                )
             else:
                 self.opensearch_username = None
                 self.opensearch_password = None
-            self.collection_name = ''
+            self.collection_name = ""
             # AWS region and IAM principal not needed
-            self.aws_region = ''
-            self.iam_principal = ''
+            self.aws_region = ""
+            self.iam_principal = ""
 
         # Update configuration dictionary
         self.config = {
-            'service_type': self.service_type,
-            'region': self.aws_region,
-            'iam_principal': self.iam_principal,
-            'collection_name': self.collection_name if self.collection_name else '',
-            'opensearch_endpoint': self.opensearch_endpoint if self.opensearch_endpoint else '',
-            'opensearch_username': self.opensearch_username if self.opensearch_username else '',
-            'opensearch_password': self.opensearch_password if self.opensearch_password else ''
+            "service_type": self.service_type,
+            "region": self.aws_region,
+            "iam_principal": self.iam_principal,
+            "collection_name": self.collection_name if self.collection_name else "",
+            "opensearch_endpoint": (
+                self.opensearch_endpoint if self.opensearch_endpoint else ""
+            ),
+            "opensearch_username": (
+                self.opensearch_username if self.opensearch_username else ""
+            ),
+            "opensearch_password": (
+                self.opensearch_password if self.opensearch_password else ""
+            ),
         }
 
         # Now, prompt for default search method
@@ -234,44 +286,58 @@ def setup_configuration(self):
         print("2. Semantic search WITHOUT LLM")
         search_choice = input("Enter your choice (1-2): ").strip()
 
-        if search_choice == '1':
-            default_search_method = 'semantic_with_llm'
+        if search_choice == "1":
+            default_search_method = "semantic_with_llm"
         else:
-            default_search_method = 'semantic_no_llm'
+            default_search_method = "semantic_no_llm"
 
-        self.config['default_search_method'] = default_search_method
+        self.config["default_search_method"] = default_search_method
 
         # If semantic with LLM chosen and we are in managed mode, prompt for LLM configuration
-        if default_search_method == 'semantic_with_llm' and self.service_type == 'managed':
+        if (
+            default_search_method == "semantic_with_llm"
+            and self.service_type == "managed"
+        ):
             print("\nSelect an LLM model for semantic search:")
             available_models = [
                 ("amazon.titan-text-lite-v1", "Bedrock Titan Text Lite V1"),
                 ("amazon.titan-text-express-v1", "Bedrock Titan Text Express V1"),
-                ("anthropic.claude-3-5-sonnet-20240620-v1:0", "Anthropic Claude 3.5 Sonnet"),
+                (
+                    "anthropic.claude-3-5-sonnet-20240620-v1:0",
+                    "Anthropic Claude 3.5 Sonnet",
+                ),
                 ("anthropic.claude-3-opus-20240229-v1:0", "Anthropic Claude 3 Opus"),
                 ("cohere.command-r-plus-v1:0", "Cohere Command R Plus V1"),
-                ("cohere.command-r-v1:0", "Cohere Command R V1")
+                ("cohere.command-r-v1:0", "Cohere Command R V1"),
             ]
             for idx, (model_id, model_name) in enumerate(available_models, start=1):
                 print(f"{idx}. {model_name} ({model_id})")
-            model_choice = input(f"\nEnter the number of your chosen model (1-{len(available_models)}): ").strip()
+            model_choice = input(
+                f"\nEnter the number of your chosen model (1-{len(available_models)}): "
+            ).strip()
             try:
                 model_choice_idx = int(model_choice) - 1
                 if 0 <= model_choice_idx < len(available_models):
                     selected_model_id = available_models[model_choice_idx][0]
-                    self.config['llm_model_id'] = selected_model_id
+                    self.config["llm_model_id"] = selected_model_id
                     print(f"\nSelected LLM Model ID: {selected_model_id}")
                 else:
-                    print(f"\n{Fore.YELLOW}Invalid choice. Defaulting to '{available_models[0][0]}'.{Style.RESET_ALL}")
-                    self.config['llm_model_id'] = available_models[0][0]
+                    print(
+                        f"\n{Fore.YELLOW}Invalid choice. Defaulting to '{available_models[0][0]}'.{Style.RESET_ALL}"
+                    )
+                    self.config["llm_model_id"] = available_models[0][0]
             except ValueError:
-                print(f"\n{Fore.YELLOW}Invalid input. Defaulting to '{available_models[0][0]}'.{Style.RESET_ALL}")
-                self.config['llm_model_id'] = available_models[0][0]
+                print(
+                    f"\n{Fore.YELLOW}Invalid input. Defaulting to '{available_models[0][0]}'.{Style.RESET_ALL}"
+                )
+                self.config["llm_model_id"] = available_models[0][0]
 
             # Prompt for LLM configurations
             print("\nConfigure LLM settings:")
             try:
-                maxTokenCount = int(input("Enter max token count [1000]: ").strip() or "1000")
+                maxTokenCount = int(
+                    input("Enter max token count [1000]: ").strip() or "1000"
+                )
             except ValueError:
                 maxTokenCount = 1000
             try:
@@ -282,57 +348,69 @@ def setup_configuration(self):
                 topP = float(input("Enter topP [0.9]: ").strip() or "0.9")
             except ValueError:
                 topP = 0.9
-            stopSequences_input = input("Enter stop sequences (comma-separated) or press Enter for none: ").strip()
+            stopSequences_input = input(
+                "Enter stop sequences (comma-separated) or press Enter for none: "
+            ).strip()
             if stopSequences_input:
-                stopSequences = [s.strip() for s in stopSequences_input.split(',')]
+                stopSequences = [s.strip() for s in stopSequences_input.split(",")]
             else:
                 stopSequences = []
 
             # Save LLM configurations to config
-            self.config['llm_max_token_count'] = str(maxTokenCount)
-            self.config['llm_temperature'] = str(temperature)
-            self.config['llm_top_p'] = str(topP)
-            self.config['llm_stop_sequences'] = ','.join(stopSequences)
+            self.config["llm_max_token_count"] = str(maxTokenCount)
+            self.config["llm_temperature"] = str(temperature)
+            self.config["llm_top_p"] = str(topP)
+            self.config["llm_stop_sequences"] = ",".join(stopSequences)
         else:
             # No LLM configurations needed
-            self.config['llm_model_id'] = ''
-            self.config['llm_max_token_count'] = ''
-            self.config['llm_temperature'] = ''
-            self.config['llm_top_p'] = ''
-            self.config['llm_stop_sequences'] = ''
+            self.config["llm_model_id"] = ""
+            self.config["llm_max_token_count"] = ""
+            self.config["llm_temperature"] = ""
+            self.config["llm_top_p"] = ""
+            self.config["llm_stop_sequences"] = ""
 
         # Prompt for ingest pipeline name
-        default_pipeline_name = 'text-chunking-ingest-pipeline'
-        pipeline_name = input(f"\nEnter the name of the ingest pipeline to use [{default_pipeline_name}]: ").strip()
+        default_pipeline_name = "text-chunking-ingest-pipeline"
+        pipeline_name = input(
+            f"\nEnter the name of the ingest pipeline to use [{default_pipeline_name}]: "
+        ).strip()
         if not pipeline_name:
             pipeline_name = default_pipeline_name
 
         # Save the pipeline name to config
-        self.config['ingest_pipeline_name'] = pipeline_name
+        self.config["ingest_pipeline_name"] = pipeline_name
 
         # Save the configuration
         self.save_config(self.config)
-        print(f"\n{Fore.GREEN}Configuration saved successfully to {os.path.abspath(self.CONFIG_FILE)}.{Style.RESET_ALL}\n")
+        print(
+            f"\n{Fore.GREEN}Configuration saved successfully to {os.path.abspath(self.CONFIG_FILE)}.{Style.RESET_ALL}\n"
+        )
 
     def initialize_clients(self) -> bool:
         """
         Initialize AWS clients (Bedrock) only if managed. No AWS clients needed for open-source.
         """
-        if self.service_type == 'open-source':
+        if self.service_type == "open-source":
             return True  # No AWS clients needed
         # Managed: Initialize Bedrock
         try:
             boto_config = Config(
                 region_name=self.aws_region,
-                signature_version='v4',
-                retries={'max_attempts': 10, 'mode': 'standard'}
+                signature_version="v4",
+                retries={"max_attempts": 10, "mode": "standard"},
+            )
+            self.bedrock_client = boto3.client(
+                self.SERVICE_BEDROCK, region_name=self.aws_region, config=boto_config
             )
-            self.bedrock_client = boto3.client(self.SERVICE_BEDROCK, region_name=self.aws_region, config=boto_config)
             time.sleep(2)
-            print(f"{Fore.GREEN}AWS Bedrock client initialized successfully.{Style.RESET_ALL}\n")
+            print(
+                f"{Fore.GREEN}AWS Bedrock client initialized successfully.{Style.RESET_ALL}\n"
+            )
             return True
         except Exception as e:
-            print(f"{Fore.RED}Failed to initialize AWS Bedrock client: {e}{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Failed to initialize AWS Bedrock client: {e}{Style.RESET_ALL}"
+            )
             return False
 
     def get_opensearch_domain_name(self) -> str:
@@ -343,21 +421,21 @@ def get_opensearch_domain_name(self) -> str:
         """
         if self.opensearch_endpoint:
             parsed_url = urlparse(self.opensearch_endpoint)
-            hostname = parsed_url.hostname  # e.g., 'search-your-domain-name-uniqueid.region.es.amazonaws.com'
+            hostname = (
+                parsed_url.hostname
+            )  # e.g., 'search-your-domain-name-uniqueid.region.es.amazonaws.com'
             if hostname:
                 # Split the hostname into parts
-                parts = hostname.split('.')
+                parts = hostname.split(".")
                 domain_part = parts[0]  # e.g., 'search-your-domain-name-uniqueid'
                 # Remove the 'search-' prefix if present
-                if domain_part.startswith('search-'):
-                    domain_part = domain_part[len('search-'):]
+                if domain_part.startswith("search-"):
+                    domain_part = domain_part[len("search-") :]
                 # Remove the unique ID suffix after the domain name
-                domain_name = domain_part.rsplit('-', 1)[0]
+                domain_name = domain_part.rsplit("-", 1)[0]
                 print(f"Extracted domain name: {domain_name}\n")
                 return domain_name
         return None
-    
-
 
     @staticmethod
     def get_opensearch_domain_info(region: str, domain_name: str) -> tuple:
@@ -365,14 +443,18 @@ def get_opensearch_domain_info(region: str, domain_name: str) -> tuple:
         Retrieve the OpenSearch domain endpoint and ARN for a managed domain.
         """
         try:
-            client = boto3.client('opensearch', region_name=region)
+            client = boto3.client("opensearch", region_name=region)
             response = client.describe_domain(DomainName=domain_name)
-            domain_status = response['DomainStatus']
-            domain_endpoint = domain_status.get('Endpoint') or domain_status.get('Endpoints', {}).get('vpc')
-            domain_arn = domain_status['ARN']
+            domain_status = response["DomainStatus"]
+            domain_endpoint = domain_status.get("Endpoint") or domain_status.get(
+                "Endpoints", {}
+            ).get("vpc")
+            domain_arn = domain_status["ARN"]
             return domain_endpoint, domain_arn
         except Exception as e:
-            print(f"{Fore.RED}Error retrieving OpenSearch domain info: {e}{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Error retrieving OpenSearch domain info: {e}{Style.RESET_ALL}"
+            )
             return None, None
 
     def initialize_opensearch_client(self) -> bool:
@@ -380,20 +462,24 @@ def initialize_opensearch_client(self) -> bool:
         Initialize the OpenSearch client based on the service type and configuration.
         """
         if not self.opensearch_endpoint:
-            print(f"{Fore.RED}OpenSearch endpoint not set. Please run setup first.{Style.RESET_ALL}\n")
+            print(
+                f"{Fore.RED}OpenSearch endpoint not set. Please run setup first.{Style.RESET_ALL}\n"
+            )
             return False
 
         parsed_url = urlparse(self.opensearch_endpoint)
         host = parsed_url.hostname
-        port = parsed_url.port or (443 if parsed_url.scheme == 'https' else 9200) 
+        port = parsed_url.port or (443 if parsed_url.scheme == "https" else 9200)
 
         # Determine auth based on service type
-        if self.service_type == 'managed':
+        if self.service_type == "managed":
             if not self.opensearch_username or not self.opensearch_password:
-                print(f"{Fore.RED}OpenSearch username or password not set. Please run setup first.{Style.RESET_ALL}\n")
+                print(
+                    f"{Fore.RED}OpenSearch username or password not set. Please run setup first.{Style.RESET_ALL}\n"
+                )
                 return False
             auth = (self.opensearch_username, self.opensearch_password)
-        elif self.service_type == 'open-source':
+        elif self.service_type == "open-source":
             if self.opensearch_username and self.opensearch_password:
                 auth = (self.opensearch_username, self.opensearch_password)
             else:
@@ -402,30 +488,36 @@ def initialize_opensearch_client(self) -> bool:
             print("Invalid service type. Please check your configuration.")
             return False
 
-        use_ssl = parsed_url.scheme == 'https'
+        use_ssl = parsed_url.scheme == "https"
         verify_certs = True
 
         try:
             self.opensearch_client = OpenSearch(
-                hosts=[{'host': host, 'port': port}],
+                hosts=[{"host": host, "port": port}],
                 http_auth=auth,
                 use_ssl=use_ssl,
                 verify_certs=verify_certs,
                 ssl_show_warn=False,
                 connection_class=RequestsHttpConnection,
-                pool_maxsize=20
+                pool_maxsize=20,
+            )
+            print(
+                f"{Fore.GREEN}Initialized OpenSearch client with host: {host} and port: {port}{Style.RESET_ALL}\n"
             )
-            print(f"{Fore.GREEN}Initialized OpenSearch client with host: {host} and port: {port}{Style.RESET_ALL}\n")
             return True
         except Exception as ex:
-            print(f"{Fore.RED}Error initializing OpenSearch client: {ex}{Style.RESET_ALL}\n")
+            print(
+                f"{Fore.RED}Error initializing OpenSearch client: {ex}{Style.RESET_ALL}\n"
+            )
             return False
 
     def get_knn_index_details(self) -> tuple:
         """
         Prompt user for KNN index details.
         """
-        dimension_input = input("Press Enter to use the default embedding size (768), or type a custom size: ").strip()
+        dimension_input = input(
+            "Press Enter to use the default embedding size (768), or type a custom size: "
+        ).strip()
         if dimension_input == "":
             embedding_dimension = 768
         else:
@@ -442,7 +534,9 @@ def get_knn_index_details(self) -> tuple:
         print("1. L2 (Euclidean distance)")
         print("2. Cosine similarity")
         print("3. Inner product")
-        space_choice = input("Enter your choice (1-3), or press Enter for default (L2): ").strip()
+        space_choice = input(
+            "Enter your choice (1-3), or press Enter for default (L2): "
+        ).strip()
 
         if space_choice == "" or space_choice == "1":
             space_type = "l2"
@@ -457,7 +551,9 @@ def get_knn_index_details(self) -> tuple:
         print(f"Space type set to: {space_type}")
 
         # Prompt for ef_construction
-        ef_construction_input = input("\nPress Enter to use the default ef_construction value (512), or type a custom value: ").strip()
+        ef_construction_input = input(
+            "\nPress Enter to use the default ef_construction value (512), or type a custom value: "
+        ).strip()
         if ef_construction_input == "":
             ef_construction = 512
         else:
@@ -470,7 +566,9 @@ def get_knn_index_details(self) -> tuple:
         print(f"ef_construction set to: {ef_construction}\n")
 
         # Prompt for number of shards
-        shards_input = input("\nEnter number of shards (Press Enter for default value 1): ").strip()
+        shards_input = input(
+            "\nEnter number of shards (Press Enter for default value 1): "
+        ).strip()
         if shards_input == "":
             number_of_shards = 1
         else:
@@ -482,7 +580,9 @@ def get_knn_index_details(self) -> tuple:
         print(f"Number of shards set to: {number_of_shards}")
 
         # Prompt for number of replicas
-        replicas_input = input("\nEnter number of replicas (Press Enter for default value 2): ").strip()
+        replicas_input = input(
+            "\nEnter number of replicas (Press Enter for default value 2): "
+        ).strip()
         if replicas_input == "":
             number_of_replicas = 2
         else:
@@ -494,33 +594,48 @@ def get_knn_index_details(self) -> tuple:
         print(f"Number of replicas set to: {number_of_replicas}")
 
         # Prompt for passage_text field name
-        passage_text_field = input("\nEnter the field name for text content (Press Enter for default 'passage_text'): ").strip()
+        passage_text_field = input(
+            "\nEnter the field name for text content (Press Enter for default 'passage_text'): "
+        ).strip()
         if passage_text_field == "":
             passage_text_field = "passage_text"
         print(f"Text content field name set to: {passage_text_field}")
 
         # Prompt for passage_chunk field name
-        passage_chunk_field = input("\nEnter the field name for passage chunks (Press Enter for default 'passage_chunk'): ").strip()
+        passage_chunk_field = input(
+            "\nEnter the field name for passage chunks (Press Enter for default 'passage_chunk'): "
+        ).strip()
         if passage_chunk_field == "":
             passage_chunk_field = "passage_chunk"
         print(f"Passage chunk field name set to: {passage_chunk_field}")
 
         # Prompt for embedding field name
-        embedding_field = input("\nEnter the field name for embeddings (Press Enter for default 'passage_embedding'): ").strip()
+        embedding_field = input(
+            "\nEnter the field name for embeddings (Press Enter for default 'passage_embedding'): "
+        ).strip()
         if embedding_field == "":
             embedding_field = "passage_embedding"
         print(f"Embedding field name set to: {embedding_field}")
 
-        return embedding_dimension, space_type, ef_construction, number_of_shards, number_of_replicas, passage_text_field, passage_chunk_field, embedding_field
+        return (
+            embedding_dimension,
+            space_type,
+            ef_construction,
+            number_of_shards,
+            number_of_replicas,
+            passage_text_field,
+            passage_chunk_field,
+            embedding_field,
+        )
 
     def save_config(self, config: dict):
         """
         Save configuration to the config file.
         """
         parser = configparser.ConfigParser()
-        parser['DEFAULT'] = config
-        config_path = os.path.abspath(self.CONFIG_FILE)
-        with open(self.CONFIG_FILE, 'w') as f:
+        parser["DEFAULT"] = config
+        os.path.abspath(self.CONFIG_FILE)
+        with open(self.CONFIG_FILE, "w") as f:
             parser.write(f)
 
     def setup_command(self):
@@ -530,20 +645,26 @@ def setup_command(self):
         # Begin setup by configuring necessary parameters
         self.setup_configuration()
 
-        if self.service_type == 'managed' and not self.initialize_clients():
-            print(f"\n{Fore.RED}Failed to initialize AWS clients. Setup incomplete.{Style.RESET_ALL}\n")
+        if self.service_type == "managed" and not self.initialize_clients():
+            print(
+                f"\n{Fore.RED}Failed to initialize AWS clients. Setup incomplete.{Style.RESET_ALL}\n"
+            )
             return
 
-        if self.service_type == 'managed':
+        if self.service_type == "managed":
             if not self.opensearch_endpoint:
-                print(f"\n{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n")
+                print(
+                    f"\n{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n"
+                )
                 return
             else:
                 self.opensearch_domain_name = self.get_opensearch_domain_name()
-        elif self.service_type == 'open-source':
+        elif self.service_type == "open-source":
             # Open-source setup
             if not self.opensearch_endpoint:
-                print(f"\n{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n")
+                print(
+                    f"\n{Fore.RED}OpenSearch endpoint not set. Setup incomplete.{Style.RESET_ALL}\n"
+                )
                 return
             else:
                 self.opensearch_domain_name = None
@@ -556,79 +677,113 @@ def setup_command(self):
             print("2. Use an existing KNN index")
             index_choice = input("Enter your choice (1-2): ").strip()
 
-            if index_choice == '1':
-                self.index_name = input("\nEnter a name for your new KNN index in OpenSearch: ").strip()
-                self.config['index_name'] = self.index_name
+            if index_choice == "1":
+                self.index_name = input(
+                    "\nEnter a name for your new KNN index in OpenSearch: "
+                ).strip()
+                self.config["index_name"] = self.index_name
                 self.save_config(self.config)
 
                 print("\nProceeding with index creation...\n")
-                embedding_dimension, space_type, ef_construction, number_of_shards, number_of_replicas, \
-                passage_text_field, passage_chunk_field, embedding_field = self.get_knn_index_details()
+                (
+                    embedding_dimension,
+                    space_type,
+                    ef_construction,
+                    number_of_shards,
+                    number_of_replicas,
+                    passage_text_field,
+                    passage_chunk_field,
+                    embedding_field,
+                ) = self.get_knn_index_details()
 
                 self.opensearch_connector = OpenSearchConnector(self.config)
                 self.opensearch_connector.opensearch_client = self.opensearch_client
                 self.opensearch_connector.index_name = self.index_name
 
                 if self.opensearch_connector.verify_and_create_index(
-                    embedding_dimension, space_type, ef_construction, number_of_shards,
-                    number_of_replicas, passage_text_field, passage_chunk_field, embedding_field
+                    embedding_dimension,
+                    space_type,
+                    ef_construction,
+                    number_of_shards,
+                    number_of_replicas,
+                    passage_text_field,
+                    passage_chunk_field,
+                    embedding_field,
                 ):
-                    print(f"\n{Fore.GREEN}KNN index '{self.index_name}' created successfully.{Style.RESET_ALL}\n")
+                    print(
+                        f"\n{Fore.GREEN}KNN index '{self.index_name}' created successfully.{Style.RESET_ALL}\n"
+                    )
                     # Save index details
-                    self.config['embedding_dimension'] = str(embedding_dimension)
-                    self.config['space_type'] = space_type
-                    self.config['ef_construction'] = str(ef_construction)
-                    self.config['number_of_shards'] = str(number_of_shards)
-                    self.config['number_of_replicas'] = str(number_of_replicas)
-                    self.config['passage_text_field'] = passage_text_field
-                    self.config['passage_chunk_field'] = passage_chunk_field
-                    self.config['embedding_field'] = embedding_field
+                    self.config["embedding_dimension"] = str(embedding_dimension)
+                    self.config["space_type"] = space_type
+                    self.config["ef_construction"] = str(ef_construction)
+                    self.config["number_of_shards"] = str(number_of_shards)
+                    self.config["number_of_replicas"] = str(number_of_replicas)
+                    self.config["passage_text_field"] = passage_text_field
+                    self.config["passage_chunk_field"] = passage_chunk_field
+                    self.config["embedding_field"] = embedding_field
                     self.save_config(self.config)
                 else:
-                    print(f"\n{Fore.RED}Index creation failed. Please check your permissions and try again.{Style.RESET_ALL}\n")
+                    print(
+                        f"\n{Fore.RED}Index creation failed. Please check your permissions and try again.{Style.RESET_ALL}\n"
+                    )
                     return
-            elif index_choice == '2':
-                existing_index_name = input("\nEnter the name of your existing KNN index: ").strip()
+            elif index_choice == "2":
+                existing_index_name = input(
+                    "\nEnter the name of your existing KNN index: "
+                ).strip()
                 if not existing_index_name:
-                    print(f"\n{Fore.RED}Index name cannot be empty. Aborting.{Style.RESET_ALL}\n")
+                    print(
+                        f"\n{Fore.RED}Index name cannot be empty. Aborting.{Style.RESET_ALL}\n"
+                    )
                     return
                 self.index_name = existing_index_name
-                self.config['index_name'] = self.index_name
+                self.config["index_name"] = self.index_name
                 self.save_config(self.config)
 
                 # Verify that the index exists
                 try:
                     if not self.opensearch_client.indices.exists(index=self.index_name):
-                        print(f"\n{Fore.RED}Index '{self.index_name}' does not exist in OpenSearch. Aborting.{Style.RESET_ALL}\n")
+                        print(
+                            f"\n{Fore.RED}Index '{self.index_name}' does not exist in OpenSearch. Aborting.{Style.RESET_ALL}\n"
+                        )
                         return
                     else:
-                        print(f"\n{Fore.GREEN}Index '{self.index_name}' exists in OpenSearch.{Style.RESET_ALL}\n")
+                        print(
+                            f"\n{Fore.GREEN}Index '{self.index_name}' exists in OpenSearch.{Style.RESET_ALL}\n"
+                        )
                         # Attempt to retrieve index settings and mappings
-                        index_info = self.opensearch_client.indices.get(index=self.index_name)
-                        settings = index_info[self.index_name]['settings']['index']
-                        mappings = index_info[self.index_name]['mappings']['properties']
+                        index_info = self.opensearch_client.indices.get(
+                            index=self.index_name
+                        )
+                        settings = index_info[self.index_name]["settings"]["index"]
+                        mappings = index_info[self.index_name]["mappings"]["properties"]
 
                         # Attempt to retrieve known fields
                         # For simplicity, assume defaults if they don't exist
-                        embedding_field = 'passage_embedding'
+                        embedding_field = "passage_embedding"
                         embedding_field_mappings = mappings.get(embedding_field, {})
-                        knn_mappings = embedding_field_mappings.get('method', {})
+                        embedding_field_mappings.get("method", {})
                         # These values might not be perfectly retrievable depending on the index mapping
                         # We'll do best-effort.
                         embedding_dimension = 768
-                        space_type = 'l2'
+                        space_type = "l2"
                         ef_construction = 512
-                        if 'method' in embedding_field_mappings:
-                            method = embedding_field_mappings['method']
-                            space_type = method.get('space_type', 'l2')
-                            ef_construction = method.get('parameters', {}).get('ef_construction', 512)
-
-                        number_of_shards = settings.get('number_of_shards', '2')
-                        number_of_replicas = settings.get('number_of_replicas', '2')
-                        passage_text_field = 'passage_text'
-                        passage_chunk_field = 'passage_chunk'
-
-                        print(f"\nUsing existing index '{self.index_name}' with the following settings:")
+                        if "method" in embedding_field_mappings:
+                            method = embedding_field_mappings["method"]
+                            space_type = method.get("space_type", "l2")
+                            ef_construction = method.get("parameters", {}).get(
+                                "ef_construction", 512
+                            )
+
+                        number_of_shards = settings.get("number_of_shards", "2")
+                        number_of_replicas = settings.get("number_of_replicas", "2")
+                        passage_text_field = "passage_text"
+                        passage_chunk_field = "passage_chunk"
+
+                        print(
+                            f"\nUsing existing index '{self.index_name}' with the following settings:"
+                        )
                         print(f"Embedding Dimension: {embedding_dimension}")
                         print(f"Space Type: {space_type}")
                         print(f"ef_construction: {ef_construction}")
@@ -639,34 +794,41 @@ def setup_command(self):
                         print(f"Embedding Field: '{embedding_field}'\n")
 
                         # Save index details
-                        self.config['embedding_dimension'] = str(embedding_dimension)
-                        self.config['space_type'] = space_type
-                        self.config['ef_construction'] = str(ef_construction)
-                        self.config['number_of_shards'] = str(number_of_shards)
-                        self.config['number_of_replicas'] = str(number_of_replicas)
-                        self.config['passage_text_field'] = passage_text_field
-                        self.config['passage_chunk_field'] = passage_chunk_field
-                        self.config['embedding_field'] = embedding_field
+                        self.config["embedding_dimension"] = str(embedding_dimension)
+                        self.config["space_type"] = space_type
+                        self.config["ef_construction"] = str(ef_construction)
+                        self.config["number_of_shards"] = str(number_of_shards)
+                        self.config["number_of_replicas"] = str(number_of_replicas)
+                        self.config["passage_text_field"] = passage_text_field
+                        self.config["passage_chunk_field"] = passage_chunk_field
+                        self.config["embedding_field"] = embedding_field
                         self.save_config(self.config)
 
                 except Exception as ex:
-                    print(f"\n{Fore.RED}Error retrieving index details: {ex}{Style.RESET_ALL}\n")
+                    print(
+                        f"\n{Fore.RED}Error retrieving index details: {ex}{Style.RESET_ALL}\n"
+                    )
                     return
 
             # Proceed with model registration if managed and semantic_with_llm
             self.model_register = ModelRegister(
-                self.config,
-                self.opensearch_client,
-                self.opensearch_domain_name
+                self.config, self.opensearch_client, self.opensearch_domain_name
             )
 
-            if self.service_type == 'managed' and self.config['default_search_method'] == 'semantic_with_llm':
+            if (
+                self.service_type == "managed"
+                and self.config["default_search_method"] == "semantic_with_llm"
+            ):
                 # Managed OpenSearch: Proceed with model registration for LLM
                 self.model_register.prompt_model_registration()
             else:
                 # Open-source or semantic without LLM: no model registration needed
-                print(f"{Fore.GREEN}Setup complete. No LLM model registration required.{Style.RESET_ALL}")
+                print(
+                    f"{Fore.GREEN}Setup complete. No LLM model registration required.{Style.RESET_ALL}"
+                )
 
         else:
             # Handle failure to initialize OpenSearch client
-            print(f"\n{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}\n")
+            print(
+                f"\n{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}\n"
+            )
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py
index 4e0d8479..cfcb2352 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py
@@ -5,13 +5,12 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-import boto3
-import botocore
 import json
 import time
-from urllib.parse import urlparse
+
 from colorama import Fore, Style
 
+
 class Serverless:
     def __init__(self, aoss_client, collection_name, iam_principal, aws_region):
         """
@@ -31,29 +30,73 @@ def create_security_policies(self):
         """
         Create security policies for serverless OpenSearch.
         """
-        encryption_policy = json.dumps({
-            "Rules": [{"Resource": [f"collection/{self.collection_name}"], "ResourceType": "collection"}],
-            "AWSOwnedKey": True
-        })
-        
-        network_policy = json.dumps([{
-            "Rules": [{"Resource": [f"collection/{self.collection_name}"], "ResourceType": "collection"}],
-            "AllowFromPublic": True
-        }])
-        
-        data_access_policy = json.dumps([{
-            "Rules": [
-                {"Resource": ["collection/*"], "Permission": ["aoss:*"], "ResourceType": "collection"},
-                {"Resource": ["index/*/*"], "Permission": ["aoss:*"], "ResourceType": "index"}
-            ],
-            "Principal": [self.iam_principal],
-            "Description": f"Data access policy for {self.collection_name}"
-        }])
-        
-        encryption_policy_name = self.get_truncated_name(f"{self.collection_name}-enc-policy")
-        self.create_security_policy("encryption", encryption_policy_name, f"{self.collection_name} encryption security policy", encryption_policy)
-        self.create_security_policy("network", f"{self.collection_name}-net-policy", f"{self.collection_name} network security policy", network_policy)
-        self.create_access_policy(self.get_truncated_name(f"{self.collection_name}-access-policy"), f"{self.collection_name} data access policy", data_access_policy)
+        encryption_policy = json.dumps(
+            {
+                "Rules": [
+                    {
+                        "Resource": [f"collection/{self.collection_name}"],
+                        "ResourceType": "collection",
+                    }
+                ],
+                "AWSOwnedKey": True,
+            }
+        )
+
+        network_policy = json.dumps(
+            [
+                {
+                    "Rules": [
+                        {
+                            "Resource": [f"collection/{self.collection_name}"],
+                            "ResourceType": "collection",
+                        }
+                    ],
+                    "AllowFromPublic": True,
+                }
+            ]
+        )
+
+        data_access_policy = json.dumps(
+            [
+                {
+                    "Rules": [
+                        {
+                            "Resource": ["collection/*"],
+                            "Permission": ["aoss:*"],
+                            "ResourceType": "collection",
+                        },
+                        {
+                            "Resource": ["index/*/*"],
+                            "Permission": ["aoss:*"],
+                            "ResourceType": "index",
+                        },
+                    ],
+                    "Principal": [self.iam_principal],
+                    "Description": f"Data access policy for {self.collection_name}",
+                }
+            ]
+        )
+
+        encryption_policy_name = self.get_truncated_name(
+            f"{self.collection_name}-enc-policy"
+        )
+        self.create_security_policy(
+            "encryption",
+            encryption_policy_name,
+            f"{self.collection_name} encryption security policy",
+            encryption_policy,
+        )
+        self.create_security_policy(
+            "network",
+            f"{self.collection_name}-net-policy",
+            f"{self.collection_name} network security policy",
+            network_policy,
+        )
+        self.create_access_policy(
+            self.get_truncated_name(f"{self.collection_name}-access-policy"),
+            f"{self.collection_name} data access policy",
+            data_access_policy,
+        )
 
     def create_security_policy(self, policy_type, name, description, policy_body):
         """
@@ -70,22 +113,28 @@ def create_security_policy(self, policy_type, name, description, policy_body):
                     description=description,
                     name=name,
                     policy=policy_body,
-                    type="encryption"
+                    type="encryption",
                 )
             elif policy_type.lower() == "network":
                 self.aoss_client.create_security_policy(
                     description=description,
                     name=name,
                     policy=policy_body,
-                    type="network"
+                    type="network",
                 )
             else:
                 raise ValueError("Invalid policy type specified.")
-            print(f"{Fore.GREEN}{policy_type.capitalize()} Policy '{name}' created successfully.{Style.RESET_ALL}")
+            print(
+                f"{Fore.GREEN}{policy_type.capitalize()} Policy '{name}' created successfully.{Style.RESET_ALL}"
+            )
         except self.aoss_client.exceptions.ConflictException:
-            print(f"{Fore.YELLOW}{policy_type.capitalize()} Policy '{name}' already exists.{Style.RESET_ALL}")
+            print(
+                f"{Fore.YELLOW}{policy_type.capitalize()} Policy '{name}' already exists.{Style.RESET_ALL}"
+            )
         except Exception as ex:
-            print(f"{Fore.RED}Error creating {policy_type} policy '{name}': {ex}{Style.RESET_ALL}")
+            print(
+                f"{Fore.RED}Error creating {policy_type} policy '{name}': {ex}{Style.RESET_ALL}"
+            )
 
     def create_access_policy(self, name, description, policy_body):
         """
@@ -97,16 +146,19 @@ def create_access_policy(self, name, description, policy_body):
         """
         try:
             self.aoss_client.create_access_policy(
-                description=description,
-                name=name,
-                policy=policy_body,
-                type="data"
+                description=description, name=name, policy=policy_body, type="data"
+            )
+            print(
+                f"{Fore.GREEN}Data Access Policy '{name}' created successfully.{Style.RESET_ALL}\n"
             )
-            print(f"{Fore.GREEN}Data Access Policy '{name}' created successfully.{Style.RESET_ALL}\n")
         except self.aoss_client.exceptions.ConflictException:
-            print(f"{Fore.YELLOW}Data Access Policy '{name}' already exists.{Style.RESET_ALL}\n")
+            print(
+                f"{Fore.YELLOW}Data Access Policy '{name}' already exists.{Style.RESET_ALL}\n"
+            )
         except Exception as ex:
-            print(f"{Fore.RED}Error creating data access policy '{name}': {ex}{Style.RESET_ALL}\n")
+            print(
+                f"{Fore.RED}Error creating data access policy '{name}': {ex}{Style.RESET_ALL}\n"
+            )
 
     def create_collection(self, collection_name, max_retries=3):
         """
@@ -121,15 +173,21 @@ def create_collection(self, collection_name, max_retries=3):
                 response = self.aoss_client.create_collection(
                     description=f"{collection_name} collection",
                     name=collection_name,
-                    type="VECTORSEARCH"
+                    type="VECTORSEARCH",
+                )
+                print(
+                    f"{Fore.GREEN}Collection '{collection_name}' creation initiated.{Style.RESET_ALL}"
                 )
-                print(f"{Fore.GREEN}Collection '{collection_name}' creation initiated.{Style.RESET_ALL}")
-                return response['createCollectionDetail']['id']
+                return response["createCollectionDetail"]["id"]
             except self.aoss_client.exceptions.ConflictException:
-                print(f"{Fore.YELLOW}Collection '{collection_name}' already exists.{Style.RESET_ALL}")
+                print(
+                    f"{Fore.YELLOW}Collection '{collection_name}' already exists.{Style.RESET_ALL}"
+                )
                 return self.get_collection_id(collection_name)
             except Exception as ex:
-                print(f"{Fore.RED}Error creating collection '{collection_name}' (Attempt {attempt+1}/{max_retries}): {ex}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Error creating collection '{collection_name}' (Attempt {attempt+1}/{max_retries}): {ex}{Style.RESET_ALL}"
+                )
                 if attempt == max_retries - 1:
                     return None
                 time.sleep(5)
@@ -144,9 +202,9 @@ def get_collection_id(self, collection_name):
         """
         try:
             response = self.aoss_client.list_collections()
-            for collection in response.get('collectionSummaries', []):
-                if collection.get('name') == collection_name:
-                    return collection.get('id')
+            for collection in response.get("collectionSummaries", []):
+                if collection.get("name") == collection_name:
+                    return collection.get("id")
         except Exception as ex:
             print(f"{Fore.RED}Error getting collection ID: {ex}{Style.RESET_ALL}")
         return None
@@ -164,20 +222,28 @@ def wait_for_collection_active(self, collection_id, max_wait_minutes=30):
         while time.time() - start_time < max_wait_minutes * 60:
             try:
                 response = self.aoss_client.batch_get_collection(ids=[collection_id])
-                status = response['collectionDetails'][0]['status']
-                if status == 'ACTIVE':
-                    print(f"{Fore.GREEN}Collection '{self.collection_name}' is now active.{Style.RESET_ALL}\n")
+                status = response["collectionDetails"][0]["status"]
+                if status == "ACTIVE":
+                    print(
+                        f"{Fore.GREEN}Collection '{self.collection_name}' is now active.{Style.RESET_ALL}\n"
+                    )
                     return True
-                elif status in ['FAILED', 'DELETED']:
-                    print(f"{Fore.RED}Collection creation failed or was deleted. Status: {status}{Style.RESET_ALL}\n")
+                elif status in ["FAILED", "DELETED"]:
+                    print(
+                        f"{Fore.RED}Collection creation failed or was deleted. Status: {status}{Style.RESET_ALL}\n"
+                    )
                     return False
                 else:
                     print(f"Collection status: {status}. Waiting...")
                     time.sleep(30)
             except Exception as ex:
-                print(f"{Fore.RED}Error checking collection status: {ex}{Style.RESET_ALL}")
+                print(
+                    f"{Fore.RED}Error checking collection status: {ex}{Style.RESET_ALL}"
+                )
                 time.sleep(30)
-        print(f"{Fore.RED}Timed out waiting for collection to become active after {max_wait_minutes} minutes.{Style.RESET_ALL}\n")
+        print(
+            f"{Fore.RED}Timed out waiting for collection to become active after {max_wait_minutes} minutes.{Style.RESET_ALL}\n"
+        )
         return False
 
     def get_collection_endpoint(self):
@@ -189,25 +255,37 @@ def get_collection_endpoint(self):
         try:
             collection_id = self.get_collection_id(self.collection_name)
             if not collection_id:
-                print(f"{Fore.RED}Collection '{self.collection_name}' not found.{Style.RESET_ALL}\n")
+                print(
+                    f"{Fore.RED}Collection '{self.collection_name}' not found.{Style.RESET_ALL}\n"
+                )
                 return None
-            
-            batch_get_response = self.aoss_client.batch_get_collection(ids=[collection_id])
-            collection_details = batch_get_response.get('collectionDetails', [])
-            
+
+            batch_get_response = self.aoss_client.batch_get_collection(
+                ids=[collection_id]
+            )
+            collection_details = batch_get_response.get("collectionDetails", [])
+
             if not collection_details:
-                print(f"{Fore.RED}No details found for collection ID '{collection_id}'.{Style.RESET_ALL}\n")
+                print(
+                    f"{Fore.RED}No details found for collection ID '{collection_id}'.{Style.RESET_ALL}\n"
+                )
                 return None
-            
-            endpoint = collection_details[0].get('collectionEndpoint')
+
+            endpoint = collection_details[0].get("collectionEndpoint")
             if endpoint:
-                print(f"Collection '{self.collection_name}' has endpoint URL: {endpoint}\n")
+                print(
+                    f"Collection '{self.collection_name}' has endpoint URL: {endpoint}\n"
+                )
                 return endpoint
             else:
-                print(f"{Fore.RED}No endpoint URL found in collection '{self.collection_name}'.{Style.RESET_ALL}\n")
+                print(
+                    f"{Fore.RED}No endpoint URL found in collection '{self.collection_name}'.{Style.RESET_ALL}\n"
+                )
                 return None
         except Exception as ex:
-            print(f"{Fore.RED}Error retrieving collection endpoint: {ex}{Style.RESET_ALL}\n")
+            print(
+                f"{Fore.RED}Error retrieving collection endpoint: {ex}{Style.RESET_ALL}\n"
+            )
             return None
 
     @staticmethod
@@ -221,4 +299,4 @@ def get_truncated_name(base_name, max_length=32):
         """
         if len(base_name) <= max_length:
             return base_name
-        return base_name[:max_length-3] + "..."
\ No newline at end of file
+        return base_name[: max_length - 3] + "..."
diff --git a/setup.py b/setup.py
index f935df39..4130e165 100644
--- a/setup.py
+++ b/setup.py
@@ -5,7 +5,6 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-
 #  Licensed to Elasticsearch B.V. under one or more contributor
 #  license agreements. See the NOTICE file distributed with
 #  this work for additional information regarding copyright
@@ -111,8 +110,8 @@
     extras_require=extras,
     # Entry points for console scripts
     entry_points={
-        'console_scripts': [
-            'rag=opensearch_py_ml.ml_commons.rag_pipeline.rag.rag:main',
+        "console_scripts": [
+            "rag=opensearch_py_ml.ml_commons.rag_pipeline.rag.rag:main",
         ],
     },
-)
\ No newline at end of file
+)
diff --git a/tests/rag/test_AiConnectorClass.py b/tests/rag/test_AiConnectorClass.py
index db5d73dd..e4776da5 100644
--- a/tests/rag/test_AiConnectorClass.py
+++ b/tests/rag/test_AiConnectorClass.py
@@ -5,32 +5,51 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-import unittest
-from unittest.mock import patch, MagicMock
 import json
-import requests
+import unittest
+from unittest.mock import MagicMock, patch
+
+from requests.auth import HTTPBasicAuth
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import (
+    AIConnectorHelper,
+)
 
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper import AIConnectorHelper
 
 class TestAIConnectorHelper(unittest.TestCase):
     def setUp(self):
-        self.region = 'us-east-1'
-        self.opensearch_domain_name = 'test-domain'
-        self.opensearch_domain_username = 'admin'
-        self.opensearch_domain_password = 'password'
-        self.aws_user_name = 'test-user'
-        self.aws_role_name = 'test-role'
-
-        self.domain_endpoint = 'search-test-domain.us-east-1.es.amazonaws.com'
-        self.domain_arn = 'arn:aws:es:us-east-1:123456789012:domain/test-domain'
-
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.AIConnectorHelper.get_opensearch_domain_info')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.OpenSearch')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.SecretHelper')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.IAMRoleHelper')
-    def test___init__(self, mock_iam_role_helper, mock_secret_helper, mock_opensearch, mock_get_opensearch_domain_info):
+        self.region = "us-east-1"
+        self.opensearch_domain_name = "test-domain"
+        self.opensearch_domain_username = "admin"
+        self.opensearch_domain_password = "password"
+        self.aws_user_name = "test-user"
+        self.aws_role_name = "test-role"
+
+        self.domain_endpoint = "search-test-domain.us-east-1.es.amazonaws.com"
+        self.domain_arn = "arn:aws:es:us-east-1:123456789012:domain/test-domain"
+
+    @patch(
+        "opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.AIConnectorHelper.get_opensearch_domain_info"
+    )
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.OpenSearch")
+    @patch(
+        "opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.SecretHelper"
+    )
+    @patch(
+        "opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.IAMRoleHelper"
+    )
+    def test___init__(
+        self,
+        mock_iam_role_helper,
+        mock_secret_helper,
+        mock_opensearch,
+        mock_get_opensearch_domain_info,
+    ):
         # Mock get_opensearch_domain_info
-        mock_get_opensearch_domain_info.return_value = (self.domain_endpoint, self.domain_arn)
+        mock_get_opensearch_domain_info.return_value = (
+            self.domain_endpoint,
+            self.domain_arn,
+        )
 
         # Instantiate AIConnectorHelper
         helper = AIConnectorHelper(
@@ -39,20 +58,24 @@ def test___init__(self, mock_iam_role_helper, mock_secret_helper, mock_opensearc
             self.opensearch_domain_username,
             self.opensearch_domain_password,
             self.aws_user_name,
-            self.aws_role_name
+            self.aws_role_name,
+            f"https://{self.domain_endpoint}",  # Add this line
         )
 
         # Assert domain URL
-        expected_domain_url = f'https://{self.domain_endpoint}'
+        expected_domain_url = f"https://{self.domain_endpoint}"
         self.assertEqual(helper.opensearch_domain_url, expected_domain_url)
 
         # Assert opensearch_client is initialized
         mock_opensearch.assert_called_once_with(
-            hosts=[{'host': self.domain_endpoint, 'port': 443}],
-            http_auth=(self.opensearch_domain_username, self.opensearch_domain_password),
+            hosts=[{"host": self.domain_endpoint, "port": 443}],
+            http_auth=(
+                self.opensearch_domain_username,
+                self.opensearch_domain_password,
+            ),
             use_ssl=True,
             verify_certs=True,
-            connection_class=unittest.mock.ANY
+            connection_class=unittest.mock.ANY,
         )
 
         # Assert IAMRoleHelper and SecretHelper are initialized
@@ -63,11 +86,11 @@ def test___init__(self, mock_iam_role_helper, mock_secret_helper, mock_opensearc
             opensearch_domain_password=self.opensearch_domain_password,
             aws_user_name=self.aws_user_name,
             aws_role_name=self.aws_role_name,
-            opensearch_domain_arn=self.domain_arn
+            opensearch_domain_arn=self.domain_arn,
         )
         mock_secret_helper.assert_called_once_with(self.region)
 
-    @patch('boto3.client')
+    @patch("boto3.client")
     def test_get_opensearch_domain_info_success(self, mock_boto3_client):
         # Mock the boto3 client
         mock_client_instance = MagicMock()
@@ -75,55 +98,60 @@ def test_get_opensearch_domain_info_success(self, mock_boto3_client):
 
         # Mock the describe_domain response
         mock_client_instance.describe_domain.return_value = {
-            'DomainStatus': {
-                'Endpoint': self.domain_endpoint,
-                'ARN': self.domain_arn
-            }
+            "DomainStatus": {"Endpoint": self.domain_endpoint, "ARN": self.domain_arn}
         }
 
         # Call the method
-        endpoint, arn = AIConnectorHelper.get_opensearch_domain_info(self.region, self.opensearch_domain_name)
+        endpoint, arn = AIConnectorHelper.get_opensearch_domain_info(
+            self.region, self.opensearch_domain_name
+        )
 
         # Assert the results
         self.assertEqual(endpoint, self.domain_endpoint)
         self.assertEqual(arn, self.domain_arn)
-        mock_client_instance.describe_domain.assert_called_once_with(DomainName=self.opensearch_domain_name)
+        mock_client_instance.describe_domain.assert_called_once_with(
+            DomainName=self.opensearch_domain_name
+        )
 
-    @patch('boto3.client')
+    @patch("boto3.client")
     def test_get_opensearch_domain_info_exception(self, mock_boto3_client):
         # Mock the boto3 client to raise an exception
         mock_client_instance = MagicMock()
         mock_boto3_client.return_value = mock_client_instance
-        mock_client_instance.describe_domain.side_effect = Exception('Test Exception')
+        mock_client_instance.describe_domain.side_effect = Exception("Test Exception")
 
         # Call the method
-        endpoint, arn = AIConnectorHelper.get_opensearch_domain_info(self.region, self.opensearch_domain_name)
+        endpoint, arn = AIConnectorHelper.get_opensearch_domain_info(
+            self.region, self.opensearch_domain_name
+        )
 
         # Assert the results are None
         self.assertIsNone(endpoint)
         self.assertIsNone(arn)
 
-    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
+    @patch.object(AIConnectorHelper, "iam_helper", create=True)
     def test_get_ml_auth_success(self, mock_iam_helper):
         # Mock the get_role_arn to return a role ARN
-        create_connector_role_name = 'test-create-connector-role'
-        create_connector_role_arn = 'arn:aws:iam::123456789012:role/test-create-connector-role'
+        create_connector_role_name = "test-create-connector-role"
+        create_connector_role_arn = (
+            "arn:aws:iam::123456789012:role/test-create-connector-role"
+        )
         mock_iam_helper.get_role_arn.return_value = create_connector_role_arn
 
         # Mock the assume_role to return temp credentials
         temp_credentials = {
             "AccessKeyId": "test-access-key",
             "SecretAccessKey": "test-secret-key",
-            "SessionToken": "test-session-token"
+            "SessionToken": "test-session-token",
         }
         mock_iam_helper.assume_role.return_value = temp_credentials
 
         # Instantiate helper
-        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+        with patch.object(AIConnectorHelper, "__init__", return_value=None):
             helper = AIConnectorHelper()
             helper.region = self.region
             helper.iam_helper = mock_iam_helper
-            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
+            helper.opensearch_domain_url = f"https://{self.domain_endpoint}"
             helper.opensearch_domain_arn = self.domain_arn
 
             # Call the method
@@ -136,14 +164,14 @@ def test_get_ml_auth_success(self, mock_iam_helper):
             # Since AWS4Auth is instantiated within the method, we can check if awsauth is not None
             self.assertIsNotNone(awsauth)
 
-    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
+    @patch.object(AIConnectorHelper, "iam_helper", create=True)
     def test_get_ml_auth_role_not_found(self, mock_iam_helper):
         # Mock the get_role_arn to return None
-        create_connector_role_name = 'test-create-connector-role'
+        create_connector_role_name = "test-create-connector-role"
         mock_iam_helper.get_role_arn.return_value = None
 
         # Instantiate helper
-        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+        with patch.object(AIConnectorHelper, "__init__", return_value=None):
             helper = AIConnectorHelper()
             helper.iam_helper = mock_iam_helper
 
@@ -151,20 +179,25 @@ def test_get_ml_auth_role_not_found(self, mock_iam_helper):
             with self.assertRaises(Exception) as context:
                 helper.get_ml_auth(create_connector_role_name)
 
-            self.assertTrue(f"IAM role '{create_connector_role_name}' not found." in str(context.exception))
+            self.assertTrue(
+                f"IAM role '{create_connector_role_name}' not found."
+                in str(context.exception)
+            )
 
-    @patch('requests.post')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.AWS4Auth')
-    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
-    def test_create_connector(self, mock_iam_helper, mock_aws4auth, mock_requests_post):
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.OpenSearch")
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.AWS4Auth")
+    @patch.object(AIConnectorHelper, "iam_helper", create=True)
+    def test_create_connector(self, mock_iam_helper, mock_aws4auth, mock_opensearch):
         # Mock the IAM helper methods
-        create_connector_role_name = 'test-create-connector-role'
-        create_connector_role_arn = 'arn:aws:iam::123456789012:role/test-create-connector-role'
+        create_connector_role_name = "test-create-connector-role"
+        create_connector_role_arn = (
+            "arn:aws:iam::123456789012:role/test-create-connector-role"
+        )
         mock_iam_helper.get_role_arn.return_value = create_connector_role_arn
         temp_credentials = {
             "AccessKeyId": "test-access-key",
             "SecretAccessKey": "test-secret-key",
-            "SessionToken": "test-session-token"
+            "SessionToken": "test-session-token",
         }
         mock_iam_helper.assume_role.return_value = temp_credentials
 
@@ -172,161 +205,175 @@ def test_create_connector(self, mock_iam_helper, mock_aws4auth, mock_requests_po
         mock_awsauth = MagicMock()
         mock_aws4auth.return_value = mock_awsauth
 
-        # Mock requests.post
-        response = MagicMock()
-        response.text = json.dumps({'connector_id': 'test-connector-id'})
-        mock_requests_post.return_value = response
+        # Mock OpenSearch client
+        mock_os_client = MagicMock()
+        mock_opensearch.return_value = mock_os_client
+        mock_os_client.transport.perform_request.return_value = (
+            200,
+            {},
+            '{"connector_id": "test-connector-id"}',
+        )
 
         # Instantiate helper
-        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+        with patch.object(AIConnectorHelper, "__init__", return_value=None):
             helper = AIConnectorHelper()
             helper.region = self.region
-            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
+            helper.opensearch_domain_url = f"https://{self.domain_endpoint}"
             helper.iam_helper = mock_iam_helper
 
-            # Call the method
-            payload = {'key': 'value'}
-            connector_id = helper.create_connector(create_connector_role_name, payload)
-
-            # Assert that the correct URL was used
-            expected_url = f'{helper.opensearch_domain_url}/_plugins/_ml/connectors/_create'
-            mock_requests_post.assert_called_once_with(
-                expected_url,
-                auth=mock_awsauth,
-                json=payload,
-                headers={"Content-Type": "application/json"}
-            )
+            # Mock the Connector class
+            mock_connector = MagicMock()
+            mock_connector.create_standalone_connector.return_value = {
+                "connector_id": "test-connector-id"
+            }
+            with patch(
+                "opensearch_py_ml.ml_commons.rag_pipeline.rag.AIConnectorHelper.Connector",
+                return_value=mock_connector,
+            ):
+                # Call the method
+                payload = {"key": "value"}
+                connector_id = helper.create_connector(
+                    create_connector_role_name, payload
+                )
+
+            # Assert that create_standalone_connector was called with the correct arguments
+            mock_connector.create_standalone_connector.assert_called_once_with(payload)
 
             # Assert that the connector_id is returned
-            self.assertEqual(connector_id, 'test-connector-id')
+            self.assertEqual(connector_id, "test-connector-id")
 
-    @patch.object(AIConnectorHelper, 'model_access_control', create=True)
-    def test_search_model_group(self, mock_model_access_control):
-        # Mock the response from model_access_control.search_model_group_by_name
-        model_group_name = 'test-model-group'
-        mock_response = {'hits': {'hits': []}}
-        mock_model_access_control.search_model_group_by_name.return_value = mock_response
+    @patch("requests.post")
+    @patch.object(AIConnectorHelper, "get_ml_auth")
+    @patch.object(AIConnectorHelper, "get_task")
+    def test_create_model(self, mock_get_task, mock_get_ml_auth, mock_requests_post):
+        # Mock get_ml_auth
+        mock_awsauth = MagicMock()
+        mock_get_ml_auth.return_value = mock_awsauth
+
+        # Mock requests.post
+        mock_response = MagicMock()
+        mock_response.text = json.dumps({"task_id": "test-task-id"})
+        mock_requests_post.return_value = mock_response
+
+        # Mock get_task
+        mock_get_task.return_value = {"model_id": "test-model-id"}
 
         # Instantiate helper
-        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+        with patch.object(AIConnectorHelper, "__init__", return_value=None):
             helper = AIConnectorHelper()
-            helper.model_access_control = mock_model_access_control
+            helper.opensearch_domain_url = f"https://{self.domain_endpoint}"
+            helper.model_access_control = MagicMock()
+            helper.model_access_control.get_model_group_id_by_name.return_value = (
+                "test-model-group-id"
+            )
 
             # Call the method
-            response = helper.search_model_group(model_group_name, 'test-create-connector-role')
+            model_id = helper.create_model(
+                "test-model",
+                "test description",
+                "test-connector-id",
+                "test-create-connector-role",
+                deploy=True,
+            )
 
-            # Assert that the method was called with correct parameters
-            mock_model_access_control.search_model_group_by_name.assert_called_once_with(model_group_name, size=1)
+            # Assert that the correct URL was used
+            expected_url = f"{helper.opensearch_domain_url}/_plugins/_ml/models/_register?deploy=true"
+            mock_requests_post.assert_called_once_with(
+                expected_url,
+                auth=mock_awsauth,
+                json={
+                    "name": "test-model",
+                    "function_name": "remote",
+                    "description": "test description",
+                    "model_group_id": "test-model-group-id",
+                    "connector_id": "test-connector-id",
+                },
+                headers={"Content-Type": "application/json"},
+            )
 
-            # Assert that the response is as expected
-            self.assertEqual(response, mock_response)
+            # Assert that get_task was called
+            mock_get_task.assert_called_once_with(
+                "test-task-id", "test-create-connector-role"
+            )
+
+            # Assert that model_id is returned
+            self.assertEqual(model_id, "test-model-id")
 
-    @patch.object(AIConnectorHelper, 'model_access_control', create=True)
-    def test_create_model_group_exists(self, mock_model_access_control):
+    def test_create_model_group_exists(self):
         # Mock the get_model_group_id_by_name to return an ID
-        model_group_name = 'test-model-group'
-        model_group_id = 'test-model-group-id'
-        mock_model_access_control.get_model_group_id_by_name.return_value = model_group_id
+        model_group_name = "test-model-group"
+        model_group_id = "test-model-group-id"
 
-        # Instantiate helper
-        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+        with patch.object(AIConnectorHelper, "__init__", return_value=None):
             helper = AIConnectorHelper()
-            helper.model_access_control = mock_model_access_control
+            helper.model_access_control = MagicMock()
+            helper.model_access_control.get_model_group_id_by_name.return_value = (
+                model_group_id
+            )
 
             # Call the method
-            result = helper.create_model_group(model_group_name, 'test description', 'test-create-connector-role')
+            result = helper.model_access_control.get_model_group_id_by_name(
+                model_group_name
+            )
 
             # Assert that the ID is returned
             self.assertEqual(result, model_group_id)
 
-    @patch.object(AIConnectorHelper, 'model_access_control', create=True)
-    def test_create_model_group_new(self, mock_model_access_control):
+    def test_create_model_group_new(self):
         # Mock the get_model_group_id_by_name to return None initially, then an ID
-        model_group_name = 'test-model-group'
-        model_group_id = 'test-model-group-id'
-
-        # First call returns None, second call returns the ID
-        mock_model_access_control.get_model_group_id_by_name.side_effect = [None, model_group_id]
+        model_group_name = "test-model-group"
+        model_group_id = "test-model-group-id"
 
-        # Instantiate helper
-        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+        with patch.object(AIConnectorHelper, "__init__", return_value=None):
             helper = AIConnectorHelper()
-            helper.model_access_control = mock_model_access_control
-
-            # Call the method
-            result = helper.create_model_group(model_group_name, 'test description', 'test-create-connector-role')
+            helper.model_access_control = MagicMock()
+            helper.model_access_control.get_model_group_id_by_name.side_effect = [
+                None,
+                model_group_id,
+            ]
+            helper.model_access_control.register_model_group.return_value = None
+
+            # Call the method to get or create the model group
+            result = helper.model_access_control.get_model_group_id_by_name(
+                model_group_name
+            )
+            if result is None:
+                helper.model_access_control.register_model_group(
+                    name=model_group_name, description="test description"
+                )
+                result = helper.model_access_control.get_model_group_id_by_name(
+                    model_group_name
+                )
 
             # Assert that register_model_group was called
-            mock_model_access_control.register_model_group.assert_called_once_with(name=model_group_name, description='test description')
-
-            # Assert that the ID is returned
-            self.assertEqual(result, model_group_id)
-
-    @patch.object(AIConnectorHelper, 'get_task')
-    @patch('time.sleep', return_value=None)
-    @patch('requests.post')
-    @patch.object(AIConnectorHelper, 'get_ml_auth')
-    @patch.object(AIConnectorHelper, 'create_model_group')
-    def test_create_model(self, mock_create_model_group, mock_get_ml_auth, mock_requests_post, mock_sleep, mock_get_task):
-        # Mock create_model_group
-        model_group_id = 'test-model-group-id'
-        mock_create_model_group.return_value = model_group_id
-
-        # Mock get_ml_auth
-        mock_awsauth = MagicMock()
-        mock_get_ml_auth.return_value = mock_awsauth
-
-        # Mock requests.post
-        response = MagicMock()
-        response.text = json.dumps({'model_id': 'test-model-id'})
-        mock_requests_post.return_value = response
-
-        # Instantiate helper
-        with patch.object(AIConnectorHelper, '__init__', return_value=None):
-            helper = AIConnectorHelper()
-            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
-
-            # Call the method
-            model_id = helper.create_model('test-model', 'test description', 'test-connector-id', 'test-create-connector-role', deploy=True)
-
-            # Assert that create_model_group was called
-            mock_create_model_group.assert_called_once_with('test-model', 'test description', 'test-create-connector-role')
+            helper.model_access_control.register_model_group.assert_called_once_with(
+                name=model_group_name, description="test description"
+            )
 
-            # Assert that the correct URL was used
-            expected_url = f'{helper.opensearch_domain_url}/_plugins/_ml/models/_register?deploy=true'
-            payload = {
-                "name": 'test-model',
-                "function_name": "remote",
-                "description": 'test description',
-                "model_group_id": model_group_id,
-                "connector_id": 'test-connector-id'
-            }
-            mock_requests_post.assert_called_once_with(
-                expected_url,
-                auth=mock_awsauth,
-                json=payload,
-                headers={"Content-Type": "application/json"}
+            # Assert that get_model_group_id_by_name was called twice
+            self.assertEqual(
+                helper.model_access_control.get_model_group_id_by_name.call_count, 2
             )
 
-            # Assert that model_id is returned
-            self.assertEqual(model_id, 'test-model-id')
+            # Assert that the ID is returned
+        self.assertEqual(result, model_group_id)
 
-    @patch('requests.post')
+    @patch("requests.post")
     def test_deploy_model(self, mock_requests_post):
         # Mock requests.post
         response = MagicMock()
-        response.text = 'Deploy model response'
+        response.text = "Deploy model response"
         mock_requests_post.return_value = response
 
         # Instantiate helper
-        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+        with patch.object(AIConnectorHelper, "__init__", return_value=None):
             helper = AIConnectorHelper()
-            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
+            helper.opensearch_domain_url = f"https://{self.domain_endpoint}"
             helper.opensearch_domain_username = self.opensearch_domain_username
             helper.opensearch_domain_password = self.opensearch_domain_password
 
             # Call the method
-            result = helper.deploy_model('test-model-id')
+            result = helper.deploy_model("test-model-id")
 
             # Assert that the method was called once
             mock_requests_post.assert_called_once()
@@ -335,36 +382,37 @@ def test_deploy_model(self, mock_requests_post):
             args, kwargs = mock_requests_post.call_args
 
             # Assert URL
-            expected_url = f'{helper.opensearch_domain_url}/_plugins/_ml/models/test-model-id/_deploy'
+            expected_url = f"{helper.opensearch_domain_url}/_plugins/_ml/models/test-model-id/_deploy"
             self.assertEqual(args[0], expected_url)
 
             # Assert headers
-            self.assertEqual(kwargs['headers'], {"Content-Type": "application/json"})
+            self.assertEqual(kwargs["headers"], {"Content-Type": "application/json"})
 
             # Assert auth
-            self.assertIsInstance(kwargs['auth'], requests.auth.HTTPBasicAuth)
-            self.assertEqual(kwargs['auth'].username, self.opensearch_domain_username)
-            self.assertEqual(kwargs['auth'].password, self.opensearch_domain_password)
+            self.assertIsInstance(kwargs["auth"], HTTPBasicAuth)
+            self.assertEqual(kwargs["auth"].username, self.opensearch_domain_username)
+            self.assertEqual(kwargs["auth"].password, self.opensearch_domain_password)
 
             # Assert that the response is returned
             self.assertEqual(result, response)
-    @patch('requests.post')
+
+    @patch("requests.post")
     def test_predict(self, mock_requests_post):
         # Mock requests.post
         response = MagicMock()
-        response.text = 'Predict response'
+        response.text = "Predict response"
         mock_requests_post.return_value = response
 
         # Instantiate helper
-        with patch.object(AIConnectorHelper, '__init__', return_value=None):
+        with patch.object(AIConnectorHelper, "__init__", return_value=None):
             helper = AIConnectorHelper()
-            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
+            helper.opensearch_domain_url = f"https://{self.domain_endpoint}"
             helper.opensearch_domain_username = self.opensearch_domain_username
             helper.opensearch_domain_password = self.opensearch_domain_password
 
             # Call the method
-            payload = {'input': 'test input'}
-            result = helper.predict('test-model-id', payload)
+            payload = {"input": "test input"}
+            result = helper.predict("test-model-id", payload)
 
             # Assert that the method was called once
             mock_requests_post.assert_called_once()
@@ -373,150 +421,23 @@ def test_predict(self, mock_requests_post):
             args, kwargs = mock_requests_post.call_args
 
             # Assert URL
-            expected_url = f'{helper.opensearch_domain_url}/_plugins/_ml/models/test-model-id/_predict'
+            expected_url = f"{helper.opensearch_domain_url}/_plugins/_ml/models/test-model-id/_predict"
             self.assertEqual(args[0], expected_url)
 
             # Assert JSON payload
-            self.assertEqual(kwargs['json'], payload)
+            self.assertEqual(kwargs["json"], payload)
 
             # Assert headers
-            self.assertEqual(kwargs['headers'], {"Content-Type": "application/json"})
+            self.assertEqual(kwargs["headers"], {"Content-Type": "application/json"})
 
             # Assert auth
-            self.assertIsInstance(kwargs['auth'], requests.auth.HTTPBasicAuth)
-            self.assertEqual(kwargs['auth'].username, self.opensearch_domain_username)
-            self.assertEqual(kwargs['auth'].password, self.opensearch_domain_password)
+            self.assertIsInstance(kwargs["auth"], HTTPBasicAuth)
+            self.assertEqual(kwargs["auth"].username, self.opensearch_domain_username)
+            self.assertEqual(kwargs["auth"].password, self.opensearch_domain_password)
 
             # Assert that the response is returned
             self.assertEqual(result, response)
 
-    @patch('time.sleep', return_value=None)
-    @patch.object(AIConnectorHelper, 'create_connector')
-    @patch.object(AIConnectorHelper, 'secret_helper', create=True)
-    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
-    def test_create_connector_with_secret(self, mock_iam_helper, mock_secret_helper, mock_create_connector, mock_sleep):
-        # Mock secret_helper methods
-        secret_name = 'test-secret'
-        secret_value = 'test-secret-value'
-        secret_arn = 'arn:aws:secretsmanager:us-east-1:123456789012:secret:test-secret'
-        mock_secret_helper.secret_exists.return_value = False
-        mock_secret_helper.create_secret.return_value = secret_arn
-        mock_secret_helper.get_secret_arn.return_value = secret_arn
-
-        # Mock iam_helper methods
-        connector_role_name = 'test-connector-role'
-        create_connector_role_name = 'test-create-connector-role'
-        connector_role_arn = 'arn:aws:iam::123456789012:role/test-connector-role'
-        create_connector_role_arn = 'arn:aws:iam::123456789012:role/test-create-connector-role'
-        mock_iam_helper.role_exists.side_effect = [False, False]
-        mock_iam_helper.create_iam_role.side_effect = [connector_role_arn, create_connector_role_arn]
-        mock_iam_helper.get_user_arn.return_value = 'arn:aws:iam::123456789012:user/test-user'
-        mock_iam_helper.get_role_arn.side_effect = [connector_role_arn, create_connector_role_arn]
-        mock_iam_helper.map_iam_role_to_backend_role.return_value = None
-
-        # Mock create_connector
-        connector_id = 'test-connector-id'
-        mock_create_connector.return_value = connector_id
-
-        # Instantiate helper
-        with patch.object(AIConnectorHelper, '__init__', return_value=None):
-            helper = AIConnectorHelper()
-            helper.region = self.region
-            helper.aws_user_name = self.aws_user_name
-            helper.aws_role_name = self.aws_role_name
-            helper.opensearch_domain_arn = self.domain_arn
-            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
-            helper.iam_helper = mock_iam_helper
-            helper.secret_helper = mock_secret_helper
-
-            # Prepare input
-            create_connector_input = {'key': 'value'}
-
-            # Call the method
-            result = helper.create_connector_with_secret(
-                secret_name,
-                secret_value,
-                connector_role_name,
-                create_connector_role_name,
-                create_connector_input,
-                sleep_time_in_seconds=0  # For faster testing
-            )
-
-            # Assert that the methods were called
-            mock_secret_helper.secret_exists.assert_called_once_with(secret_name)
-            mock_secret_helper.create_secret.assert_called_once_with(secret_name, secret_value)
-
-            self.assertEqual(mock_iam_helper.role_exists.call_count, 2)
-            self.assertEqual(mock_iam_helper.create_iam_role.call_count, 2)
-            mock_iam_helper.map_iam_role_to_backend_role.assert_called_once_with(create_connector_role_arn)
-
-            # Assert that create_connector was called
-            payload = create_connector_input.copy()
-            payload['credential'] = {
-                "secretArn": secret_arn,
-                "roleArn": connector_role_arn
-            }
-            mock_create_connector.assert_called_once_with(create_connector_role_name, payload)
-
-            # Assert that the connector_id is returned
-            self.assertEqual(result, connector_id)
-
-    @patch('time.sleep', return_value=None)
-    @patch.object(AIConnectorHelper, 'create_connector')
-    @patch.object(AIConnectorHelper, 'iam_helper', create=True)
-    def test_create_connector_with_role(self, mock_iam_helper, mock_create_connector, mock_sleep):
-        # Mock iam_helper methods
-        connector_role_name = 'test-connector-role'
-        create_connector_role_name = 'test-create-connector-role'
-        connector_role_arn = 'arn:aws:iam::123456789012:role/test-connector-role'
-        create_connector_role_arn = 'arn:aws:iam::123456789012:role/test-create-connector-role'
-        mock_iam_helper.role_exists.side_effect = [False, False]
-        mock_iam_helper.create_iam_role.side_effect = [connector_role_arn, create_connector_role_arn]
-        mock_iam_helper.get_user_arn.return_value = 'arn:aws:iam::123456789012:user/test-user'
-        mock_iam_helper.get_role_arn.side_effect = [connector_role_arn, create_connector_role_arn]
-        mock_iam_helper.map_iam_role_to_backend_role.return_value = None
-
-        # Mock create_connector
-        connector_id = 'test-connector-id'
-        mock_create_connector.return_value = connector_id
-
-        # Instantiate helper
-        with patch.object(AIConnectorHelper, '__init__', return_value=None):
-            helper = AIConnectorHelper()
-            helper.region = self.region
-            helper.aws_user_name = self.aws_user_name
-            helper.aws_role_name = self.aws_role_name
-            helper.opensearch_domain_arn = self.domain_arn
-            helper.opensearch_domain_url = f'https://{self.domain_endpoint}'
-            helper.iam_helper = mock_iam_helper
-
-            # Prepare input
-            create_connector_input = {'key': 'value'}
-            connector_role_inline_policy = {'Statement': []}
-
-            # Call the method
-            result = helper.create_connector_with_role(
-                connector_role_inline_policy,
-                connector_role_name,
-                create_connector_role_name,
-                create_connector_input,
-                sleep_time_in_seconds=0  # For faster testing
-            )
-
-            # Assert that the methods were called
-            self.assertEqual(mock_iam_helper.role_exists.call_count, 2)
-            self.assertEqual(mock_iam_helper.create_iam_role.call_count, 2)
-            mock_iam_helper.map_iam_role_to_backend_role.assert_called_once_with(create_connector_role_arn)
-
-            # Assert that create_connector was called
-            payload = create_connector_input.copy()
-            payload['credential'] = {
-                "roleArn": connector_role_arn
-            }
-            mock_create_connector.assert_called_once_with(create_connector_role_name, payload)
-
-            # Assert that the connector_id is returned
-            self.assertEqual(result, connector_id)
 
-if __name__ == '__main__':
-    unittest.main()
\ No newline at end of file
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/rag/test_IAMRoleHelper.py b/tests/rag/test_IAMRoleHelper.py
index d2b18eff..f0366dbd 100644
--- a/tests/rag/test_IAMRoleHelper.py
+++ b/tests/rag/test_IAMRoleHelper.py
@@ -5,92 +5,95 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-import unittest
-from unittest.mock import patch, MagicMock
-from botocore.exceptions import ClientError
 import json
 import logging
+import unittest
+from unittest.mock import MagicMock, patch
+
+from botocore.exceptions import ClientError
+
+from opensearch_py_ml.ml_commons.IAMRoleHelper import IAMRoleHelper
 
-# Assuming IAMRoleHelper is defined in iam_role_helper.py
-from opensearch_py_ml.ml_commons.IAMRoleHelper import IAMRoleHelper  # Replace with the actual module path if different
 
 class TestIAMRoleHelper(unittest.TestCase):
 
     def setUp(self):
-        self.region = 'us-east-1'
+        self.region = "us-east-1"
         self.iam_helper = IAMRoleHelper(region=self.region)
 
         # Configure logging to suppress error logs during tests
-        logger = logging.getLogger('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper')
+        logger = logging.getLogger("opensearch_py_ml.ml_commons.IAMRoleHelper")
         logger.setLevel(logging.CRITICAL)  # Suppress logs below CRITICAL during tests
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_role_exists_true(self, mock_boto_client):
         mock_iam_client = MagicMock()
         mock_boto_client.return_value = mock_iam_client
 
-        mock_iam_client.get_role.return_value = {'Role': {'RoleName': 'test-role'}}
+        mock_iam_client.get_role.return_value = {"Role": {"RoleName": "test-role"}}
 
-        result = self.iam_helper.role_exists('test-role')
+        result = self.iam_helper.role_exists("test-role")
 
         self.assertTrue(result)
-        mock_iam_client.get_role.assert_called_with(RoleName='test-role')
+        mock_iam_client.get_role.assert_called_with(RoleName="test-role")
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_role_exists_false(self, mock_boto_client):
         mock_iam_client = MagicMock()
         mock_boto_client.return_value = mock_iam_client
 
         error_response = {
-            'Error': {
-                'Code': 'NoSuchEntity',
-                'Message': 'Role does not exist'
-            }
+            "Error": {"Code": "NoSuchEntity", "Message": "Role does not exist"}
         }
-        mock_iam_client.get_role.side_effect = ClientError(error_response, 'GetRole')
+        mock_iam_client.get_role.side_effect = ClientError(error_response, "GetRole")
 
-        result = self.iam_helper.role_exists('nonexistent-role')
+        result = self.iam_helper.role_exists("nonexistent-role")
 
         self.assertFalse(result)
-        mock_iam_client.get_role.assert_called_with(RoleName='nonexistent-role')
+        mock_iam_client.get_role.assert_called_with(RoleName="nonexistent-role")
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_delete_role_success(self, mock_boto_client):
         mock_iam_client = MagicMock()
         mock_boto_client.return_value = mock_iam_client
 
         # Mock responses for list_attached_role_policies and list_role_policies
         mock_iam_client.list_attached_role_policies.return_value = {
-            'AttachedPolicies': [{'PolicyArn': 'arn:aws:iam::aws:policy/ExamplePolicy'}]
+            "AttachedPolicies": [{"PolicyArn": "arn:aws:iam::aws:policy/ExamplePolicy"}]
         }
         mock_iam_client.list_role_policies.return_value = {
-            'PolicyNames': ['InlinePolicy']
+            "PolicyNames": ["InlinePolicy"]
         }
 
-        self.iam_helper.delete_role('test-role')
+        self.iam_helper.delete_role("test-role")
 
-        mock_iam_client.detach_role_policy.assert_called_with(RoleName='test-role', PolicyArn='arn:aws:iam::aws:policy/ExamplePolicy')
-        mock_iam_client.delete_role_policy.assert_called_with(RoleName='test-role', PolicyName='InlinePolicy')
-        mock_iam_client.delete_role.assert_called_with(RoleName='test-role')
+        mock_iam_client.detach_role_policy.assert_called_with(
+            RoleName="test-role", PolicyArn="arn:aws:iam::aws:policy/ExamplePolicy"
+        )
+        mock_iam_client.delete_role_policy.assert_called_with(
+            RoleName="test-role", PolicyName="InlinePolicy"
+        )
+        mock_iam_client.delete_role.assert_called_with(RoleName="test-role")
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_delete_role_not_exist(self, mock_boto_client):
         mock_iam_client = MagicMock()
         mock_boto_client.return_value = mock_iam_client
 
         error_response = {
-            'Error': {
-                'Code': 'NoSuchEntity',
-                'Message': 'Role does not exist'
-            }
+            "Error": {"Code": "NoSuchEntity", "Message": "Role does not exist"}
         }
-        mock_iam_client.list_attached_role_policies.side_effect = ClientError(error_response, 'ListAttachedRolePolicies')
+        mock_iam_client.list_attached_role_policies.side_effect = ClientError(
+            error_response, "ListAttachedRolePolicies"
+        )
 
-        self.iam_helper.delete_role('nonexistent-role')
+        self.iam_helper.delete_role("nonexistent-role")
 
-        mock_iam_client.list_attached_role_policies.assert_called_with(RoleName='nonexistent-role')
+        mock_iam_client.list_attached_role_policies.assert_called_with(
+            RoleName="nonexistent-role"
+        )
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_create_iam_role_success(self, mock_boto_client):
         mock_iam_client = MagicMock()
         mock_boto_client.return_value = mock_iam_client
@@ -99,24 +102,26 @@ def test_create_iam_role_success(self, mock_boto_client):
         inline_policy = {"Version": "2012-10-17", "Statement": []}
 
         mock_iam_client.create_role.return_value = {
-            'Role': {'Arn': 'arn:aws:iam::123456789012:role/test-role'}
+            "Role": {"Arn": "arn:aws:iam::123456789012:role/test-role"}
         }
 
-        role_arn = self.iam_helper.create_iam_role('test-role', trust_policy, inline_policy)
+        role_arn = self.iam_helper.create_iam_role(
+            "test-role", trust_policy, inline_policy
+        )
 
-        self.assertEqual(role_arn, 'arn:aws:iam::123456789012:role/test-role')
+        self.assertEqual(role_arn, "arn:aws:iam::123456789012:role/test-role")
         mock_iam_client.create_role.assert_called_with(
-            RoleName='test-role',
+            RoleName="test-role",
             AssumeRolePolicyDocument=json.dumps(trust_policy),
-            Description='Role with custom trust and inline policies',
+            Description="Role with custom trust and inline policies",
         )
         mock_iam_client.put_role_policy.assert_called_with(
-            RoleName='test-role',
-            PolicyName='InlinePolicy',
-            PolicyDocument=json.dumps(inline_policy)
+            RoleName="test-role",
+            PolicyName="InlinePolicy",
+            PolicyDocument=json.dumps(inline_policy),
         )
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_create_iam_role_error(self, mock_boto_client):
         mock_iam_client = MagicMock()
         mock_boto_client.return_value = mock_iam_client
@@ -125,179 +130,177 @@ def test_create_iam_role_error(self, mock_boto_client):
         inline_policy = {"Version": "2012-10-17", "Statement": []}
 
         error_response = {
-            'Error': {
-                'Code': 'EntityAlreadyExists',
-                'Message': 'Role already exists'
-            }
+            "Error": {"Code": "EntityAlreadyExists", "Message": "Role already exists"}
         }
-        mock_iam_client.create_role.side_effect = ClientError(error_response, 'CreateRole')
+        mock_iam_client.create_role.side_effect = ClientError(
+            error_response, "CreateRole"
+        )
 
-        role_arn = self.iam_helper.create_iam_role('existing-role', trust_policy, inline_policy)
+        role_arn = self.iam_helper.create_iam_role(
+            "existing-role", trust_policy, inline_policy
+        )
 
         self.assertIsNone(role_arn)
         mock_iam_client.create_role.assert_called_with(
-            RoleName='existing-role',
+            RoleName="existing-role",
             AssumeRolePolicyDocument=json.dumps(trust_policy),
-            Description='Role with custom trust and inline policies',
+            Description="Role with custom trust and inline policies",
         )
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_get_role_arn_success(self, mock_boto_client):
         mock_iam_client = MagicMock()
         mock_boto_client.return_value = mock_iam_client
 
         mock_iam_client.get_role.return_value = {
-            'Role': {'Arn': 'arn:aws:iam::123456789012:role/test-role'}
+            "Role": {"Arn": "arn:aws:iam::123456789012:role/test-role"}
         }
 
-        role_arn = self.iam_helper.get_role_arn('test-role')
+        role_arn = self.iam_helper.get_role_arn("test-role")
 
-        self.assertEqual(role_arn, 'arn:aws:iam::123456789012:role/test-role')
-        mock_iam_client.get_role.assert_called_with(RoleName='test-role')
+        self.assertEqual(role_arn, "arn:aws:iam::123456789012:role/test-role")
+        mock_iam_client.get_role.assert_called_with(RoleName="test-role")
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_get_role_arn_not_found(self, mock_boto_client):
         mock_iam_client = MagicMock()
         mock_boto_client.return_value = mock_iam_client
 
         error_response = {
-            'Error': {
-                'Code': 'NoSuchEntity',
-                'Message': 'Role does not exist'
-            }
+            "Error": {"Code": "NoSuchEntity", "Message": "Role does not exist"}
         }
-        mock_iam_client.get_role.side_effect = ClientError(error_response, 'GetRole')
+        mock_iam_client.get_role.side_effect = ClientError(error_response, "GetRole")
 
-        role_arn = self.iam_helper.get_role_arn('nonexistent-role')
+        role_arn = self.iam_helper.get_role_arn("nonexistent-role")
 
         self.assertIsNone(role_arn)
-        mock_iam_client.get_role.assert_called_with(RoleName='nonexistent-role')
+        mock_iam_client.get_role.assert_called_with(RoleName="nonexistent-role")
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_get_user_arn_success(self, mock_boto_client):
         mock_iam_client = MagicMock()
         mock_boto_client.return_value = mock_iam_client
 
         mock_iam_client.get_user.return_value = {
-            'User': {'Arn': 'arn:aws:iam::123456789012:user/test-user'}
+            "User": {"Arn": "arn:aws:iam::123456789012:user/test-user"}
         }
 
-        user_arn = self.iam_helper.get_user_arn('test-user')
+        user_arn = self.iam_helper.get_user_arn("test-user")
 
-        self.assertEqual(user_arn, 'arn:aws:iam::123456789012:user/test-user')
-        mock_iam_client.get_user.assert_called_with(UserName='test-user')
+        self.assertEqual(user_arn, "arn:aws:iam::123456789012:user/test-user")
+        mock_iam_client.get_user.assert_called_with(UserName="test-user")
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_get_user_arn_not_found(self, mock_boto_client):
         mock_iam_client = MagicMock()
         mock_boto_client.return_value = mock_iam_client
 
         error_response = {
-            'Error': {
-                'Code': 'NoSuchEntity',
-                'Message': 'User does not exist'
-            }
+            "Error": {"Code": "NoSuchEntity", "Message": "User does not exist"}
         }
-        mock_iam_client.get_user.side_effect = ClientError(error_response, 'GetUser')
+        mock_iam_client.get_user.side_effect = ClientError(error_response, "GetUser")
 
-        user_arn = self.iam_helper.get_user_arn('nonexistent-user')
+        user_arn = self.iam_helper.get_user_arn("nonexistent-user")
 
         self.assertIsNone(user_arn)
-        mock_iam_client.get_user.assert_called_with(UserName='nonexistent-user')
+        mock_iam_client.get_user.assert_called_with(UserName="nonexistent-user")
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_assume_role_success(self, mock_boto_client):
         mock_sts_client = MagicMock()
         mock_boto_client.return_value = mock_sts_client
 
         mock_sts_client.assume_role.return_value = {
-            'Credentials': {
-                'AccessKeyId': 'ASIA...',
-                'SecretAccessKey': 'secret',
-                'SessionToken': 'token'
+            "Credentials": {
+                "AccessKeyId": "ASIA...",
+                "SecretAccessKey": "secret",
+                "SessionToken": "token",
             }
         }
 
-        role_arn = 'arn:aws:iam::123456789012:role/test-role'
-        credentials = self.iam_helper.assume_role(role_arn, 'test-session')
+        role_arn = "arn:aws:iam::123456789012:role/test-role"
+        credentials = self.iam_helper.assume_role(role_arn, "test-session")
 
         self.assertIsNotNone(credentials)
-        self.assertEqual(credentials['AccessKeyId'], 'ASIA...')
+        self.assertEqual(credentials["AccessKeyId"], "ASIA...")
         mock_sts_client.assume_role.assert_called_with(
             RoleArn=role_arn,
-            RoleSessionName='test-session',
+            RoleSessionName="test-session",
         )
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
     def test_assume_role_failure(self, mock_boto_client):
         mock_sts_client = MagicMock()
         mock_boto_client.return_value = mock_sts_client
 
         error_response = {
-            'Error': {
-                'Code': 'AccessDenied',
-                'Message': 'User is not authorized to perform: sts:AssumeRole'
+            "Error": {
+                "Code": "AccessDenied",
+                "Message": "User is not authorized to perform: sts:AssumeRole",
             }
         }
-        mock_sts_client.assume_role.side_effect = ClientError(error_response, 'AssumeRole')
+        mock_sts_client.assume_role.side_effect = ClientError(
+            error_response, "AssumeRole"
+        )
 
-        role_arn = 'arn:aws:iam::123456789012:role/unauthorized-role'
-        credentials = self.iam_helper.assume_role(role_arn, 'test-session')
+        role_arn = "arn:aws:iam::123456789012:role/unauthorized-role"
+        credentials = self.iam_helper.assume_role(role_arn, "test-session")
 
         self.assertIsNone(credentials)
         mock_sts_client.assume_role.assert_called_with(
             RoleArn=role_arn,
-            RoleSessionName='test-session',
+            RoleSessionName="test-session",
         )
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.requests.put')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.requests.put")
     def test_map_iam_role_to_backend_role_success(self, mock_put):
         mock_response = MagicMock()
         mock_response.status_code = 200
         mock_put.return_value = mock_response
 
-        self.iam_helper.opensearch_domain_url = 'https://search-domain'
-        self.iam_helper.opensearch_domain_username = 'user'
-        self.iam_helper.opensearch_domain_password = 'pass'
+        self.iam_helper.opensearch_domain_url = "https://search-domain"
+        self.iam_helper.opensearch_domain_username = "user"
+        self.iam_helper.opensearch_domain_password = "pass"
 
-        iam_role_arn = 'arn:aws:iam::123456789012:role/test-role'
+        iam_role_arn = "arn:aws:iam::123456789012:role/test-role"
 
         self.iam_helper.map_iam_role_to_backend_role(iam_role_arn)
 
         mock_put.assert_called_once()
         args, kwargs = mock_put.call_args
-        self.assertIn('/_plugins/_security/api/rolesmapping/ml_full_access', args[0])
-        self.assertEqual(kwargs['auth'], ('user', 'pass'))
-        self.assertEqual(kwargs['json'], {'backend_roles': [iam_role_arn]})
+        self.assertIn("/_plugins/_security/api/rolesmapping/ml_full_access", args[0])
+        self.assertEqual(kwargs["auth"], ("user", "pass"))
+        self.assertEqual(kwargs["json"], {"backend_roles": [iam_role_arn]})
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.IAMRoleHelper.requests.put')
+    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.requests.put")
     def test_map_iam_role_to_backend_role_failure(self, mock_put):
         mock_response = MagicMock()
         mock_response.status_code = 403
-        mock_response.text = 'Forbidden'
+        mock_response.text = "Forbidden"
         mock_put.return_value = mock_response
 
-        self.iam_helper.opensearch_domain_url = 'https://search-domain'
-        self.iam_helper.opensearch_domain_username = 'user'
-        self.iam_helper.opensearch_domain_password = 'pass'
+        self.iam_helper.opensearch_domain_url = "https://search-domain"
+        self.iam_helper.opensearch_domain_username = "user"
+        self.iam_helper.opensearch_domain_password = "pass"
 
-        iam_role_arn = 'arn:aws:iam::123456789012:role/test-role'
+        iam_role_arn = "arn:aws:iam::123456789012:role/test-role"
 
         self.iam_helper.map_iam_role_to_backend_role(iam_role_arn)
 
         mock_put.assert_called_once()
         args, kwargs = mock_put.call_args
-        self.assertIn('/_plugins/_security/api/rolesmapping/ml_full_access', args[0])
+        self.assertIn("/_plugins/_security/api/rolesmapping/ml_full_access", args[0])
 
     def test_get_iam_user_name_from_arn_valid(self):
-        iam_principal_arn = 'arn:aws:iam::123456789012:user/test-user'
+        iam_principal_arn = "arn:aws:iam::123456789012:user/test-user"
         user_name = self.iam_helper.get_iam_user_name_from_arn(iam_principal_arn)
-        self.assertEqual(user_name, 'test-user')
+        self.assertEqual(user_name, "test-user")
 
     def test_get_iam_user_name_from_arn_invalid(self):
-        iam_principal_arn = 'arn:aws:iam::123456789012:role/test-role'
+        iam_principal_arn = "arn:aws:iam::123456789012:role/test-role"
         user_name = self.iam_helper.get_iam_user_name_from_arn(iam_principal_arn)
         self.assertIsNone(user_name)
 
-if __name__ == '__main__':
-    unittest.main()
\ No newline at end of file
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/rag/test_Model_Register.py b/tests/rag/test_Model_Register.py
index 57b82deb..f94011f5 100644
--- a/tests/rag/test_Model_Register.py
+++ b/tests/rag/test_Model_Register.py
@@ -6,8 +6,7 @@
 # GitHub history for details.
 
 import unittest
-from unittest.mock import patch, MagicMock, Mock
-import sys
+from unittest.mock import MagicMock, patch
 
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register import ModelRegister
 
@@ -16,40 +15,54 @@ class TestModelRegister(unittest.TestCase):
     def setUp(self):
         # Sample configuration dictionary
         self.config = {
-            'region': 'us-east-1',
-            'opensearch_username': 'admin',
-            'opensearch_password': 'admin',
-            'iam_principal': 'arn:aws:iam::123456789012:user/test-user',
-            'service_type': 'managed',
-            'embedding_dimension': '768',
-            'opensearch_endpoint': 'https://search-domain'
+            "region": "us-east-1",
+            "opensearch_username": "admin",
+            "opensearch_password": "admin",
+            "iam_principal": "arn:aws:iam::123456789012:user/test-user",
+            "service_type": "managed",
+            "embedding_dimension": "768",
+            "opensearch_endpoint": "https://search-domain",
         }
         # Mock OpenSearch client
         self.mock_opensearch_client = MagicMock()
         # OpenSearch domain name
-        self.opensearch_domain_name = 'test-domain'
+        self.opensearch_domain_name = "test-domain"
 
         # Correct the patch paths to match the actual module structure
-        self.patcher_iam_role_helper = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.IAMRoleHelper')
+        self.patcher_iam_role_helper = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.IAMRoleHelper"
+        )
         self.MockIAMRoleHelper = self.patcher_iam_role_helper.start()
 
-        self.patcher_ai_connector_helper = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.AIConnectorHelper')
+        self.patcher_ai_connector_helper = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.AIConnectorHelper"
+        )
         self.MockAIConnectorHelper = self.patcher_ai_connector_helper.start()
 
         # Patch model classes
-        self.patcher_bedrock_model = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.BedrockModel')
+        self.patcher_bedrock_model = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.BedrockModel"
+        )
         self.MockBedrockModel = self.patcher_bedrock_model.start()
 
-        self.patcher_openai_model = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.OpenAIModel')
+        self.patcher_openai_model = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.OpenAIModel"
+        )
         self.MockOpenAIModel = self.patcher_openai_model.start()
 
-        self.patcher_cohere_model = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.CohereModel')
+        self.patcher_cohere_model = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.CohereModel"
+        )
         self.MockCohereModel = self.patcher_cohere_model.start()
 
-        self.patcher_huggingface_model = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.HuggingFaceModel')
+        self.patcher_huggingface_model = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.HuggingFaceModel"
+        )
         self.MockHuggingFaceModel = self.patcher_huggingface_model.start()
 
-        self.patcher_custom_pytorch_model = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.CustomPyTorchModel')
+        self.patcher_custom_pytorch_model = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.CustomPyTorchModel"
+        )
         self.MockCustomPyTorchModel = self.patcher_custom_pytorch_model.start()
 
     def tearDown(self):
@@ -61,124 +74,195 @@ def tearDown(self):
         self.patcher_huggingface_model.stop()
         self.patcher_custom_pytorch_model.stop()
 
-    @patch('boto3.client')
+    @patch("boto3.client")
     def test_initialize_clients_success(self, mock_boto_client):
         mock_boto_client.return_value = MagicMock()
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
         result = model_register.initialize_clients()
         self.assertTrue(result)
-        mock_boto_client.assert_called_with('bedrock-runtime', region_name='us-east-1')
+        mock_boto_client.assert_called_with("bedrock-runtime", region_name="us-east-1")
 
-    @patch('boto3.client')
+    @patch("boto3.client")
     def test_initialize_clients_failure(self, mock_boto_client):
-        mock_boto_client.side_effect = Exception('Client creation failed')
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        mock_boto_client.side_effect = Exception("Client creation failed")
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
         result = model_register.initialize_clients()
         self.assertFalse(result)
-        mock_boto_client.assert_called_with('bedrock-runtime', region_name='us-east-1')
+        mock_boto_client.assert_called_with("bedrock-runtime", region_name="us-east-1")
 
-    @patch('builtins.input', side_effect=['1'])
+    @patch("builtins.input", side_effect=["1"])
     def test_prompt_model_registration_register_new_model(self, mock_input):
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
-        with patch.object(model_register, 'register_model_interactive') as mock_register_model_interactive:
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
+        with patch.object(
+            model_register, "register_model_interactive"
+        ) as mock_register_model_interactive:
             model_register.prompt_model_registration()
             mock_register_model_interactive.assert_called_once()
 
-    @patch('builtins.input', side_effect=['2', 'model-id-123'])
+    @patch("builtins.input", side_effect=["2", "model-id-123"])
     def test_prompt_model_registration_use_existing_model(self, mock_input):
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
-        with patch.object(model_register, 'save_config') as mock_save_config:
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
+        with patch.object(model_register, "save_config") as mock_save_config:
             model_register.prompt_model_registration()
-            self.assertEqual(model_register.config['embedding_model_id'], 'model-id-123')
+            self.assertEqual(
+                model_register.config["embedding_model_id"], "model-id-123"
+            )
             mock_save_config.assert_called_once_with(model_register.config)
 
-    @patch('builtins.input', side_effect=['invalid'])
+    @patch("builtins.input", side_effect=["invalid"])
     def test_prompt_model_registration_invalid_choice(self, mock_input):
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
         with self.assertRaises(SystemExit):
             model_register.prompt_model_registration()
 
-    @patch('builtins.input', side_effect=['1'])
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients', return_value=True)
-    def test_register_model_interactive_bedrock(self, mock_initialize_clients, mock_input):
-        self.MockIAMRoleHelper.return_value.get_iam_user_name_from_arn.return_value = 'test-user'
+    @patch("builtins.input", side_effect=["1"])
+    @patch(
+        "opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients",
+        return_value=True,
+    )
+    def test_register_model_interactive_bedrock(
+        self, mock_initialize_clients, mock_input
+    ):
+        self.MockIAMRoleHelper.return_value.get_iam_user_name_from_arn.return_value = (
+            "test-user"
+        )
 
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
         model_register.register_model_interactive()
 
         self.MockBedrockModel.return_value.register_bedrock_model.assert_called_once()
 
-    @patch('builtins.input', side_effect=['2'])
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients', return_value=True)
-    def test_register_model_interactive_openai_managed(self, mock_initialize_clients, mock_input):
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
-        model_register.service_type = 'managed'
+    @patch("builtins.input", side_effect=["2"])
+    @patch(
+        "opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients",
+        return_value=True,
+    )
+    def test_register_model_interactive_openai_managed(
+        self, mock_initialize_clients, mock_input
+    ):
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
+        model_register.service_type = "managed"
 
-        self.MockIAMRoleHelper.return_value.get_iam_user_name_from_arn.return_value = 'test-user'
+        self.MockIAMRoleHelper.return_value.get_iam_user_name_from_arn.return_value = (
+            "test-user"
+        )
 
         model_register.register_model_interactive()
 
         self.MockOpenAIModel.return_value.register_openai_model.assert_called_once()
 
-    @patch('builtins.input', side_effect=['2'])
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients', return_value=True)
-    def test_register_model_interactive_openai_opensource(self, mock_initialize_clients, mock_input):
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
-        model_register.service_type = 'open-source'
+    @patch("builtins.input", side_effect=["2"])
+    @patch(
+        "opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients",
+        return_value=True,
+    )
+    def test_register_model_interactive_openai_opensource(
+        self, mock_initialize_clients, mock_input
+    ):
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
+        model_register.service_type = "open-source"
 
-        self.MockIAMRoleHelper.return_value.get_iam_user_name_from_arn.return_value = 'test-user'
+        self.MockIAMRoleHelper.return_value.get_iam_user_name_from_arn.return_value = (
+            "test-user"
+        )
 
         model_register.register_model_interactive()
 
         self.MockOpenAIModel.return_value.register_openai_model_opensource.assert_called_once()
 
-    @patch('builtins.input', side_effect=['invalid'])
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients', return_value=True)
-    def test_register_model_interactive_invalid_choice(self, mock_initialize_clients, mock_input):
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
+    @patch("builtins.input", side_effect=["invalid"])
+    @patch(
+        "opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register.ModelRegister.initialize_clients",
+        return_value=True,
+    )
+    def test_register_model_interactive_invalid_choice(
+        self, mock_initialize_clients, mock_input
+    ):
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
 
-        with patch('builtins.print') as mock_print:
+        with patch("builtins.print") as mock_print:
             model_register.register_model_interactive()
-            mock_print.assert_called_with('\x1b[31mInvalid choice. Exiting model registration.\x1b[0m')
+            mock_print.assert_called_with(
+                "\x1b[31mInvalid choice. Exiting model registration.\x1b[0m"
+            )
 
-    @patch('builtins.input', side_effect=['1'])
+    @patch("builtins.input", side_effect=["1"])
     def test_prompt_opensource_model_registration_register_now(self, mock_input):
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
-        with patch.object(model_register, 'register_model_opensource_interactive') as mock_register:
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
+        with patch.object(
+            model_register, "register_model_opensource_interactive"
+        ) as mock_register:
             model_register.prompt_opensource_model_registration()
             mock_register.assert_called_once()
 
-    @patch('builtins.input', side_effect=['2'])
+    @patch("builtins.input", side_effect=["2"])
     def test_prompt_opensource_model_registration_register_later(self, mock_input):
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
-        with patch('builtins.print') as mock_print:
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
+        with patch("builtins.print") as mock_print:
             model_register.prompt_opensource_model_registration()
-            mock_print.assert_called_with('Skipping model registration. You can register models later using the appropriate commands.')
+            mock_print.assert_called_with(
+                "Skipping model registration. You can register models later using the appropriate commands."
+            )
 
-    @patch('builtins.input', side_effect=['invalid'])
+    @patch("builtins.input", side_effect=["invalid"])
     def test_prompt_opensource_model_registration_invalid_choice(self, mock_input):
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
-        with patch('builtins.print') as mock_print:
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
+        with patch("builtins.print") as mock_print:
             model_register.prompt_opensource_model_registration()
-            mock_print.assert_called_with('\x1b[31mInvalid choice. Skipping model registration.\x1b[0m')
+            mock_print.assert_called_with(
+                "\x1b[31mInvalid choice. Skipping model registration.\x1b[0m"
+            )
 
-    @patch('builtins.input', side_effect=['3'])
+    @patch("builtins.input", side_effect=["3"])
     def test_register_model_opensource_interactive_huggingface(self, mock_input):
-        model_register = ModelRegister(self.config, self.mock_opensearch_client, self.opensearch_domain_name)
-        model_register.service_type = 'open-source'
+        model_register = ModelRegister(
+            self.config, self.mock_opensearch_client, self.opensearch_domain_name
+        )
+        model_register.service_type = "open-source"
 
         model_register.register_model_opensource_interactive()
 
         self.MockHuggingFaceModel.return_value.register_huggingface_model.assert_called_once_with(
-            model_register.opensearch_client, model_register.config, model_register.save_config
+            model_register.opensearch_client,
+            model_register.config,
+            model_register.save_config,
         )
 
-    @patch('builtins.input', side_effect=['1'])
-    def test_register_model_opensource_interactive_no_opensearch_client(self, mock_input):
+    @patch("builtins.input", side_effect=["1"])
+    def test_register_model_opensource_interactive_no_opensearch_client(
+        self, mock_input
+    ):
         model_register = ModelRegister(self.config, None, self.opensearch_domain_name)
-        with patch('builtins.print') as mock_print:
+        with patch("builtins.print") as mock_print:
             model_register.register_model_opensource_interactive()
-            mock_print.assert_called_with('\x1b[31mOpenSearch client is not initialized. Please run setup again.\x1b[0m')
+            mock_print.assert_called_with(
+                "\x1b[31mOpenSearch client is not initialized. Please run setup again.\x1b[0m"
+            )
+
 
-if __name__ == '__main__':
-    unittest.main()
\ No newline at end of file
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/rag/test_SecretsHelper.py b/tests/rag/test_SecretsHelper.py
index e349b53b..9f2454e3 100644
--- a/tests/rag/test_SecretsHelper.py
+++ b/tests/rag/test_SecretsHelper.py
@@ -5,117 +5,138 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-import unittest
-from unittest.mock import patch, MagicMock
-from botocore.exceptions import ClientError
 import json
 import logging
+import unittest
+from unittest.mock import MagicMock, patch
+
+from botocore.exceptions import ClientError
+
 # Adjust the import path as necessary
 from opensearch_py_ml.ml_commons.SecretsHelper import SecretHelper
 
+
 class TestSecretHelper(unittest.TestCase):
     @classmethod
     def setUpClass(cls):
         # Suppress logging below ERROR level during tests
         logging.basicConfig(level=logging.ERROR)
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
     def test_create_secret_error_logging(self, mock_boto_client):
         mock_secretsmanager = MagicMock()
         mock_boto_client.return_value = mock_secretsmanager
 
         error_response = {
-            'Error': {
-                'Code': 'InternalServiceError',
-                'Message': 'An unspecified error occurred'
+            "Error": {
+                "Code": "InternalServiceError",
+                "Message": "An unspecified error occurred",
             }
         }
-        mock_secretsmanager.create_secret.side_effect = ClientError(error_response, 'CreateSecret')
+        mock_secretsmanager.create_secret.side_effect = ClientError(
+            error_response, "CreateSecret"
+        )
 
-        secret_helper = SecretHelper(region='us-east-1')
-        with self.assertLogs('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper', level='ERROR') as cm:
-            result = secret_helper.create_secret('new-secret', {'key': 'value'})
+        secret_helper = SecretHelper(region="us-east-1")
+        with self.assertLogs(
+            "opensearch_py_ml.ml_commons.SecretsHelper", level="ERROR"
+        ) as cm:
+            result = secret_helper.create_secret("new-secret", {"key": "value"})
             self.assertIsNone(result)
-        self.assertIn('Error creating secret', cm.output[0])
+        self.assertIn("Error creating secret", cm.output[0])
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
     def test_get_secret_arn_success(self, mock_boto_client):
         mock_secretsmanager = MagicMock()
         mock_boto_client.return_value = mock_secretsmanager
 
         mock_secretsmanager.describe_secret.return_value = {
-            'ARN': 'arn:aws:secretsmanager:us-east-1:123456789012:secret:my-secret'
+            "ARN": "arn:aws:secretsmanager:us-east-1:123456789012:secret:my-secret"
         }
 
-        secret_helper = SecretHelper(region='us-east-1')
-        result = secret_helper.get_secret_arn('my-secret')
-        self.assertEqual(result, 'arn:aws:secretsmanager:us-east-1:123456789012:secret:my-secret')
-        mock_secretsmanager.describe_secret.assert_called_with(SecretId='my-secret')
+        secret_helper = SecretHelper(region="us-east-1")
+        result = secret_helper.get_secret_arn("my-secret")
+        self.assertEqual(
+            result, "arn:aws:secretsmanager:us-east-1:123456789012:secret:my-secret"
+        )
+        mock_secretsmanager.describe_secret.assert_called_with(SecretId="my-secret")
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
     def test_get_secret_arn_not_found(self, mock_boto_client):
         mock_secretsmanager = MagicMock()
         mock_boto_client.return_value = mock_secretsmanager
 
         error_response = {
-            'Error': {
-                'Code': 'ResourceNotFoundException',
-                'Message': 'Secret not found'
+            "Error": {
+                "Code": "ResourceNotFoundException",
+                "Message": "Secret not found",
             }
         }
-        mock_secretsmanager.describe_secret.side_effect = ClientError(error_response, 'DescribeSecret')
+        mock_secretsmanager.describe_secret.side_effect = ClientError(
+            error_response, "DescribeSecret"
+        )
 
-        secret_helper = SecretHelper(region='us-east-1')
-        result = secret_helper.get_secret_arn('nonexistent-secret')
+        secret_helper = SecretHelper(region="us-east-1")
+        result = secret_helper.get_secret_arn("nonexistent-secret")
         self.assertIsNone(result)
-        mock_secretsmanager.describe_secret.assert_called_with(SecretId='nonexistent-secret')
+        mock_secretsmanager.describe_secret.assert_called_with(
+            SecretId="nonexistent-secret"
+        )
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
     def test_get_secret_success(self, mock_boto_client):
         mock_secretsmanager = MagicMock()
         mock_boto_client.return_value = mock_secretsmanager
 
-        mock_secretsmanager.get_secret_value.return_value = {'SecretString': 'my-secret-value'}
+        mock_secretsmanager.get_secret_value.return_value = {
+            "SecretString": "my-secret-value"
+        }
 
-        secret_helper = SecretHelper(region='us-east-1')
-        result = secret_helper.get_secret('my-secret')
-        self.assertEqual(result, 'my-secret-value')
-        mock_secretsmanager.get_secret_value.assert_called_with(SecretId='my-secret')
+        secret_helper = SecretHelper(region="us-east-1")
+        result = secret_helper.get_secret("my-secret")
+        self.assertEqual(result, "my-secret-value")
+        mock_secretsmanager.get_secret_value.assert_called_with(SecretId="my-secret")
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
     def test_get_secret_not_found(self, mock_boto_client):
         mock_secretsmanager = MagicMock()
         mock_boto_client.return_value = mock_secretsmanager
 
         error_response = {
-            'Error': {
-                'Code': 'ResourceNotFoundException',
-                'Message': 'Secret not found'
+            "Error": {
+                "Code": "ResourceNotFoundException",
+                "Message": "Secret not found",
             }
         }
-        mock_secretsmanager.get_secret_value.side_effect = ClientError(error_response, 'GetSecretValue')
+        mock_secretsmanager.get_secret_value.side_effect = ClientError(
+            error_response, "GetSecretValue"
+        )
 
-        secret_helper = SecretHelper(region='us-east-1')
-        result = secret_helper.get_secret('nonexistent-secret')
+        secret_helper = SecretHelper(region="us-east-1")
+        result = secret_helper.get_secret("nonexistent-secret")
         self.assertIsNone(result)
-        mock_secretsmanager.get_secret_value.assert_called_with(SecretId='nonexistent-secret')
+        mock_secretsmanager.get_secret_value.assert_called_with(
+            SecretId="nonexistent-secret"
+        )
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.SecretsHelper.boto3.client')
+    @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
     def test_create_secret_success(self, mock_boto_client):
         mock_secretsmanager = MagicMock()
         mock_boto_client.return_value = mock_secretsmanager
 
         mock_secretsmanager.create_secret.return_value = {
-            'ARN': 'arn:aws:secretsmanager:us-east-1:123456789012:secret:new-secret'
+            "ARN": "arn:aws:secretsmanager:us-east-1:123456789012:secret:new-secret"
         }
 
-        secret_helper = SecretHelper(region='us-east-1')
-        result = secret_helper.create_secret('new-secret', {'key': 'value'})
-        self.assertEqual(result, 'arn:aws:secretsmanager:us-east-1:123456789012:secret:new-secret')
+        secret_helper = SecretHelper(region="us-east-1")
+        result = secret_helper.create_secret("new-secret", {"key": "value"})
+        self.assertEqual(
+            result, "arn:aws:secretsmanager:us-east-1:123456789012:secret:new-secret"
+        )
         mock_secretsmanager.create_secret.assert_called_with(
-            Name='new-secret',
-            SecretString=json.dumps({'key': 'value'})
+            Name="new-secret", SecretString=json.dumps({"key": "value"})
         )
 
-if __name__ == '__main__':
+
+if __name__ == "__main__":
     unittest.main()
diff --git a/tests/rag/test_embedding_client.py b/tests/rag/test_embedding_client.py
new file mode 100644
index 00000000..fc1826a3
--- /dev/null
+++ b/tests/rag/test_embedding_client.py
@@ -0,0 +1,103 @@
+# SPDX-License-Identifier: Apache-2.0
+# The OpenSearch Contributors require contributions made to
+# this file be licensed under the Apache-2.0 license or a
+# compatible open source license.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
+
+import unittest
+from unittest.mock import MagicMock, patch
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.embedding_client import (
+    EmbeddingClient,
+)
+
+
+class TestEmbeddingClient(unittest.TestCase):
+
+    def setUp(self):
+        self.mock_opensearch_client = MagicMock()
+        self.embedding_model_id = "test_model_id"
+        self.client = EmbeddingClient(
+            self.mock_opensearch_client, self.embedding_model_id
+        )
+
+    def test_initialization(self):
+        self.assertEqual(self.client.opensearch_client, self.mock_opensearch_client)
+        self.assertEqual(self.client.embedding_model_id, self.embedding_model_id)
+
+    @patch("time.sleep")
+    def test_get_text_embedding_success(self, mock_sleep):
+        mock_response = {"inference_results": [{"output": [{"data": [0.1, 0.2, 0.3]}]}]}
+        self.mock_opensearch_client.transport.perform_request.return_value = (
+            mock_response
+        )
+
+        result = self.client.get_text_embedding("test text")
+        self.assertEqual(result, [0.1, 0.2, 0.3])
+
+        self.mock_opensearch_client.transport.perform_request.assert_called_once_with(
+            method="POST",
+            url=f"/_plugins/_ml/_predict/text_embedding/{self.embedding_model_id}",
+            body={"text_docs": ["test text"]},
+        )
+
+    @patch("time.sleep")
+    def test_get_text_embedding_no_results(self, mock_sleep):
+        mock_response = {"inference_results": []}
+        self.mock_opensearch_client.transport.perform_request.return_value = (
+            mock_response
+        )
+
+        result = self.client.get_text_embedding("test text")
+        self.assertIsNone(result)
+
+    @patch("time.sleep")
+    def test_get_text_embedding_unexpected_format(self, mock_sleep):
+        mock_response = {"inference_results": [{"output": "unexpected"}]}
+        self.mock_opensearch_client.transport.perform_request.return_value = (
+            mock_response
+        )
+
+        result = self.client.get_text_embedding("test text")
+        self.assertIsNone(result)
+
+    @patch("time.sleep")
+    def test_get_text_embedding_retry_success(self, mock_sleep):
+        self.mock_opensearch_client.transport.perform_request.side_effect = [
+            Exception("Test error"),
+            {"inference_results": [{"output": [{"data": [0.1, 0.2, 0.3]}]}]},
+        ]
+
+        result = self.client.get_text_embedding("test text")
+        self.assertEqual(result, [0.1, 0.2, 0.3])
+        self.assertEqual(
+            self.mock_opensearch_client.transport.perform_request.call_count, 2
+        )
+
+    @patch("time.sleep")
+    def test_get_text_embedding_max_retries_exceeded(self, mock_sleep):
+        self.mock_opensearch_client.transport.perform_request.side_effect = Exception(
+            "Test error"
+        )
+
+        with self.assertRaises(Exception):
+            self.client.get_text_embedding("test text", max_retries=3)
+
+        self.assertEqual(
+            self.mock_opensearch_client.transport.perform_request.call_count, 3
+        )
+
+    @patch("time.sleep")
+    def test_get_text_embedding_alternative_output_format(self, mock_sleep):
+        mock_response = {"inference_results": [{"output": {"data": [0.1, 0.2, 0.3]}}]}
+        self.mock_opensearch_client.transport.perform_request.return_value = (
+            mock_response
+        )
+
+        result = self.client.get_text_embedding("test text")
+        self.assertEqual(result, [0.1, 0.2, 0.3])
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/rag/test_ingest.py b/tests/rag/test_ingest.py
index d47f4b30..f0c9cf79 100644
--- a/tests/rag/test_ingest.py
+++ b/tests/rag/test_ingest.py
@@ -5,25 +5,27 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
+import json
 import unittest
-from unittest.mock import patch, MagicMock, mock_open
-import os
-import io
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest import Ingest
+from unittest.mock import MagicMock, mock_open, patch
+
 from opensearchpy import exceptions as opensearch_exceptions
-import json
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest import Ingest
+
 
 class TestIngest(unittest.TestCase):
     def setUp(self):
         self.config = {
-            'region': 'us-east-1',
-            'index_name': 'test-index',
-            'embedding_model_id': 'test-embedding-model-id',
-            'ingest_pipeline_name': 'test-ingest-pipeline'
+            "region": "us-east-1",
+            "index_name": "test-index",
+            "embedding_model_id": "test-embedding-model-id",
+            "ingest_pipeline_name": "test-ingest-pipeline",
         }
         self.ingest = Ingest(self.config)
+        self.ingest.embedding_client = MagicMock()
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.OpenSearchConnector')
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.OpenSearchConnector")
     def test_initialize_clients_success(self, mock_opensearch_connector):
         mock_instance = mock_opensearch_connector.return_value
         mock_instance.initialize_opensearch_client.return_value = True
@@ -34,7 +36,7 @@ def test_initialize_clients_success(self, mock_opensearch_connector):
         self.assertTrue(result)
         mock_instance.initialize_opensearch_client.assert_called_once()
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.OpenSearchConnector')
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.OpenSearchConnector")
     def test_initialize_clients_failure(self, mock_opensearch_connector):
         mock_instance = mock_opensearch_connector.return_value
         mock_instance.initialize_opensearch_client.return_value = False
@@ -45,162 +47,182 @@ def test_initialize_clients_failure(self, mock_opensearch_connector):
         self.assertFalse(result)
         mock_instance.initialize_opensearch_client.assert_called_once()
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isfile')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.walk')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isdir')
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isfile")
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.walk")
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isdir")
     def test_ingest_command_with_valid_files(self, mock_isdir, mock_walk, mock_isfile):
-        paths = ['/path/to/dir', '/path/to/file.txt']
-        mock_isfile.side_effect = lambda x: x == '/path/to/file.txt'
-        mock_isdir.side_effect = lambda x: x == '/path/to/dir'
-        mock_walk.return_value = [('/path/to/dir', [], ['file3.pdf'])]
-
-        with patch.object(self.ingest, 'process_and_ingest_data') as mock_process_and_ingest_data:
+        paths = ["/path/to/dir", "/path/to/file.txt"]
+        mock_isfile.side_effect = lambda x: x == "/path/to/file.txt"
+        mock_isdir.side_effect = lambda x: x == "/path/to/dir"
+        mock_walk.return_value = [("/path/to/dir", [], ["file3.pdf"])]
+
+        with patch.object(
+            self.ingest, "process_and_ingest_data"
+        ) as mock_process_and_ingest_data:
             self.ingest.ingest_command(paths)
             mock_process_and_ingest_data.assert_called_once()
             args, kwargs = mock_process_and_ingest_data.call_args
-            expected_files = ['/path/to/file.txt', '/path/to/dir/file3.pdf']
+            expected_files = ["/path/to/file.txt", "/path/to/dir/file3.pdf"]
             self.assertCountEqual(args[0], expected_files)
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isfile')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.walk')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isdir')
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isfile")
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.walk")
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.ingest.os.path.isdir")
     def test_ingest_command_no_valid_files(self, mock_isdir, mock_walk, mock_isfile):
-        paths = ['/invalid/path']
+        paths = ["/invalid/path"]
         mock_isfile.return_value = False
         mock_isdir.return_value = False
 
-        with patch('builtins.print') as mock_print:
+        with patch("builtins.print") as mock_print:
             self.ingest.ingest_command(paths)
-            mock_print.assert_any_call('\x1b[33mInvalid path: /invalid/path\x1b[0m')
-            mock_print.assert_any_call('\x1b[31mNo valid files found for ingestion.\x1b[0m')
-
-    @patch.object(Ingest, 'initialize_clients', return_value=True)
-    @patch.object(Ingest, 'create_ingest_pipeline')
-    @patch.object(Ingest, 'process_file')
-    @patch.object(Ingest, 'text_embedding', return_value=[0.1, 0.2, 0.3])
-    def test_process_and_ingest_data(self, mock_text_embedding, mock_process_file, mock_create_pipeline, mock_initialize_clients):
-        file_paths = ['/path/to/file1.txt']
-        documents = [{'text': 'Sample text'}]
+            mock_print.assert_any_call("\x1b[33mInvalid path: /invalid/path\x1b[0m")
+            mock_print.assert_any_call(
+                "\x1b[31mNo valid files found for ingestion.\x1b[0m"
+            )
+
+    @patch.object(Ingest, "initialize_clients", return_value=True)
+    @patch.object(Ingest, "create_ingest_pipeline")
+    @patch.object(Ingest, "process_file")
+    def test_process_and_ingest_data(
+        self, mock_process_file, mock_create_pipeline, mock_initialize_clients
+    ):
+        file_paths = ["/path/to/file1.txt"]
+        documents = [{"text": "Sample text"}]
         mock_process_file.return_value = documents
 
-        # Patch the 'bulk_index' method on the instance's 'opensearch' attribute
-        with patch.object(self.ingest.opensearch, 'bulk_index', return_value=(1, 0)) as mock_bulk_index:
+        mock_embedding_client = MagicMock()
+        mock_embedding_client.get_text_embedding.return_value = [0.1, 0.2, 0.3]
+        self.ingest.embedding_client = mock_embedding_client
+
+        with patch.object(
+            self.ingest.opensearch, "bulk_index", return_value=(1, 0)
+        ) as mock_bulk_index:
             self.ingest.process_and_ingest_data(file_paths)
 
             mock_initialize_clients.assert_called_once()
             mock_create_pipeline.assert_called_once_with(self.ingest.pipeline_name)
-            mock_process_file.assert_called_once_with('/path/to/file1.txt')
-            mock_text_embedding.assert_called_once_with('Sample text')
+            mock_process_file.assert_called_once_with("/path/to/file1.txt")
+            mock_embedding_client.get_text_embedding.assert_called_once_with(
+                "Sample text"
+            )
             mock_bulk_index.assert_called_once()
 
     def test_create_ingest_pipeline_exists(self):
-        pipeline_id = 'test-pipeline'
-        with patch.object(self.ingest.opensearch, 'opensearch_client') as mock_opensearch_client:
+        pipeline_id = "test-pipeline"
+        with patch.object(
+            self.ingest.opensearch, "opensearch_client"
+        ) as mock_opensearch_client:
             mock_opensearch_client.ingest.get_pipeline.return_value = {}
 
-            with patch('builtins.print') as mock_print:
+            with patch("builtins.print") as mock_print:
                 self.ingest.create_ingest_pipeline(pipeline_id)
-                mock_opensearch_client.ingest.get_pipeline.assert_called_once_with(id=pipeline_id)
-                mock_print.assert_any_call(f"\nIngest pipeline '{pipeline_id}' already exists.")
+                mock_opensearch_client.ingest.get_pipeline.assert_called_once_with(
+                    id=pipeline_id
+                )
+                mock_print.assert_any_call(
+                    f"\nIngest pipeline '{pipeline_id}' already exists."
+                )
 
     def test_create_ingest_pipeline_not_exists(self):
-        pipeline_id = 'test-pipeline'
-        pipeline_body = {
-            "description": "A text chunking ingest pipeline",
+        pipeline_id = "test-pipeline"
+        expected_pipeline_body = {
+            "description": "A text chunking and embedding ingest pipeline",
             "processors": [
                 {
                     "text_chunking": {
-                        "algorithm": {
-                            "fixed_token_length": {
-                                "token_limit": 384,
-                                "overlap_rate": 0.2,
-                                "tokenizer": "standard"
-                            }
-                        },
-                        "field_map": {
-                            "nominee_text": "passage_chunk"
-                        }
+                        "algorithm": {"delimiter": {"delimiter": "."}},
+                        "field_map": {"passage_text": "passage_chunk"},
                     }
-                }
-            ]
+                },
+                {
+                    "text_embedding": {
+                        "model_id": self.config["embedding_model_id"],
+                        "field_map": {"passage_chunk": "passage_embedding"},
+                    }
+                },
+            ],
         }
 
-        with patch.object(self.ingest.opensearch, 'opensearch_client') as mock_opensearch_client:
-            mock_opensearch_client.ingest.get_pipeline.side_effect = opensearch_exceptions.NotFoundError(
-                404, "Not Found", {"error": "Pipeline not found"}
+        with patch.object(
+            self.ingest.opensearch, "opensearch_client"
+        ) as mock_opensearch_client:
+            mock_opensearch_client.ingest.get_pipeline.side_effect = (
+                opensearch_exceptions.NotFoundError(
+                    404, "Not Found", {"error": "Pipeline not found"}
+                )
             )
 
-            with patch('builtins.print') as mock_print:
+            with patch("builtins.print") as mock_print:
                 self.ingest.create_ingest_pipeline(pipeline_id)
 
-                mock_opensearch_client.ingest.get_pipeline.assert_called_once_with(id=pipeline_id)
-                mock_opensearch_client.ingest.put_pipeline.assert_called_once_with(id=pipeline_id, body=pipeline_body)
-                mock_print.assert_any_call(f"\nIngest pipeline '{pipeline_id}' created successfully.")
-
-    @patch('builtins.open', new_callable=mock_open, read_data='col1,col2\nvalue1,value2\n')
+                mock_opensearch_client.ingest.get_pipeline.assert_called_once_with(
+                    id=pipeline_id
+                )
+                mock_opensearch_client.ingest.put_pipeline.assert_called_once_with(
+                    id=pipeline_id, body=expected_pipeline_body
+                )
+                mock_print.assert_any_call(
+                    f"\nIngest pipeline '{pipeline_id}' created successfully."
+                )
+
+    @patch(
+        "builtins.open", new_callable=mock_open, read_data="col1,col2\nvalue1,value2\n"
+    )
     def test_process_csv(self, mock_file):
-        file_path = '/path/to/file.csv'
-        with patch('csv.DictReader') as mock_csv_reader:
-            mock_csv_reader.return_value = [{'col1': 'value1', 'col2': 'value2'}]
+        file_path = "/path/to/file.csv"
+        with patch("csv.DictReader") as mock_csv_reader:
+            mock_csv_reader.return_value = [{"col1": "value1", "col2": "value2"}]
             result = self.ingest.process_csv(file_path)
-            mock_file.assert_called_once_with(file_path, 'r', newline='', encoding='utf-8')
-            self.assertEqual(result, [{'text': json.dumps({'col1': 'value1', 'col2': 'value2'})}])
+            mock_file.assert_called_once_with(
+                file_path, "r", newline="", encoding="utf-8"
+            )
+            self.assertEqual(
+                result, [{"text": json.dumps({"col1": "value1", "col2": "value2"})}]
+            )
 
-    @patch('builtins.open', new_callable=mock_open, read_data='Sample TXT data')
+    @patch("builtins.open", new_callable=mock_open, read_data="Sample TXT data")
     def test_process_txt(self, mock_file):
-        file_path = '/path/to/file.txt'
+        file_path = "/path/to/file.txt"
         result = self.ingest.process_txt(file_path)
-        mock_file.assert_called_once_with(file_path, 'r')
-        self.assertEqual(result, [{'text': 'Sample TXT data'}])
+        mock_file.assert_called_once_with(file_path, "r")
+        self.assertEqual(result, [{"text": "Sample TXT data"}])
 
-    @patch('PyPDF2.PdfReader')
-    @patch('builtins.open', new_callable=mock_open)
+    @patch("PyPDF2.PdfReader")
+    @patch("builtins.open", new_callable=mock_open)
     def test_process_pdf(self, mock_file, mock_pdf_reader):
-        file_path = '/path/to/file.pdf'
+        file_path = "/path/to/file.pdf"
         mock_pdf_reader_instance = mock_pdf_reader.return_value
         mock_page = MagicMock()
-        mock_page.extract_text.return_value = 'Sample PDF page text'
+        mock_page.extract_text.return_value = "Sample PDF page text"
         mock_pdf_reader_instance.pages = [mock_page]
 
         result = self.ingest.process_pdf(file_path)
 
-        mock_file.assert_called_once_with(file_path, 'rb')
+        mock_file.assert_called_once_with(file_path, "rb")
         mock_pdf_reader.assert_called_once_with(mock_file.return_value)
-        self.assertEqual(result, [{'text': 'Sample PDF page text'}])
+        self.assertEqual(result, [{"text": "Sample PDF page text"}])
 
-    @patch('time.sleep', return_value=None)
-    def test_text_embedding_failure(self, mock_sleep):
-        text = 'Sample text'
+    def test_text_embedding_failure(self):
+        text = "Sample text"
+        self.ingest.embedding_client.get_text_embedding.side_effect = Exception(
+            "Test exception"
+        )
 
-        with patch.object(self.ingest.opensearch, 'opensearch_client') as mock_opensearch_client:
-            mock_opensearch_client.transport.perform_request.side_effect = Exception('Test exception')
+        with self.assertRaises(Exception) as context:
+            self.ingest.embedding_client.get_text_embedding(text)
 
-            with patch('builtins.print') as mock_print:
-                with self.assertRaises(Exception) as context:
-                    self.ingest.text_embedding(text, max_retries=1)
-                self.assertTrue('Test exception' in str(context.exception))
-                mock_print.assert_any_call('Error on attempt 1: Test exception')
+        self.assertTrue("Test exception" in str(context.exception))
 
     def test_text_embedding_success(self):
-        text = 'Sample text'
+        text = "Sample text"
         embedding = [0.1, 0.2, 0.3]
-        response = {
-            'inference_results': [
-                {
-                    'output': [
-                        {'data': embedding}
-                    ]
-                }
-            ]
-        }
+        self.ingest.embedding_client.get_text_embedding.return_value = embedding
 
-        with patch.object(self.ingest.opensearch, 'opensearch_client') as mock_opensearch_client:
-            mock_opensearch_client.transport.perform_request.return_value = response
+        result = self.ingest.embedding_client.get_text_embedding(text)
 
-            result = self.ingest.text_embedding(text)
+        self.assertEqual(result, embedding)
+        self.ingest.embedding_client.get_text_embedding.assert_called_once_with(text)
 
-            self.assertEqual(result, embedding)
-            mock_opensearch_client.transport.perform_request.assert_called_once()
 
-if __name__ == '__main__':
-    unittest.main()
\ No newline at end of file
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/rag/test_ml_models/test_BedrockModel.py b/tests/rag/test_ml_models/test_BedrockModel.py
index 71dc8a21..73d7b97a 100644
--- a/tests/rag/test_ml_models/test_BedrockModel.py
+++ b/tests/rag/test_ml_models/test_BedrockModel.py
@@ -6,10 +6,12 @@
 # GitHub history for details.
 
 import unittest
-from unittest.mock import Mock, patch, call
-import json
-from io import StringIO
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.BedrockModel import BedrockModel
+from unittest.mock import Mock, patch
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.BedrockModel import (
+    BedrockModel,
+)
+
 
 class TestBedrockModel(unittest.TestCase):
 
@@ -24,77 +26,103 @@ def setUp(self):
             self.opensearch_domain_name,
             self.opensearch_username,
             self.opensearch_password,
-            self.mock_iam_role_helper
+            self.mock_iam_role_helper,
         )
 
     def test_init(self):
         self.assertEqual(self.bedrock_model.aws_region, self.aws_region)
-        self.assertEqual(self.bedrock_model.opensearch_domain_name, self.opensearch_domain_name)
-        self.assertEqual(self.bedrock_model.opensearch_username, self.opensearch_username)
-        self.assertEqual(self.bedrock_model.opensearch_password, self.opensearch_password)
+        self.assertEqual(
+            self.bedrock_model.opensearch_domain_name, self.opensearch_domain_name
+        )
+        self.assertEqual(
+            self.bedrock_model.opensearch_username, self.opensearch_username
+        )
+        self.assertEqual(
+            self.bedrock_model.opensearch_password, self.opensearch_password
+        )
         self.assertEqual(self.bedrock_model.iam_role_helper, self.mock_iam_role_helper)
 
-    @patch('builtins.input', side_effect=['', '1'])
+    @patch("builtins.input", side_effect=["", "1"])
     def test_register_bedrock_model_default(self, mock_input):
         mock_helper = Mock()
         mock_helper.create_connector_with_role.return_value = "test-connector-id"
         mock_helper.create_model.return_value = "test-model-id"
-        
+
         mock_config = {}
         mock_save_config = Mock()
 
-        self.bedrock_model.register_bedrock_model(mock_helper, mock_config, mock_save_config)
+        self.bedrock_model.register_bedrock_model(
+            mock_helper, mock_config, mock_save_config
+        )
 
         mock_helper.create_connector_with_role.assert_called_once()
         mock_helper.create_model.assert_called_once()
-        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+        mock_save_config.assert_called_once_with(
+            {"embedding_model_id": "test-model-id"}
+        )
 
-    @patch('builtins.input', side_effect=['custom-region', '2', '{"name": "Custom Model", "description": "Custom description"}'])
+    @patch(
+        "builtins.input",
+        side_effect=[
+            "custom-region",
+            "2",
+            '{"name": "Custom Model", "description": "Custom description"}',
+        ],
+    )
     def test_register_bedrock_model_custom(self, mock_input):
         mock_helper = Mock()
         mock_helper.create_connector_with_role.return_value = "test-connector-id"
         mock_helper.create_model.return_value = "test-model-id"
-        
+
         mock_config = {}
         mock_save_config = Mock()
 
-        self.bedrock_model.register_bedrock_model(mock_helper, mock_config, mock_save_config)
+        self.bedrock_model.register_bedrock_model(
+            mock_helper, mock_config, mock_save_config
+        )
 
         mock_helper.create_connector_with_role.assert_called_once()
-        mock_helper.create_model.assert_called_once_with("Custom Model", "Custom description", "test-connector-id", "my_test_create_bedrock_connector_role")
-        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+        mock_helper.create_model.assert_called_once_with(
+            "Custom Model",
+            "Custom description",
+            "test-connector-id",
+            "my_test_create_bedrock_connector_role",
+        )
+        mock_save_config.assert_called_once_with(
+            {"embedding_model_id": "test-model-id"}
+        )
 
     def test_save_model_id(self):
         mock_config = {}
         mock_save_config = Mock()
         self.bedrock_model.save_model_id(mock_config, mock_save_config, "test-model-id")
-        self.assertEqual(mock_config, {'embedding_model_id': 'test-model-id'})
+        self.assertEqual(mock_config, {"embedding_model_id": "test-model-id"})
         mock_save_config.assert_called_once_with(mock_config)
 
-    @patch('builtins.input', return_value='1')
+    @patch("builtins.input", return_value="1")
     def test_get_custom_model_details_default(self, mock_input):
         default_input = {"name": "Default Model"}
         result = self.bedrock_model.get_custom_model_details(default_input)
         self.assertEqual(result, default_input)
 
-    @patch('builtins.input', side_effect=['2', '{"name": "Custom Model"}'])
+    @patch("builtins.input", side_effect=["2", '{"name": "Custom Model"}'])
     def test_get_custom_model_details_custom(self, mock_input):
         default_input = {"name": "Default Model"}
         result = self.bedrock_model.get_custom_model_details(default_input)
         self.assertEqual(result, {"name": "Custom Model"})
 
-
-    @patch('builtins.input', return_value='2\n{invalid json}')
+    @patch("builtins.input", return_value="2\n{invalid json}")
     def test_get_custom_model_details_invalid_json(self, mock_input):
         default_input = {"name": "Default Model"}
         result = self.bedrock_model.get_custom_model_details(default_input)
         self.assertIsNone(result)
 
-    @patch('builtins.input', return_value='3')
+    @patch("builtins.input", return_value="3")
     def test_get_custom_model_details_invalid_choice(self, mock_input):
         default_input = {"name": "Default Model"}
         result = self.bedrock_model.get_custom_model_details(default_input)
         self.assertIsNone(result)
 
-if __name__ == '__main__':
+
+if __name__ == "__main__":
     unittest.main()
diff --git a/tests/rag/test_ml_models/test_CohereModel.py b/tests/rag/test_ml_models/test_CohereModel.py
index 4e499090..9cf0803a 100644
--- a/tests/rag/test_ml_models/test_CohereModel.py
+++ b/tests/rag/test_ml_models/test_CohereModel.py
@@ -6,10 +6,12 @@
 # GitHub history for details.
 
 import unittest
-from unittest.mock import Mock, patch, call
-import json
-from io import StringIO
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.CohereModel import CohereModel
+from unittest.mock import Mock, patch
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.CohereModel import (
+    CohereModel,
+)
+
 
 class TestCohereModel(unittest.TestCase):
 
@@ -24,118 +26,141 @@ def setUp(self):
             self.opensearch_domain_name,
             self.opensearch_username,
             self.opensearch_password,
-            self.mock_iam_role_helper
+            self.mock_iam_role_helper,
         )
 
     def test_init(self):
         self.assertEqual(self.cohere_model.aws_region, self.aws_region)
-        self.assertEqual(self.cohere_model.opensearch_domain_name, self.opensearch_domain_name)
-        self.assertEqual(self.cohere_model.opensearch_username, self.opensearch_username)
-        self.assertEqual(self.cohere_model.opensearch_password, self.opensearch_password)
+        self.assertEqual(
+            self.cohere_model.opensearch_domain_name, self.opensearch_domain_name
+        )
+        self.assertEqual(
+            self.cohere_model.opensearch_username, self.opensearch_username
+        )
+        self.assertEqual(
+            self.cohere_model.opensearch_password, self.opensearch_password
+        )
         self.assertEqual(self.cohere_model.iam_role_helper, self.mock_iam_role_helper)
 
-    @patch('builtins.input', side_effect=['test-secret', 'test-api-key', '1'])
+    @patch("builtins.input", side_effect=["test-secret", "test-api-key", "1"])
     def test_register_cohere_model(self, mock_input):
         mock_helper = Mock()
         mock_helper.create_connector_with_secret.return_value = "test-connector-id"
         mock_helper.create_model.return_value = "test-model-id"
-        
+
         mock_config = {}
         mock_save_config = Mock()
 
-        self.cohere_model.register_cohere_model(mock_helper, mock_config, mock_save_config)
+        self.cohere_model.register_cohere_model(
+            mock_helper, mock_config, mock_save_config
+        )
 
         mock_helper.create_connector_with_secret.assert_called_once()
         mock_helper.create_model.assert_called_once()
-        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+        mock_save_config.assert_called_once_with(
+            {"embedding_model_id": "test-model-id"}
+        )
 
-    @patch('builtins.input', side_effect=['test-api-key', '1'])
-    @patch('time.time', return_value=1000000)
+    @patch("builtins.input", side_effect=["test-api-key", "1"])
+    @patch("time.time", return_value=1000000)
     def test_register_cohere_model_opensource(self, mock_time, mock_input):
         mock_opensearch_client = Mock()
         mock_opensearch_client.transport.perform_request.side_effect = [
-            {'connector_id': 'test-connector-id'},
-            {'model_group_id': 'test-model-group-id'},
-            {'task_id': 'test-task-id'},
-            {'state': 'COMPLETED', 'model_id': 'test-model-id'},
-            {}  # for model deployment
+            {"connector_id": "test-connector-id"},
+            {"model_group_id": "test-model-group-id"},
+            {"task_id": "test-task-id"},
+            {"state": "COMPLETED", "model_id": "test-model-id"},
+            {},  # for model deployment
         ]
-        
+
         mock_config = {}
         mock_save_config = Mock()
 
-        self.cohere_model.register_cohere_model_opensource(mock_opensearch_client, mock_config, mock_save_config)
+        self.cohere_model.register_cohere_model_opensource(
+            mock_opensearch_client, mock_config, mock_save_config
+        )
 
         self.assertEqual(mock_opensearch_client.transport.perform_request.call_count, 5)
-        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+        mock_save_config.assert_called_once_with(
+            {"embedding_model_id": "test-model-id"}
+        )
 
     def test_get_custom_model_details_default(self):
-        with patch('builtins.input', return_value='1'):
+        with patch("builtins.input", return_value="1"):
             default_input = {"name": "Default Model"}
             result = self.cohere_model.get_custom_model_details(default_input)
             self.assertEqual(result, default_input)
 
     def test_get_custom_model_details_custom(self):
-        with patch('builtins.input', side_effect=['2', '{"name": "Custom Model"}']):
+        with patch("builtins.input", side_effect=["2", '{"name": "Custom Model"}']):
             default_input = {"name": "Default Model"}
             result = self.cohere_model.get_custom_model_details(default_input)
             self.assertEqual(result, {"name": "Custom Model"})
 
     def test_get_custom_model_details_invalid_json(self):
-        with patch('builtins.input', side_effect=['2', 'invalid json']):
+        with patch("builtins.input", side_effect=["2", "invalid json"]):
             default_input = {"name": "Default Model"}
             result = self.cohere_model.get_custom_model_details(default_input)
             self.assertIsNone(result)
 
     def test_get_custom_model_details_invalid_choice(self):
-        with patch('builtins.input', return_value='3'):
+        with patch("builtins.input", return_value="3"):
             default_input = {"name": "Default Model"}
             result = self.cohere_model.get_custom_model_details(default_input)
             self.assertIsNone(result)
 
     def test_get_custom_json_input_valid(self):
-        with patch('builtins.input', return_value='{"key": "value"}'):
+        with patch("builtins.input", return_value='{"key": "value"}'):
             result = self.cohere_model.get_custom_json_input()
             self.assertEqual(result, {"key": "value"})
 
     def test_get_custom_json_input_invalid(self):
-        with patch('builtins.input', return_value='invalid json'):
+        with patch("builtins.input", return_value="invalid json"):
             result = self.cohere_model.get_custom_json_input()
             self.assertIsNone(result)
 
-    @patch('time.time', side_effect=[0, 10, 20, 30])
-    @patch('time.sleep', return_value=None)
+    @patch("time.time", side_effect=[0, 10, 20, 30])
+    @patch("time.sleep", return_value=None)
     def test_wait_for_model_registration_success(self, mock_sleep, mock_time):
         mock_opensearch_client = Mock()
         mock_opensearch_client.transport.perform_request.side_effect = [
-            {'state': 'RUNNING'},
-            {'state': 'RUNNING'},
-            {'state': 'COMPLETED', 'model_id': 'test-model-id'}
+            {"state": "RUNNING"},
+            {"state": "RUNNING"},
+            {"state": "COMPLETED", "model_id": "test-model-id"},
         ]
-        
-        result = self.cohere_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
-        self.assertEqual(result, 'test-model-id')
 
-    @patch('time.time', side_effect=[0, 10, 20, 30])
-    @patch('time.sleep', return_value=None)
+        result = self.cohere_model.wait_for_model_registration(
+            mock_opensearch_client, "test-task-id"
+        )
+        self.assertEqual(result, "test-model-id")
+
+    @patch("time.time", side_effect=[0, 10, 20, 30])
+    @patch("time.sleep", return_value=None)
     def test_wait_for_model_registration_failure(self, mock_sleep, mock_time):
         mock_opensearch_client = Mock()
         mock_opensearch_client.transport.perform_request.side_effect = [
-            {'state': 'RUNNING'},
-            {'state': 'FAILED'}
+            {"state": "RUNNING"},
+            {"state": "FAILED"},
         ]
-        
-        result = self.cohere_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
+
+        result = self.cohere_model.wait_for_model_registration(
+            mock_opensearch_client, "test-task-id"
+        )
         self.assertIsNone(result)
 
-    @patch('time.time', side_effect=[0, 1000])
-    @patch('time.sleep', return_value=None)
+    @patch("time.time", side_effect=[0, 1000])
+    @patch("time.sleep", return_value=None)
     def test_wait_for_model_registration_timeout(self, mock_sleep, mock_time):
         mock_opensearch_client = Mock()
-        mock_opensearch_client.transport.perform_request.return_value = {'state': 'RUNNING'}
-        
-        result = self.cohere_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id', timeout=5)
+        mock_opensearch_client.transport.perform_request.return_value = {
+            "state": "RUNNING"
+        }
+
+        result = self.cohere_model.wait_for_model_registration(
+            mock_opensearch_client, "test-task-id", timeout=5
+        )
         self.assertIsNone(result)
 
-if __name__ == '__main__':
+
+if __name__ == "__main__":
     unittest.main()
diff --git a/tests/rag/test_ml_models/test_OpenAIModel.py b/tests/rag/test_ml_models/test_OpenAIModel.py
index 0d225e3c..a9b55f33 100644
--- a/tests/rag/test_ml_models/test_OpenAIModel.py
+++ b/tests/rag/test_ml_models/test_OpenAIModel.py
@@ -6,10 +6,12 @@
 # GitHub history for details.
 
 import unittest
-from unittest.mock import Mock, patch, call
-import json
-from io import StringIO
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.OpenAIModel import OpenAIModel
+from unittest.mock import Mock, patch
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.OpenAIModel import (
+    OpenAIModel,
+)
+
 
 class TestOpenAIModel(unittest.TestCase):
 
@@ -24,118 +26,141 @@ def setUp(self):
             self.opensearch_domain_name,
             self.opensearch_username,
             self.opensearch_password,
-            self.mock_iam_role_helper
+            self.mock_iam_role_helper,
         )
 
     def test_init(self):
         self.assertEqual(self.openai_model.aws_region, self.aws_region)
-        self.assertEqual(self.openai_model.opensearch_domain_name, self.opensearch_domain_name)
-        self.assertEqual(self.openai_model.opensearch_username, self.opensearch_username)
-        self.assertEqual(self.openai_model.opensearch_password, self.opensearch_password)
+        self.assertEqual(
+            self.openai_model.opensearch_domain_name, self.opensearch_domain_name
+        )
+        self.assertEqual(
+            self.openai_model.opensearch_username, self.opensearch_username
+        )
+        self.assertEqual(
+            self.openai_model.opensearch_password, self.opensearch_password
+        )
         self.assertEqual(self.openai_model.iam_role_helper, self.mock_iam_role_helper)
 
-    @patch('builtins.input', side_effect=['test-secret', 'test-api-key', '1'])
+    @patch("builtins.input", side_effect=["test-secret", "test-api-key", "1"])
     def test_register_openai_model(self, mock_input):
         mock_helper = Mock()
         mock_helper.create_connector_with_secret.return_value = "test-connector-id"
         mock_helper.create_model.return_value = "test-model-id"
-        
+
         mock_config = {}
         mock_save_config = Mock()
 
-        self.openai_model.register_openai_model(mock_helper, mock_config, mock_save_config)
+        self.openai_model.register_openai_model(
+            mock_helper, mock_config, mock_save_config
+        )
 
         mock_helper.create_connector_with_secret.assert_called_once()
         mock_helper.create_model.assert_called_once()
-        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+        mock_save_config.assert_called_once_with(
+            {"embedding_model_id": "test-model-id"}
+        )
 
-    @patch('builtins.input', side_effect=['test-api-key', '1'])
-    @patch('time.time', return_value=1000000)
+    @patch("builtins.input", side_effect=["test-api-key", "1"])
+    @patch("time.time", return_value=1000000)
     def test_register_openai_model_opensource(self, mock_time, mock_input):
         mock_opensearch_client = Mock()
         mock_opensearch_client.transport.perform_request.side_effect = [
-            {'connector_id': 'test-connector-id'},
-            {'model_group_id': 'test-model-group-id'},
-            {'task_id': 'test-task-id'},
-            {'state': 'COMPLETED', 'model_id': 'test-model-id'},
-            {}  # for model deployment
+            {"connector_id": "test-connector-id"},
+            {"model_group_id": "test-model-group-id"},
+            {"task_id": "test-task-id"},
+            {"state": "COMPLETED", "model_id": "test-model-id"},
+            {},  # for model deployment
         ]
-        
+
         mock_config = {}
         mock_save_config = Mock()
 
-        self.openai_model.register_openai_model_opensource(mock_opensearch_client, mock_config, mock_save_config)
+        self.openai_model.register_openai_model_opensource(
+            mock_opensearch_client, mock_config, mock_save_config
+        )
 
         self.assertEqual(mock_opensearch_client.transport.perform_request.call_count, 5)
-        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+        mock_save_config.assert_called_once_with(
+            {"embedding_model_id": "test-model-id"}
+        )
 
     def test_get_custom_model_details_default(self):
-        with patch('builtins.input', return_value='1'):
+        with patch("builtins.input", return_value="1"):
             default_input = {"name": "Default Model"}
             result = self.openai_model.get_custom_model_details(default_input)
             self.assertEqual(result, default_input)
 
     def test_get_custom_model_details_custom(self):
-        with patch('builtins.input', side_effect=['2', '{"name": "Custom Model"}']):
+        with patch("builtins.input", side_effect=["2", '{"name": "Custom Model"}']):
             default_input = {"name": "Default Model"}
             result = self.openai_model.get_custom_model_details(default_input)
             self.assertEqual(result, {"name": "Custom Model"})
 
     def test_get_custom_model_details_invalid_json(self):
-        with patch('builtins.input', side_effect=['2', 'invalid json']):
+        with patch("builtins.input", side_effect=["2", "invalid json"]):
             default_input = {"name": "Default Model"}
             result = self.openai_model.get_custom_model_details(default_input)
             self.assertIsNone(result)
 
     def test_get_custom_model_details_invalid_choice(self):
-        with patch('builtins.input', return_value='3'):
+        with patch("builtins.input", return_value="3"):
             default_input = {"name": "Default Model"}
             result = self.openai_model.get_custom_model_details(default_input)
             self.assertIsNone(result)
 
     def test_get_custom_json_input_valid(self):
-        with patch('builtins.input', return_value='{"key": "value"}'):
+        with patch("builtins.input", return_value='{"key": "value"}'):
             result = self.openai_model.get_custom_json_input()
             self.assertEqual(result, {"key": "value"})
 
     def test_get_custom_json_input_invalid(self):
-        with patch('builtins.input', return_value='invalid json'):
+        with patch("builtins.input", return_value="invalid json"):
             result = self.openai_model.get_custom_json_input()
             self.assertIsNone(result)
 
-    @patch('time.time', side_effect=[0, 10, 20, 30])
-    @patch('time.sleep', return_value=None)
+    @patch("time.time", side_effect=[0, 10, 20, 30])
+    @patch("time.sleep", return_value=None)
     def test_wait_for_model_registration_success(self, mock_sleep, mock_time):
         mock_opensearch_client = Mock()
         mock_opensearch_client.transport.perform_request.side_effect = [
-            {'state': 'RUNNING'},
-            {'state': 'RUNNING'},
-            {'state': 'COMPLETED', 'model_id': 'test-model-id'}
+            {"state": "RUNNING"},
+            {"state": "RUNNING"},
+            {"state": "COMPLETED", "model_id": "test-model-id"},
         ]
-        
-        result = self.openai_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
-        self.assertEqual(result, 'test-model-id')
 
-    @patch('time.time', side_effect=[0, 10, 20, 30])
-    @patch('time.sleep', return_value=None)
+        result = self.openai_model.wait_for_model_registration(
+            mock_opensearch_client, "test-task-id"
+        )
+        self.assertEqual(result, "test-model-id")
+
+    @patch("time.time", side_effect=[0, 10, 20, 30])
+    @patch("time.sleep", return_value=None)
     def test_wait_for_model_registration_failure(self, mock_sleep, mock_time):
         mock_opensearch_client = Mock()
         mock_opensearch_client.transport.perform_request.side_effect = [
-            {'state': 'RUNNING'},
-            {'state': 'FAILED'}
+            {"state": "RUNNING"},
+            {"state": "FAILED"},
         ]
-        
-        result = self.openai_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
+
+        result = self.openai_model.wait_for_model_registration(
+            mock_opensearch_client, "test-task-id"
+        )
         self.assertIsNone(result)
 
-    @patch('time.time', side_effect=[0, 1000])
-    @patch('time.sleep', return_value=None)
+    @patch("time.time", side_effect=[0, 1000])
+    @patch("time.sleep", return_value=None)
     def test_wait_for_model_registration_timeout(self, mock_sleep, mock_time):
         mock_opensearch_client = Mock()
-        mock_opensearch_client.transport.perform_request.return_value = {'state': 'RUNNING'}
-        
-        result = self.openai_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id', timeout=5)
+        mock_opensearch_client.transport.perform_request.return_value = {
+            "state": "RUNNING"
+        }
+
+        result = self.openai_model.wait_for_model_registration(
+            mock_opensearch_client, "test-task-id", timeout=5
+        )
         self.assertIsNone(result)
 
-if __name__ == '__main__':
+
+if __name__ == "__main__":
     unittest.main()
diff --git a/tests/rag/test_ml_models/test_PyTorchModel.py b/tests/rag/test_ml_models/test_PyTorchModel.py
index 301f6259..8c025fa0 100644
--- a/tests/rag/test_ml_models/test_PyTorchModel.py
+++ b/tests/rag/test_ml_models/test_PyTorchModel.py
@@ -6,10 +6,12 @@
 # GitHub history for details.
 
 import unittest
-from unittest.mock import Mock, patch, call, mock_open
-import json
-from io import StringIO
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.PyTorchModel import CustomPyTorchModel
+from unittest.mock import Mock, mock_open, patch
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.PyTorchModel import (
+    CustomPyTorchModel,
+)
+
 
 class TestCustomPyTorchModel(unittest.TestCase):
 
@@ -24,122 +26,165 @@ def setUp(self):
             self.opensearch_domain_name,
             self.opensearch_username,
             self.opensearch_password,
-            self.mock_iam_role_helper
+            self.mock_iam_role_helper,
         )
 
     def test_init(self):
         self.assertEqual(self.custom_pytorch_model.aws_region, self.aws_region)
-        self.assertEqual(self.custom_pytorch_model.opensearch_domain_name, self.opensearch_domain_name)
-        self.assertEqual(self.custom_pytorch_model.opensearch_username, self.opensearch_username)
-        self.assertEqual(self.custom_pytorch_model.opensearch_password, self.opensearch_password)
-        self.assertEqual(self.custom_pytorch_model.iam_role_helper, self.mock_iam_role_helper)
-
-    @patch('builtins.input', side_effect=['1', '/path/to/model.pt'])
-    @patch('os.path.isfile', return_value=True)
-    @patch('builtins.open', new_callable=mock_open, read_data=b'model_content')
-    def test_register_custom_pytorch_model_default(self, mock_file, mock_isfile, mock_input):
+        self.assertEqual(
+            self.custom_pytorch_model.opensearch_domain_name,
+            self.opensearch_domain_name,
+        )
+        self.assertEqual(
+            self.custom_pytorch_model.opensearch_username, self.opensearch_username
+        )
+        self.assertEqual(
+            self.custom_pytorch_model.opensearch_password, self.opensearch_password
+        )
+        self.assertEqual(
+            self.custom_pytorch_model.iam_role_helper, self.mock_iam_role_helper
+        )
+
+    @patch("builtins.input", side_effect=["1", "/path/to/model.pt"])
+    @patch("os.path.isfile", return_value=True)
+    @patch("builtins.open", new_callable=mock_open, read_data=b"model_content")
+    def test_register_custom_pytorch_model_default(
+        self, mock_file, mock_isfile, mock_input
+    ):
         mock_opensearch_client = Mock()
         mock_opensearch_client.transport.perform_request.side_effect = [
-            {'model_id': 'uploaded_model_id'},
-            {'task_id': 'test-task-id'},
-            {'state': 'COMPLETED', 'model_id': 'registered_model_id'},
-            {}  # for model deployment
+            {"model_id": "uploaded_model_id"},
+            {"task_id": "test-task-id"},
+            {"state": "COMPLETED", "model_id": "registered_model_id"},
+            {},  # for model deployment
         ]
-        
-        mock_config = {'embedding_dimension': 768}
+
+        mock_config = {"embedding_dimension": 768}
         mock_save_config = Mock()
 
-        self.custom_pytorch_model.register_custom_pytorch_model(mock_opensearch_client, mock_config, mock_save_config)
+        self.custom_pytorch_model.register_custom_pytorch_model(
+            mock_opensearch_client, mock_config, mock_save_config
+        )
 
         self.assertEqual(mock_opensearch_client.transport.perform_request.call_count, 4)
-        mock_save_config.assert_called_once_with({'embedding_dimension': 768, 'embedding_model_id': 'registered_model_id'})
+        mock_save_config.assert_called_once_with(
+            {"embedding_dimension": 768, "embedding_model_id": "registered_model_id"}
+        )
 
-    @patch('builtins.input', side_effect=['2', '/path/to/model.pt', '{"name": "custom_model", "model_format": "TORCH_SCRIPT", "model_config": {"embedding_dimension": 512, "framework_type": "CUSTOM", "model_type": "bert"}, "description": "Custom model"}'])
-    @patch('os.path.isfile', return_value=True)
-    @patch('builtins.open', new_callable=mock_open, read_data=b'model_content')
-    def test_register_custom_pytorch_model_custom(self, mock_file, mock_isfile, mock_input):
+    @patch(
+        "builtins.input",
+        side_effect=[
+            "2",
+            "/path/to/model.pt",
+            '{"name": "custom_model", "model_format": "TORCH_SCRIPT", "model_config": {"embedding_dimension": 512, "framework_type": "CUSTOM", "model_type": "bert"}, "description": "Custom model"}',
+        ],
+    )
+    @patch("os.path.isfile", return_value=True)
+    @patch("builtins.open", new_callable=mock_open, read_data=b"model_content")
+    def test_register_custom_pytorch_model_custom(
+        self, mock_file, mock_isfile, mock_input
+    ):
         mock_opensearch_client = Mock()
         mock_opensearch_client.transport.perform_request.side_effect = [
-            {'model_id': 'uploaded_model_id'},
-            {'task_id': 'test-task-id'},
-            {'state': 'COMPLETED', 'model_id': 'registered_model_id'},
-            {}  # for model deployment
+            {"model_id": "uploaded_model_id"},
+            {"task_id": "test-task-id"},
+            {"state": "COMPLETED", "model_id": "registered_model_id"},
+            {},  # for model deployment
         ]
-        
+
         mock_config = {}
         mock_save_config = Mock()
 
-        self.custom_pytorch_model.register_custom_pytorch_model(mock_opensearch_client, mock_config, mock_save_config)
+        self.custom_pytorch_model.register_custom_pytorch_model(
+            mock_opensearch_client, mock_config, mock_save_config
+        )
 
         self.assertEqual(mock_opensearch_client.transport.perform_request.call_count, 4)
-        mock_save_config.assert_called_once_with({'embedding_model_id': 'registered_model_id'})
+        mock_save_config.assert_called_once_with(
+            {"embedding_model_id": "registered_model_id"}
+        )
 
-    @patch('builtins.input', side_effect=['1', '/nonexistent/path.pt'])
-    @patch('os.path.isfile', return_value=False)
-    def test_register_custom_pytorch_model_file_not_found(self, mock_isfile, mock_input):
+    @patch("builtins.input", side_effect=["1", "/nonexistent/path.pt"])
+    @patch("os.path.isfile", return_value=False)
+    def test_register_custom_pytorch_model_file_not_found(
+        self, mock_isfile, mock_input
+    ):
         mock_opensearch_client = Mock()
         mock_config = {}
         mock_save_config = Mock()
 
-        self.custom_pytorch_model.register_custom_pytorch_model(mock_opensearch_client, mock_config, mock_save_config)
+        self.custom_pytorch_model.register_custom_pytorch_model(
+            mock_opensearch_client, mock_config, mock_save_config
+        )
 
         mock_opensearch_client.transport.perform_request.assert_not_called()
         mock_save_config.assert_not_called()
 
-    @patch('builtins.input', return_value='3')
+    @patch("builtins.input", return_value="3")
     def test_register_custom_pytorch_model_invalid_choice(self, mock_input):
         mock_opensearch_client = Mock()
         mock_config = {}
         mock_save_config = Mock()
 
-        self.custom_pytorch_model.register_custom_pytorch_model(mock_opensearch_client, mock_config, mock_save_config)
+        self.custom_pytorch_model.register_custom_pytorch_model(
+            mock_opensearch_client, mock_config, mock_save_config
+        )
 
         mock_opensearch_client.transport.perform_request.assert_not_called()
         mock_save_config.assert_not_called()
 
     def test_get_custom_json_input_valid(self):
-        with patch('builtins.input', return_value='{"key": "value"}'):
+        with patch("builtins.input", return_value='{"key": "value"}'):
             result = self.custom_pytorch_model.get_custom_json_input()
             self.assertEqual(result, {"key": "value"})
 
     def test_get_custom_json_input_invalid(self):
-        with patch('builtins.input', return_value='invalid json'):
+        with patch("builtins.input", return_value="invalid json"):
             result = self.custom_pytorch_model.get_custom_json_input()
             self.assertIsNone(result)
 
-    @patch('time.time', side_effect=[0, 10, 20, 30])
-    @patch('time.sleep', return_value=None)
+    @patch("time.time", side_effect=[0, 10, 20, 30])
+    @patch("time.sleep", return_value=None)
     def test_wait_for_model_registration_success(self, mock_sleep, mock_time):
         mock_opensearch_client = Mock()
         mock_opensearch_client.transport.perform_request.side_effect = [
-            {'state': 'RUNNING'},
-            {'state': 'RUNNING'},
-            {'state': 'COMPLETED', 'model_id': 'test-model-id'}
+            {"state": "RUNNING"},
+            {"state": "RUNNING"},
+            {"state": "COMPLETED", "model_id": "test-model-id"},
         ]
-        
-        result = self.custom_pytorch_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
-        self.assertEqual(result, 'test-model-id')
 
-    @patch('time.time', side_effect=[0, 10, 20, 30])
-    @patch('time.sleep', return_value=None)
+        result = self.custom_pytorch_model.wait_for_model_registration(
+            mock_opensearch_client, "test-task-id"
+        )
+        self.assertEqual(result, "test-model-id")
+
+    @patch("time.time", side_effect=[0, 10, 20, 30])
+    @patch("time.sleep", return_value=None)
     def test_wait_for_model_registration_failure(self, mock_sleep, mock_time):
         mock_opensearch_client = Mock()
         mock_opensearch_client.transport.perform_request.side_effect = [
-            {'state': 'RUNNING'},
-            {'state': 'FAILED'}
+            {"state": "RUNNING"},
+            {"state": "FAILED"},
         ]
-        
-        result = self.custom_pytorch_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id')
+
+        result = self.custom_pytorch_model.wait_for_model_registration(
+            mock_opensearch_client, "test-task-id"
+        )
         self.assertIsNone(result)
 
-    @patch('time.time', side_effect=[0, 1000])
-    @patch('time.sleep', return_value=None)
+    @patch("time.time", side_effect=[0, 1000])
+    @patch("time.sleep", return_value=None)
     def test_wait_for_model_registration_timeout(self, mock_sleep, mock_time):
         mock_opensearch_client = Mock()
-        mock_opensearch_client.transport.perform_request.return_value = {'state': 'RUNNING'}
-        
-        result = self.custom_pytorch_model.wait_for_model_registration(mock_opensearch_client, 'test-task-id', timeout=5)
+        mock_opensearch_client.transport.perform_request.return_value = {
+            "state": "RUNNING"
+        }
+
+        result = self.custom_pytorch_model.wait_for_model_registration(
+            mock_opensearch_client, "test-task-id", timeout=5
+        )
         self.assertIsNone(result)
 
-if __name__ == '__main__':
+
+if __name__ == "__main__":
     unittest.main()
diff --git a/tests/rag/test_ml_models/test_SageMakerModel.py b/tests/rag/test_ml_models/test_SageMakerModel.py
index f6443f4a..993b34f9 100644
--- a/tests/rag/test_ml_models/test_SageMakerModel.py
+++ b/tests/rag/test_ml_models/test_SageMakerModel.py
@@ -6,10 +6,12 @@
 # GitHub history for details.
 
 import unittest
-from unittest.mock import Mock, patch, call
-import json
-from io import StringIO
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.SageMakerModel import SageMakerModel
+from unittest.mock import Mock, patch
+
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.ml_models.SageMakerModel import (
+    SageMakerModel,
+)
+
 
 class TestSageMakerModel(unittest.TestCase):
 
@@ -24,30 +26,43 @@ def setUp(self):
             self.opensearch_domain_name,
             self.opensearch_username,
             self.opensearch_password,
-            self.mock_iam_role_helper
+            self.mock_iam_role_helper,
         )
 
     def test_init(self):
         self.assertEqual(self.sagemaker_model.aws_region, self.aws_region)
-        self.assertEqual(self.sagemaker_model.opensearch_domain_name, self.opensearch_domain_name)
-        self.assertEqual(self.sagemaker_model.opensearch_username, self.opensearch_username)
-        self.assertEqual(self.sagemaker_model.opensearch_password, self.opensearch_password)
-        self.assertEqual(self.sagemaker_model.iam_role_helper, self.mock_iam_role_helper)
-
-    @patch('builtins.input', side_effect=[
-        'arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint',
-        'https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations',
-        ''  # Empty string for region, to use default
-    ])
+        self.assertEqual(
+            self.sagemaker_model.opensearch_domain_name, self.opensearch_domain_name
+        )
+        self.assertEqual(
+            self.sagemaker_model.opensearch_username, self.opensearch_username
+        )
+        self.assertEqual(
+            self.sagemaker_model.opensearch_password, self.opensearch_password
+        )
+        self.assertEqual(
+            self.sagemaker_model.iam_role_helper, self.mock_iam_role_helper
+        )
+
+    @patch(
+        "builtins.input",
+        side_effect=[
+            "arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint",
+            "https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations",
+            "",  # Empty string for region, to use default
+        ],
+    )
     def test_register_sagemaker_model(self, mock_input):
         mock_helper = Mock()
         mock_helper.create_connector_with_role.return_value = "test-connector-id"
         mock_helper.create_model.return_value = "test-model-id"
-        
+
         mock_config = {}
         mock_save_config = Mock()
 
-        self.sagemaker_model.register_sagemaker_model(mock_helper, mock_config, mock_save_config)
+        self.sagemaker_model.register_sagemaker_model(
+            mock_helper, mock_config, mock_save_config
+        )
 
         # Check if create_connector_with_role was called
         mock_helper.create_connector_with_role.assert_called_once()
@@ -58,62 +73,85 @@ def test_register_sagemaker_model(self, mock_input):
         self.assertIn("my_test_create_sagemaker_connector_role", call_args)
 
         # Check the inline policy
-        inline_policy = next(arg for arg in call_args if isinstance(arg, dict) and 'Statement' in arg)
-        self.assertEqual(inline_policy['Statement'][0]['Action'], ["sagemaker:InvokeEndpoint"])
-        self.assertEqual(inline_policy['Statement'][0]['Resource'], 
-                        "arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint")
+        inline_policy = next(
+            arg for arg in call_args if isinstance(arg, dict) and "Statement" in arg
+        )
+        self.assertEqual(
+            inline_policy["Statement"][0]["Action"], ["sagemaker:InvokeEndpoint"]
+        )
+        self.assertEqual(
+            inline_policy["Statement"][0]["Resource"],
+            "arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint",
+        )
 
         # Check the connector input
-        connector_input = next(arg for arg in call_args if isinstance(arg, dict) and 'name' in arg)
-        self.assertEqual(connector_input['name'], "SageMaker Embedding Model Connector")
-        self.assertEqual(connector_input['parameters']['region'], "us-west-2")
-        self.assertEqual(connector_input['actions'][0]['url'], 
-                        "https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations")
+        connector_input = next(
+            arg for arg in call_args if isinstance(arg, dict) and "name" in arg
+        )
+        self.assertEqual(connector_input["name"], "SageMaker Embedding Model Connector")
+        self.assertEqual(connector_input["parameters"]["region"], "us-west-2")
+        self.assertEqual(
+            connector_input["actions"][0]["url"],
+            "https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations",
+        )
 
         # Check if create_model was called with correct arguments
         mock_helper.create_model.assert_called_once_with(
             "SageMaker Embedding Model",
             "SageMaker embedding model for semantic search",
             "test-connector-id",
-            "my_test_create_sagemaker_connector_role"
+            "my_test_create_sagemaker_connector_role",
         )
 
         # Check if config was saved correctly
-        mock_save_config.assert_called_once_with({'embedding_model_id': 'test-model-id'})
+        mock_save_config.assert_called_once_with(
+            {"embedding_model_id": "test-model-id"}
+        )
 
-    @patch('builtins.input', side_effect=[
-        'arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint',
-        'https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations',
-        ''  # Empty string for region, to use default
-    ])
+    @patch(
+        "builtins.input",
+        side_effect=[
+            "arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint",
+            "https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations",
+            "",  # Empty string for region, to use default
+        ],
+    )
     def test_register_sagemaker_model_connector_creation_failure(self, mock_input):
         mock_helper = Mock()
         mock_helper.create_connector_with_role.return_value = None
-        
+
         mock_config = {}
         mock_save_config = Mock()
 
-        self.sagemaker_model.register_sagemaker_model(mock_helper, mock_config, mock_save_config)
+        self.sagemaker_model.register_sagemaker_model(
+            mock_helper, mock_config, mock_save_config
+        )
 
         mock_helper.create_model.assert_not_called()
         mock_save_config.assert_not_called()
 
-    @patch('builtins.input', side_effect=[
-        'arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint',
-        'https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations',
-        ''  # Empty string for region, to use default
-    ])
+    @patch(
+        "builtins.input",
+        side_effect=[
+            "arn:aws:sagemaker:us-west-2:123456789012:endpoint/test-endpoint",
+            "https://runtime.sagemaker.us-west-2.amazonaws.com/endpoints/test-endpoint/invocations",
+            "",  # Empty string for region, to use default
+        ],
+    )
     def test_register_sagemaker_model_model_creation_failure(self, mock_input):
         mock_helper = Mock()
         mock_helper.create_connector_with_role.return_value = "test-connector-id"
         mock_helper.create_model.return_value = None
-        
+
         mock_config = {}
         mock_save_config = Mock()
 
-        self.sagemaker_model.register_sagemaker_model(mock_helper, mock_config, mock_save_config)
+        self.sagemaker_model.register_sagemaker_model(
+            mock_helper, mock_config, mock_save_config
+        )
 
         mock_save_config.assert_not_called()
 
-if __name__ == '__main__':
+
+if __name__ == "__main__":
     unittest.main()
diff --git a/tests/rag/test_opensearch_connector.py b/tests/rag/test_opensearch_connector.py
index 331372a7..3334c7a0 100644
--- a/tests/rag/test_opensearch_connector.py
+++ b/tests/rag/test_opensearch_connector.py
@@ -6,29 +6,34 @@
 # GitHub history for details.
 
 import unittest
-from unittest.mock import patch, MagicMock, Mock
-from opensearchpy import OpenSearch, AWSV4SignerAuth, exceptions as opensearch_exceptions
-from urllib.parse import urlparse
-from opensearchpy import RequestsHttpConnection
+from unittest.mock import MagicMock, Mock, patch
+
+from opensearchpy import AWSV4SignerAuth, RequestsHttpConnection
+from opensearchpy import exceptions as opensearch_exceptions
 
 # Adjust the import to match your project structure
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import OpenSearchConnector
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import (
+    OpenSearchConnector,
+)
+
 
 class TestOpenSearchConnector(unittest.TestCase):
     def setUp(self):
         # Sample configuration
         self.config = {
-            'region': 'us-east-1',
-            'index_name': 'test-index',
-            'is_serverless': 'False',
-            'opensearch_endpoint': 'https://search-example.us-east-1.es.amazonaws.com',
-            'opensearch_username': 'admin',
-            'opensearch_password': 'admin',
-            'service_type': 'managed',
+            "region": "us-east-1",
+            "index_name": "test-index",
+            "is_serverless": "False",
+            "opensearch_endpoint": "https://search-example.us-east-1.es.amazonaws.com",
+            "opensearch_username": "*****",
+            "opensearch_password": "*****",
+            "service_type": "managed",
         }
 
         # Update the patch target to match the actual import location
-        self.patcher_opensearch = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector.OpenSearch')
+        self.patcher_opensearch = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector.OpenSearch"
+        )
         self.MockOpenSearch = self.patcher_opensearch.start()
 
         # Mocked OpenSearch client instance
@@ -36,12 +41,14 @@ def setUp(self):
         self.MockOpenSearch.return_value = self.mock_opensearch_client
 
         # Patch boto3 Session
-        self.patcher_boto3_session = patch('boto3.Session')
+        self.patcher_boto3_session = patch("boto3.Session")
         self.MockBoto3Session = self.patcher_boto3_session.start()
 
         # Mocked boto3 credentials
         self.mock_credentials = Mock()
-        self.MockBoto3Session.return_value.get_credentials.return_value = self.mock_credentials
+        self.MockBoto3Session.return_value.get_credentials.return_value = (
+            self.mock_credentials
+        )
 
     def tearDown(self):
         self.patcher_opensearch.stop()
@@ -53,58 +60,92 @@ def test_initialize_opensearch_client_managed(self):
         self.assertTrue(result)
         self.MockOpenSearch.assert_called_once()
         self.MockOpenSearch.assert_called_with(
-            hosts=[{'host': 'search-example.us-east-1.es.amazonaws.com', 'port': 443}],
-            http_auth=('admin', 'admin'),
+            hosts=[{"host": "search-example.us-east-1.es.amazonaws.com", "port": 443}],
+            http_auth=("*****", "*****"),
             use_ssl=True,
-            verify_certs=False,
+            verify_certs=True,
+            ssl_show_warn=False,
             connection_class=RequestsHttpConnection,
-            pool_maxsize=20
+            pool_maxsize=20,
         )
 
     def test_initialize_opensearch_client_serverless(self):
-        self.config['service_type'] = 'serverless'
+        self.config["service_type"] = "serverless"
         connector = OpenSearchConnector(self.config)
         result = connector.initialize_opensearch_client()
         self.assertTrue(result)
         self.MockOpenSearch.assert_called_once()
         # Check that AWSV4SignerAuth is used
         args, kwargs = self.MockOpenSearch.call_args
-        self.assertIsInstance(kwargs['http_auth'], AWSV4SignerAuth)
+        self.assertIsInstance(kwargs["http_auth"], AWSV4SignerAuth)
 
     def test_initialize_opensearch_client_missing_endpoint(self):
-        self.config['opensearch_endpoint'] = ''
+        self.config["opensearch_endpoint"] = ""
         connector = OpenSearchConnector(self.config)
-        with patch('builtins.print') as mock_print:
+        with patch("builtins.print") as mock_print:
             result = connector.initialize_opensearch_client()
             self.assertFalse(result)
-            mock_print.assert_called_with("OpenSearch endpoint not set. Please run setup first.")
+            mock_print.assert_called_with(
+                "OpenSearch endpoint not set. Please run setup first."
+            )
 
     def test_create_index_success(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
-        connector.create_index(embedding_dimension=768, space_type='cosinesimil')
+        connector.create_index(
+            embedding_dimension=768,
+            space_type="cosinesimil",
+            ef_construction=512,
+            number_of_shards=1,
+            number_of_replicas=1,
+            passage_text_field="passage_text",
+            passage_chunk_field="passage_chunk",
+            embedding_field="passage_embedding",
+        )
         self.mock_opensearch_client.indices.create.assert_called_once()
 
     def test_create_index_already_exists(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
-        # Simulate index already exists exception
-        self.mock_opensearch_client.indices.create.side_effect = opensearch_exceptions.RequestError(
-            '400', 'resource_already_exists_exception', 'Index already exists'
+        self.mock_opensearch_client.indices.create.side_effect = (
+            opensearch_exceptions.RequestError(
+                "400", "resource_already_exists_exception", "Index already exists"
+            )
         )
-        with patch('builtins.print') as mock_print:
-            connector.create_index(embedding_dimension=768, space_type='cosinesimil')
-            mock_print.assert_called_with(f"Index '{self.config['index_name']}' already exists.")
+        with patch("builtins.print") as mock_print:
+            connector.create_index(
+                embedding_dimension=768,
+                space_type="cosinesimil",
+                ef_construction=512,
+                number_of_shards=1,
+                number_of_replicas=1,
+                passage_text_field="passage_text",
+                passage_chunk_field="passage_chunk",
+                embedding_field="passage_embedding",
+            )
+            mock_print.assert_called_with(
+                f"Index '{self.config['index_name']}' already exists."
+            )
 
     def test_create_index_other_exception(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
-        # Simulate a different exception
-        self.mock_opensearch_client.indices.create.side_effect = opensearch_exceptions.RequestError(
-            '400', 'some_other_exception', 'Some other error'
+        self.mock_opensearch_client.indices.create.side_effect = (
+            opensearch_exceptions.RequestError(
+                400, "some_other_exception", "Some other error"
+            )
         )
-        with patch('builtins.print') as mock_print:
-            connector.create_index(embedding_dimension=768, space_type='cosinesimil')
+        with patch("builtins.print") as mock_print:
+            connector.create_index(
+                embedding_dimension=768,
+                space_type="cosinesimil",
+                ef_construction=512,
+                number_of_shards=1,
+                number_of_replicas=1,
+                passage_text_field="passage_text",
+                passage_chunk_field="passage_chunk",
+                embedding_field="passage_embedding",
+            )
             expected_message = f"Error creating index '{self.config['index_name']}': RequestError(400, 'some_other_exception')"
             mock_print.assert_called_with(expected_message)
 
@@ -112,82 +153,130 @@ def test_verify_and_create_index_exists(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
         self.mock_opensearch_client.indices.exists.return_value = True
-        with patch('builtins.print') as mock_print:
-            result = connector.verify_and_create_index(embedding_dimension=768, space_type='cosinesimil')
+        with patch("builtins.print") as mock_print:
+            result = connector.verify_and_create_index(
+                embedding_dimension=768,
+                space_type="cosinesimil",
+                ef_construction=512,
+                number_of_shards=1,
+                number_of_replicas=1,
+                passage_text_field="passage_text",
+                passage_chunk_field="passage_chunk",
+                embedding_field="passage_embedding",
+            )
             self.assertTrue(result)
-            mock_print.assert_called_with(f"KNN index '{self.config['index_name']}' already exists.")
+            mock_print.assert_called_with(
+                f"KNN index '{self.config['index_name']}' already exists."
+            )
 
     def test_verify_and_create_index_not_exists(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
         self.mock_opensearch_client.indices.exists.return_value = False
-        with patch.object(connector, 'create_index') as mock_create_index:
-            result = connector.verify_and_create_index(embedding_dimension=768, space_type='cosinesimil')
+        with patch.object(connector, "create_index") as mock_create_index:
+            result = connector.verify_and_create_index(
+                embedding_dimension=768,
+                space_type="cosinesimil",
+                ef_construction=512,
+                number_of_shards=1,
+                number_of_replicas=1,
+                passage_text_field="passage_text",
+                passage_chunk_field="passage_chunk",
+                embedding_field="passage_embedding",
+            )
             self.assertTrue(result)
-            mock_create_index.assert_called_once_with(768, 'cosinesimil')
+            mock_create_index.assert_called_once_with(
+                768,
+                "cosinesimil",
+                512,
+                1,
+                1,
+                "passage_text",
+                "passage_chunk",
+                "passage_embedding",
+            )
 
     def test_verify_and_create_index_exception(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
-        self.mock_opensearch_client.indices.exists.side_effect = Exception('Connection error')
-        with patch('builtins.print') as mock_print:
-            result = connector.verify_and_create_index(embedding_dimension=768, space_type='cosinesimil')
+        self.mock_opensearch_client.indices.exists.side_effect = Exception(
+            "Connection error"
+        )
+        with patch("builtins.print") as mock_print:
+            result = connector.verify_and_create_index(
+                embedding_dimension=768,
+                space_type="cosinesimil",
+                ef_construction=512,
+                number_of_shards=1,
+                number_of_replicas=1,
+                passage_text_field="passage_text",
+                passage_chunk_field="passage_chunk",
+                embedding_field="passage_embedding",
+            )
             self.assertFalse(result)
-            mock_print.assert_called_with("Error verifying or creating index: Connection error")
+            mock_print.assert_called_with(
+                "Error verifying or creating index: Connection error"
+            )
 
-    @patch('opensearchpy.helpers.bulk')
+    @patch("opensearchpy.helpers.bulk")
     def test_bulk_index_success(self, mock_bulk):
         mock_bulk.return_value = (100, [])
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
-        actions = [{'index': {'_index': 'test-index', '_id': i}} for i in range(100)]
-        with patch('builtins.print') as mock_print:
+        actions = [{"index": {"_index": "test-index", "_id": i}} for i in range(100)]
+        with patch("builtins.print") as mock_print:
             success_count, error_count = connector.bulk_index(actions)
             self.assertEqual(success_count, 100)
             self.assertEqual(error_count, 0)
-            mock_print.assert_called_with("Indexed 100 documents successfully. Failed to index 0 documents.")
+            mock_print.assert_called_with(
+                "Indexed 100 documents successfully. Failed to index 0 documents."
+            )
 
-    @patch('opensearchpy.helpers.bulk')
+    @patch("opensearchpy.helpers.bulk")
     def test_bulk_index_with_errors(self, mock_bulk):
-        mock_bulk.return_value = (90, [{'index': {'_id': '10', 'error': 'Some error'}}])
+        mock_bulk.return_value = (90, [{"index": {"_id": "10", "error": "Some error"}}])
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
-        actions = [{'index': {'_index': 'test-index', '_id': i}} for i in range(100)]
-        with patch('builtins.print') as mock_print:
+        actions = [{"index": {"_index": "test-index", "_id": i}} for i in range(100)]
+        with patch("builtins.print") as mock_print:
             success_count, error_count = connector.bulk_index(actions)
             self.assertEqual(success_count, 90)
             self.assertEqual(error_count, 1)
-            mock_print.assert_called_with("Indexed 90 documents successfully. Failed to index 1 documents.")
+            mock_print.assert_called_with(
+                "Indexed 90 documents successfully. Failed to index 1 documents."
+            )
 
-    @patch('opensearchpy.helpers.bulk')
+    @patch("opensearchpy.helpers.bulk")
     def test_bulk_index_exception(self, mock_bulk):
-        mock_bulk.side_effect = Exception('Bulk indexing error')
+        mock_bulk.side_effect = Exception("Bulk indexing error")
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
-        actions = [{'index': {'_index': 'test-index', '_id': i}} for i in range(100)]
-        with patch('builtins.print') as mock_print:
+        actions = [{"index": {"_index": "test-index", "_id": i}} for i in range(100)]
+        with patch("builtins.print") as mock_print:
             success_count, error_count = connector.bulk_index(actions)
             self.assertEqual(success_count, 0)
             self.assertEqual(error_count, 100)
-            mock_print.assert_called_with("Error during bulk indexing: Bulk indexing error")
+            mock_print.assert_called_with(
+                "Error during bulk indexing: Bulk indexing error"
+            )
 
     def test_search_success(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
         # Mock search response
         self.mock_opensearch_client.search.return_value = {
-            'hits': {'hits': [{'id': 1}, {'id': 2}]}
+            "hits": {"hits": [{"id": 1}, {"id": 2}]}
         }
-        results = connector.search(query_text='test', model_id='model-123', k=5)
-        self.assertEqual(results, [{'id': 1}, {'id': 2}])
+        results = connector.search(query_text="test", model_id="model-123", k=5)
+        self.assertEqual(results, [{"id": 1}, {"id": 2}])
         self.mock_opensearch_client.search.assert_called_once()
 
     def test_search_exception(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
-        self.mock_opensearch_client.search.side_effect = Exception('Search error')
-        with patch('builtins.print') as mock_print:
-            results = connector.search(query_text='test', model_id='model-123', k=5)
+        self.mock_opensearch_client.search.side_effect = Exception("Search error")
+        with patch("builtins.print") as mock_print:
+            results = connector.search(query_text="test", model_id="model-123", k=5)
             self.assertEqual(results, [])
             mock_print.assert_called_with("Error during search: Search error")
 
@@ -195,17 +284,19 @@ def test_search_by_vector_success(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
         self.mock_opensearch_client.search.return_value = {
-            'hits': {'hits': [{'id': 1}, {'id': 2}]}
+            "hits": {"hits": [{"id": 1}, {"id": 2}]}
         }
         results = connector.search_by_vector(vector=[0.1, 0.2, 0.3], k=5)
-        self.assertEqual(results, [{'id': 1}, {'id': 2}])
+        self.assertEqual(results, [{"id": 1}, {"id": 2}])
         self.mock_opensearch_client.search.assert_called_once()
 
     def test_search_by_vector_exception(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
-        self.mock_opensearch_client.search.side_effect = Exception('Vector search error')
-        with patch('builtins.print') as mock_print:
+        self.mock_opensearch_client.search.side_effect = Exception(
+            "Vector search error"
+        )
+        with patch("builtins.print") as mock_print:
             results = connector.search_by_vector(vector=[0.1, 0.2, 0.3], k=5)
             self.assertEqual(results, [])
             mock_print.assert_called_with("Error during search: Vector search error")
@@ -214,7 +305,9 @@ def test_check_connection_success(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
         # Mock info method
-        self.mock_opensearch_client.info.return_value = {'version': {'number': '7.10.2'}}
+        self.mock_opensearch_client.info.return_value = {
+            "version": {"number": "7.10.2"}
+        }
         result = connector.check_connection()
         self.assertTrue(result)
         self.mock_opensearch_client.info.assert_called_once()
@@ -222,11 +315,14 @@ def test_check_connection_success(self):
     def test_check_connection_failure(self):
         connector = OpenSearchConnector(self.config)
         connector.opensearch_client = self.mock_opensearch_client
-        self.mock_opensearch_client.info.side_effect = Exception('Connection error')
-        with patch('builtins.print') as mock_print:
+        self.mock_opensearch_client.info.side_effect = Exception("Connection error")
+        with patch("builtins.print") as mock_print:
             result = connector.check_connection()
             self.assertFalse(result)
-            mock_print.assert_called_with("Error connecting to OpenSearch: Connection error")
+            mock_print.assert_called_with(
+                "Error connecting to OpenSearch: Connection error"
+            )
+
 
-if __name__ == '__main__':
-    unittest.main()
\ No newline at end of file
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/rag/test_query.py b/tests/rag/test_query.py
index 55d3bcb3..b9a7c321 100644
--- a/tests/rag/test_query.py
+++ b/tests/rag/test_query.py
@@ -5,206 +5,185 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
+import json
 import unittest
-from unittest.mock import patch, MagicMock
+from unittest.mock import MagicMock, patch
+
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.query import Query
-from opensearchpy import exceptions as opensearch_exceptions
-import json
+
 
 class TestQuery(unittest.TestCase):
     def setUp(self):
-        # Patch 'print' to suppress output during tests
-        self.print_patcher = patch('builtins.print')
+        self.print_patcher = patch("builtins.print")
         self.mock_print = self.print_patcher.start()
 
         self.config = {
-            'index_name': 'test-index',
-            'embedding_model_id': 'test-embedding-model-id',
-            'llm_model_id': 'test-llm-model-id',
-            'region': 'us-east-1',
-            'default_search_method': 'neural',
-            'llm_max_token_count': '1000',
-            'llm_temperature': '0.7',
-            'llm_top_p': '0.9',
-            'llm_stop_sequences': ''
+            "index_name": "test-index",
+            "embedding_model_id": "test-embedding-model-id",
+            "llm_model_id": "test-llm-model-id",
+            "region": "us-east-1",
+            "default_search_method": "neural",
+            "llm_max_token_count": "1000",
+            "llm_temperature": "0.7",
+            "llm_top_p": "0.9",
+            "llm_stop_sequences": "",
         }
-        # Do not instantiate Query here to avoid unmocked initialization.
 
     def tearDown(self):
-        # Stop the 'print' patcher
         self.print_patcher.stop()
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.boto3.client')
-    def test_initialize_clients_success(self, mock_boto3_client, mock_opensearch_connector):
-        # Mock OpenSearch client initialization
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector")
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.boto3.client")
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.EmbeddingClient")
+    def test_initialize_clients_success(
+        self, mock_embedding_client, mock_boto3_client, mock_opensearch_connector
+    ):
         mock_opensearch_connector_instance = mock_opensearch_connector.return_value
-        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = (
+            True
+        )
         mock_opensearch_connector_instance.check_connection.return_value = True
 
-        # Mock Bedrock client initialization
         mock_bedrock_client = MagicMock()
         mock_boto3_client.return_value = mock_bedrock_client
 
-        # Initialize Query instance after patches
         query_instance = Query(self.config)
 
         self.assertIsNotNone(query_instance.opensearch)
         self.assertEqual(query_instance.bedrock_client, mock_bedrock_client)
         mock_opensearch_connector_instance.initialize_opensearch_client.assert_called_once()
-        mock_boto3_client.assert_called_once_with('bedrock-runtime', region_name='us-east-1')
+        mock_boto3_client.assert_called_once_with(
+            "bedrock-runtime", region_name="us-east-1"
+        )
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector")
     def test_initialize_clients_opensearch_failure(self, mock_opensearch_connector):
-        # Mock OpenSearch client initialization failure
         mock_opensearch_connector_instance = mock_opensearch_connector.return_value
-        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = False
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = (
+            False
+        )
 
-        # Since 'print' is mocked in setUp, we can use 'self.mock_print' to assert calls
-        query_instance = Query(self.config)
-        mock_opensearch_connector_instance.initialize_opensearch_client.assert_called_once()
-        self.mock_print.assert_any_call("Failed to initialize OpenSearch client.")
-        self.mock_print.assert_any_call("Failed to initialize clients. Aborting.")
+        Query(self.config)
+        self.mock_print.assert_any_call(
+            "\x1b[31mFailed to initialize OpenSearch client.\x1b[0m"
+        )
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector")
     def test_extract_relevant_sentences(self, mock_opensearch_connector):
-        # Mock OpenSearch client to prevent initialization
         mock_opensearch_connector_instance = mock_opensearch_connector.return_value
-        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = (
+            True
+        )
 
         query_instance = Query(self.config)
-        query_text = 'What is the capital of France?'
-        text = 'Paris is the capital of France. It is known for the Eiffel Tower.'
-        expected_sentences = ['Paris is the capital of France']
+        query_text = "What is the capital of France?"
+        text = "Paris is the capital of France. It is known for the Eiffel Tower."
+        expected_sentences = ["Paris is the capital of France"]
 
         result = query_instance.extract_relevant_sentences(query_text, text)
         self.assertIn(expected_sentences[0], result)
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector")
     def test_bulk_query_neural_success(self, mock_opensearch_connector):
-        # Mock OpenSearch client
         mock_opensearch_connector_instance = mock_opensearch_connector.return_value
-        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = (
+            True
+        )
 
-        queries = ['What is the capital of France?']
+        queries = ["What is the capital of France?"]
         mock_hits = [
-            {
-                '_score': 1.0,
-                '_source': {'content': 'Paris is the capital of France.'}
-            }
+            {"_score": 1.0, "_source": {"content": "Paris is the capital of France."}}
         ]
         query_instance = Query(self.config)
-        with patch.object(query_instance.opensearch, 'search', return_value=mock_hits):
+        with patch.object(query_instance.opensearch, "search", return_value=mock_hits):
             results = query_instance.bulk_query_neural(queries, k=1)
             self.assertEqual(len(results), 1)
-            self.assertEqual(results[0]['num_results'], 1)
-            self.assertEqual(results[0]['documents'][0]['source']['content'], 'Paris is the capital of France.')
+            self.assertEqual(results[0]["num_results"], 1)
+            self.assertEqual(
+                results[0]["documents"][0]["source"]["content"],
+                "Paris is the capital of France.",
+            )
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector")
     def test_bulk_query_neural_failure(self, mock_opensearch_connector):
-        # Mock OpenSearch client
         mock_opensearch_connector_instance = mock_opensearch_connector.return_value
-        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = (
+            True
+        )
 
-        queries = ['What is the capital of France?']
+        queries = ["What is the capital of France?"]
         query_instance = Query(self.config)
-        with patch.object(query_instance.opensearch, 'search', side_effect=Exception('Search error')):
+        with patch.object(
+            query_instance.opensearch, "search", side_effect=Exception("Search error")
+        ):
             results = query_instance.bulk_query_neural(queries, k=1)
             self.assertEqual(len(results), 1)
-            self.assertEqual(results[0]['num_results'], 0)
-            self.mock_print.assert_any_call("\x1b[31mError performing search for query 'What is the capital of France?': Search error\x1b[0m")
+            self.assertEqual(results[0]["num_results"], 0)
+            self.mock_print.assert_any_call(
+                "\x1b[31mError performing search for query 'What is the capital of France?': Search error\x1b[0m"
+            )
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector")
     def test_bulk_query_semantic_success(self, mock_opensearch_connector):
-        # Mock OpenSearch client
         mock_opensearch_connector_instance = mock_opensearch_connector.return_value
-        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = (
+            True
+        )
 
-        queries = ['What is the capital of France?']
+        queries = ["What is the capital of France?"]
         embedding = [0.1, 0.2, 0.3]
         mock_hits = [
             {
-                '_score': 1.0,
-                '_source': {'nominee_text': 'Paris is the capital of France.'}
+                "_score": 1.0,
+                "_source": {"passage_chunk": ["Paris is the capital of France."]},
             }
         ]
         query_instance = Query(self.config)
-        with patch.object(query_instance, 'text_embedding', return_value=embedding):
-            with patch.object(query_instance.opensearch, 'search_by_vector', return_value=mock_hits):
-                results = query_instance.bulk_query_semantic(queries, k=1)
-                self.assertEqual(len(results), 1)
-                self.assertEqual(results[0]['num_results'], 1)
-                self.assertIn('Paris is the capital of France.', results[0]['context'])
-
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
-    def test_bulk_query_semantic_embedding_failure(self, mock_opensearch_connector):
-        # Mock OpenSearch client
-        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
-        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
-
-        queries = ['What is the capital of France?']
-        query_instance = Query(self.config)
-        with patch.object(query_instance, 'text_embedding', return_value=None):
+        query_instance.embedding_client = MagicMock()
+        query_instance.embedding_client.get_text_embedding.return_value = embedding
+        with patch.object(
+            query_instance.opensearch, "search_by_vector", return_value=mock_hits
+        ):
             results = query_instance.bulk_query_semantic(queries, k=1)
             self.assertEqual(len(results), 1)
-            self.assertEqual(results[0]['num_results'], 0)
-            self.mock_print.assert_any_call('\x1b[31mFailed to generate embedding for query: What is the capital of France?\x1b[0m')
-
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
-    def test_text_embedding_success(self, mock_opensearch_connector):
-        # Mock OpenSearch client
-        mock_opensearch_connector_instance = mock_opensearch_connector.return_value
-        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
-
-        text = 'Sample text'
-        embedding = [0.1, 0.2, 0.3]
-        response = {
-            'inference_results': [
-                {
-                    'output': [
-                        {'data': embedding}
-                    ]
-                }
-            ]
-        }
-        query_instance = Query(self.config)
-        with patch.object(query_instance.opensearch, 'opensearch_client') as mock_opensearch_client:
-            mock_opensearch_client.transport.perform_request.return_value = response
-
-            result = query_instance.text_embedding(text)
-            self.assertEqual(result, embedding)
-            mock_opensearch_client.transport.perform_request.assert_called_once()
+            self.assertEqual(results[0]["num_results"], 1)
+            self.assertIn("Paris is the capital of France.", results[0]["context"])
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
-    def test_text_embedding_failure(self, mock_opensearch_connector):
-        # Mock OpenSearch client
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector")
+    def test_bulk_query_semantic_embedding_failure(self, mock_opensearch_connector):
         mock_opensearch_connector_instance = mock_opensearch_connector.return_value
-        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = (
+            True
+        )
 
-        text = 'Sample text'
+        queries = ["What is the capital of France?"]
         query_instance = Query(self.config)
-        with patch.object(query_instance.opensearch, 'opensearch_client') as mock_opensearch_client:
-            mock_opensearch_client.transport.perform_request.side_effect = Exception('Test exception')
-
-            with self.assertRaises(Exception) as context:
-                query_instance.text_embedding(text, max_retries=1)
-            self.assertTrue('Test exception' in str(context.exception))
-            self.mock_print.assert_any_call('Error on attempt 1: Test exception')
-
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.tiktoken.get_encoding')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.boto3.client')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
-    def test_generate_answer_success(self, mock_opensearch_connector, mock_boto3_client, mock_get_encoding):
-        # Mock OpenSearch client
+        query_instance.embedding_client = MagicMock()
+        query_instance.embedding_client.get_text_embedding.return_value = None
+        results = query_instance.bulk_query_semantic(queries, k=1)
+        self.assertEqual(len(results), 1)
+        self.assertEqual(results[0]["num_results"], 0)
+        self.mock_print.assert_any_call(
+            "\x1b[31mFailed to generate embedding for query: What is the capital of France?\x1b[0m"
+        )
+
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.tiktoken.get_encoding")
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.boto3.client")
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector")
+    def test_generate_answer_success(
+        self, mock_opensearch_connector, mock_boto3_client, mock_get_encoding
+    ):
         mock_opensearch_connector_instance = mock_opensearch_connector.return_value
-        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = (
+            True
+        )
 
-        prompt = 'Sample prompt'
+        prompt = "Sample prompt"
         llm_config = {
-            'maxTokenCount': 100,
-            'temperature': 0.7,
-            'topP': 0.9,
-            'stopSequences': []
+            "maxTokenCount": 100,
+            "temperature": 0.7,
+            "topP": 0.9,
+            "stopSequences": [],
         }
         encoding_instance = MagicMock()
         encoding_instance.encode.return_value = [1, 2, 3]
@@ -213,35 +192,36 @@ def test_generate_answer_success(self, mock_opensearch_connector, mock_boto3_cli
 
         mock_bedrock_client = mock_boto3_client.return_value
         response_stream = MagicMock()
-        response_stream.read.return_value = json.dumps({
-            'results': [
-                {'outputText': 'Generated answer'}
-            ]
-        })
-        response = {'body': response_stream}
+        response_stream.read.return_value = json.dumps(
+            {"results": [{"outputText": "Generated answer"}]}
+        )
+        response = {"body": response_stream}
         mock_bedrock_client.invoke_model.return_value = response
 
         query_instance = Query(self.config)
-        query_instance.bedrock_client = mock_bedrock_client  # Set the mocked bedrock client
+        query_instance.bedrock_client = mock_bedrock_client
 
         answer = query_instance.generate_answer(prompt, llm_config)
-        self.assertEqual(answer, 'Generated answer')
+        self.assertEqual(answer, "Generated answer")
         mock_bedrock_client.invoke_model.assert_called_once()
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.tiktoken.get_encoding')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.boto3.client')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector')
-    def test_generate_answer_failure(self, mock_opensearch_connector, mock_boto3_client, mock_get_encoding):
-        # Mock OpenSearch client
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.tiktoken.get_encoding")
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.boto3.client")
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.query.OpenSearchConnector")
+    def test_generate_answer_failure(
+        self, mock_opensearch_connector, mock_boto3_client, mock_get_encoding
+    ):
         mock_opensearch_connector_instance = mock_opensearch_connector.return_value
-        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = True
+        mock_opensearch_connector_instance.initialize_opensearch_client.return_value = (
+            True
+        )
 
-        prompt = 'Sample prompt'
+        prompt = "Sample prompt"
         llm_config = {
-            'maxTokenCount': 100,
-            'temperature': 0.7,
-            'topP': 0.9,
-            'stopSequences': []
+            "maxTokenCount": 100,
+            "temperature": 0.7,
+            "topP": 0.9,
+            "stopSequences": [],
         }
         encoding_instance = MagicMock()
         encoding_instance.encode.return_value = [1, 2, 3]
@@ -249,14 +229,17 @@ def test_generate_answer_failure(self, mock_opensearch_connector, mock_boto3_cli
         mock_get_encoding.return_value = encoding_instance
 
         mock_bedrock_client = mock_boto3_client.return_value
-        mock_bedrock_client.invoke_model.side_effect = Exception('LLM error')
+        mock_bedrock_client.invoke_model.side_effect = Exception("LLM error")
 
         query_instance = Query(self.config)
-        query_instance.bedrock_client = mock_bedrock_client  # Set the mocked bedrock client
+        query_instance.bedrock_client = mock_bedrock_client
 
         answer = query_instance.generate_answer(prompt, llm_config)
         self.assertIsNone(answer)
-        self.mock_print.assert_any_call('Error generating answer from LLM: LLM error')
+        self.mock_print.assert_any_call(
+            "\x1b[31mError generating answer from LLM: LLM error\x1b[0m"
+        )
+
 
-if __name__ == '__main__':
-    unittest.main()
\ No newline at end of file
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/rag/test_rag.py b/tests/rag/test_rag.py
index 3b96f010..8f646b92 100644
--- a/tests/rag/test_rag.py
+++ b/tests/rag/test_rag.py
@@ -5,13 +5,12 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-import unittest
-from unittest.mock import patch, MagicMock, Mock
 import sys
-import argparse
-from io import StringIO
-from colorama import Fore, Style
+import unittest
 import warnings
+from io import StringIO
+from unittest.mock import patch
+
 from urllib3.exceptions import InsecureRequestWarning
 
 # Suppress specific warnings
@@ -22,109 +21,141 @@
 # Import the main function from rag.py
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.rag import main
 
+
 class TestRAGCLI(unittest.TestCase):
     def setUp(self):
         # Mock the config to avoid actual file operations
         self.mock_config = {
-            'service_type': 'managed',
-            'region': 'us-west-2',
-            'default_search_method': 'neural',
-            # ... other config parameters ...
+            "service_type": "managed",
+            "region": "us-west-2",
+            "default_search_method": "neural",
         }
 
         # Patch 'load_config' and 'save_config' functions
-        self.patcher_load_config = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.load_config', return_value=self.mock_config)
+        self.patcher_load_config = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.load_config",
+            return_value=self.mock_config,
+        )
         self.mock_load_config = self.patcher_load_config.start()
         self.addCleanup(self.patcher_load_config.stop)
 
-        self.patcher_save_config = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.save_config')
+        self.patcher_save_config = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.save_config"
+        )
         self.mock_save_config = self.patcher_save_config.start()
         self.addCleanup(self.patcher_save_config.stop)
 
         # Patch 'Setup', 'Ingest', and 'Query' classes
-        self.patcher_setup = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.Setup')
+        self.patcher_setup = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.Setup"
+        )
         self.mock_setup_class = self.patcher_setup.start()
         self.addCleanup(self.patcher_setup.stop)
 
-        self.patcher_ingest = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.Ingest')
+        self.patcher_ingest = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.Ingest"
+        )
         self.mock_ingest_class = self.patcher_ingest.start()
         self.addCleanup(self.patcher_ingest.stop)
 
-        self.patcher_query = patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.Query')
+        self.patcher_query = patch(
+            "opensearch_py_ml.ml_commons.rag_pipeline.rag.rag.Query"
+        )
         self.mock_query_class = self.patcher_query.start()
         self.addCleanup(self.patcher_query.stop)
 
         # Capture stdout
         self.held_stdout = StringIO()
-        self.patcher_stdout = patch('sys.stdout', new=self.held_stdout)
+        self.patcher_stdout = patch("sys.stdout", new=self.held_stdout)
         self.patcher_stdout.start()
         self.addCleanup(self.patcher_stdout.stop)
 
         # Capture stderr
         self.held_stderr = StringIO()
-        self.patcher_stderr = patch('sys.stderr', new=self.held_stderr)
+        self.patcher_stderr = patch("sys.stderr", new=self.held_stderr)
         self.patcher_stderr.start()
         self.addCleanup(self.patcher_stderr.stop)
 
     def test_setup_command(self):
-        test_args = ['rag.py', 'setup']
-        with patch.object(sys, 'argv', test_args):
+        test_args = ["rag.py", "setup"]
+        with patch.object(sys, "argv", test_args):
             main()
             # Ensure Setup.setup_command() is called
             self.mock_setup_class.return_value.setup_command.assert_called_once()
             # Ensure save_config is called
-            self.mock_save_config.assert_called_once_with(self.mock_setup_class.return_value.config)
+            self.mock_save_config.assert_called_once_with(
+                self.mock_setup_class.return_value.config
+            )
 
     def test_ingest_command_with_paths(self):
-        test_args = ['rag.py', 'ingest', '--paths', '/path/to/data1', '/path/to/data2']
-        with patch.object(sys, 'argv', test_args):
+        test_args = ["rag.py", "ingest", "--paths", "/path/to/data1", "/path/to/data2"]
+        with patch.object(sys, "argv", test_args):
             main()
             # Ensure Ingest.ingest_command() is called with correct paths
             self.mock_ingest_class.assert_called_once_with(self.mock_config)
-            self.mock_ingest_class.return_value.ingest_command.assert_called_once_with(['/path/to/data1', '/path/to/data2'])
+            self.mock_ingest_class.return_value.ingest_command.assert_called_once_with(
+                ["/path/to/data1", "/path/to/data2"]
+            )
 
     def test_ingest_command_without_paths(self):
-        test_args = ['rag.py', 'ingest']
-        with patch.object(sys, 'argv', test_args):
-            with patch('rich.prompt.Prompt.ask', side_effect=['/path/to/data', '']):
+        test_args = ["rag.py", "ingest"]
+        with patch.object(sys, "argv", test_args):
+            with patch("rich.prompt.Prompt.ask", side_effect=["/path/to/data", ""]):
                 main()
                 # Ensure Ingest.ingest_command() is called with prompted paths
                 self.mock_ingest_class.assert_called_once_with(self.mock_config)
-                self.mock_ingest_class.return_value.ingest_command.assert_called_once_with(['/path/to/data'])
+                self.mock_ingest_class.return_value.ingest_command.assert_called_once_with(
+                    ["/path/to/data"]
+                )
 
     def test_query_command_with_queries(self):
-        test_args = ['rag.py', 'query', '--queries', 'What is OpenSearch?', 'How does Bedrock work?']
-        with patch.object(sys, 'argv', test_args):
+        test_args = [
+            "rag.py",
+            "query",
+            "--queries",
+            "What is OpenSearch?",
+            "How does Bedrock work?",
+        ]
+        with patch.object(sys, "argv", test_args):
             main()
             # Ensure Query.query_command() is called with correct queries
             self.mock_query_class.assert_called_once_with(self.mock_config)
             self.mock_query_class.return_value.query_command.assert_called_once_with(
-                ['What is OpenSearch?', 'How does Bedrock work?'],
-                num_results=5
+                ["What is OpenSearch?", "How does Bedrock work?"], num_results=5
             )
 
     def test_query_command_without_queries(self):
-        test_args = ['rag.py', 'query']
-        with patch.object(sys, 'argv', test_args):
-            with patch('rich.prompt.Prompt.ask', side_effect=['What is OpenSearch?', '']):
+        test_args = ["rag.py", "query"]
+        with patch.object(sys, "argv", test_args):
+            with patch(
+                "rich.prompt.Prompt.ask", side_effect=["What is OpenSearch?", ""]
+            ):
                 main()
                 # Ensure Query.query_command() is called with prompted queries
                 self.mock_query_class.assert_called_once_with(self.mock_config)
-                self.mock_query_class.return_value.query_command.assert_called_once_with(['What is OpenSearch?'], num_results=5)
+                self.mock_query_class.return_value.query_command.assert_called_once_with(
+                    ["What is OpenSearch?"], num_results=5
+                )
 
     def test_query_command_with_num_results(self):
-        test_args = ['rag.py', 'query', '--queries', 'What is OpenSearch?', '--num_results', '3']
-        with patch.object(sys, 'argv', test_args):
+        test_args = [
+            "rag.py",
+            "query",
+            "--queries",
+            "What is OpenSearch?",
+            "--num_results",
+            "3",
+        ]
+        with patch.object(sys, "argv", test_args):
             main()
             # Ensure Query.query_command() is called with correct num_results
             self.mock_query_class.return_value.query_command.assert_called_once_with(
-                ['What is OpenSearch?'],
-                num_results=3
+                ["What is OpenSearch?"], num_results=3
             )
 
     def test_no_command(self):
-        test_args = ['rag.py']
-        with patch.object(sys, 'argv', test_args):
+        test_args = ["rag.py"]
+        with patch.object(sys, "argv", test_args):
             with self.assertRaises(SystemExit) as cm:
                 main()
             self.assertEqual(cm.exception.code, 1)
@@ -132,11 +163,13 @@ def test_no_command(self):
             stdout_output = self.held_stdout.getvalue()
             print("STDERR:", stderr_output)
             print("STDOUT:", stdout_output)
-            self.assertTrue("usage: rag.py" in stderr_output or "usage: rag.py" in stdout_output)
+            self.assertTrue(
+                "usage: rag.py" in stderr_output or "usage: rag.py" in stdout_output
+            )
 
     def test_invalid_command(self):
-        test_args = ['rag.py', 'invalid']
-        with patch.object(sys, 'argv', test_args):
+        test_args = ["rag.py", "invalid"]
+        with patch.object(sys, "argv", test_args):
             with self.assertRaises(SystemExit) as cm:
                 main()
             self.assertEqual(cm.exception.code, 2)
@@ -144,7 +177,11 @@ def test_invalid_command(self):
             stdout_output = self.held_stdout.getvalue()
             print("STDERR:", stderr_output)
             print("STDOUT:", stdout_output)
-            self.assertTrue("invalid choice: 'invalid'" in stderr_output or "invalid choice: 'invalid'" in stdout_output)
+            self.assertTrue(
+                "invalid choice: 'invalid'" in stderr_output
+                or "invalid choice: 'invalid'" in stdout_output
+            )
+
 
-if __name__ == '__main__':
+if __name__ == "__main__":
     unittest.main()
diff --git a/tests/rag/test_rag_setup.py b/tests/rag/test_rag_setup.py
index 7ee990f9..0f98d567 100644
--- a/tests/rag/test_rag_setup.py
+++ b/tests/rag/test_rag_setup.py
@@ -5,188 +5,144 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-import unittest
-from unittest.mock import patch, MagicMock
-import os
 import configparser
+import os
+import unittest
+from unittest.mock import MagicMock, patch
+
+# Adjust the import path to wherever Setup is actually defined
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.rag_setup import Setup
-from colorama import Fore, Style
+
 
 class TestSetup(unittest.TestCase):
-    def setUp(self):
-        # Sample configuration
-        self.sample_config = {
-            'service_type': 'managed',
-            'region': 'us-west-2',
-            'iam_principal': 'arn:aws:iam::123456789012:user/test-user',
-            'collection_name': 'test-collection',
-            'opensearch_endpoint': 'https://search-hashim-test5.us-west-2.es.amazonaws.com',
-            'opensearch_username': '*****',
-            'opensearch_password': 'password',
-            'default_search_method': 'neural',
-            'index_name': 'test-index',
-            'embedding_dimension': '768',
-            'space_type': 'cosinesimil',
-            'ef_construction': '512',
-        }
 
-        # Initialize Setup instance
+    def setUp(self):
+        if os.path.exists(Setup.CONFIG_FILE):
+            os.remove(Setup.CONFIG_FILE)
         self.setup_instance = Setup()
 
-        # Set index_name for tests
-        self.setup_instance.index_name = self.sample_config['index_name']
-
-        # Mock AWS clients
-        self.mock_boto3_client = patch('boto3.client').start()
-        self.addCleanup(patch.stopall)
+    def tearDown(self):
+        if os.path.exists(Setup.CONFIG_FILE):
+            os.remove(Setup.CONFIG_FILE)
+
+    @patch("builtins.input", return_value="fake_input")
+    @patch("subprocess.run")
+    def test_configure_aws(self, mock_subprocess, mock_input):
+        with patch.object(
+            self.setup_instance,
+            "get_password_with_asterisks",
+            return_value="fake_secret",
+        ):
+            self.setup_instance.configure_aws()
+            self.assertEqual(mock_subprocess.call_count, 3)
 
-        # Mock OpenSearch client
-        self.mock_opensearch_client = MagicMock()
-        self.setup_instance.opensearch_client = self.mock_opensearch_client
-
-        # Mock os.path.exists
-        self.patcher_os_path_exists = patch('os.path.exists', return_value=True)
-        self.mock_os_path_exists = self.patcher_os_path_exists.start()
-        self.addCleanup(self.patcher_os_path_exists.stop)
-
-        # Mock configparser
-        self.patcher_configparser = patch('configparser.ConfigParser')
-        self.mock_configparser_class = self.patcher_configparser.start()
-        self.mock_configparser = MagicMock()
-        self.mock_configparser_class.return_value = self.mock_configparser
-        self.addCleanup(self.patcher_configparser.stop)
+    def test_load_config_no_file(self):
+        config = self.setup_instance.load_config()
+        self.assertEqual(config, {})
+
+    def test_load_config_with_file(self):
+        parser = configparser.ConfigParser()
+        parser["DEFAULT"] = {"region": "us-east-1", "service_type": "managed"}
+        with open(Setup.CONFIG_FILE, "w") as f:
+            parser.write(f)
+        config = self.setup_instance.load_config()
+        self.assertEqual(config.get("region"), "us-east-1")
+        self.assertEqual(config.get("service_type"), "managed")
+
+    @patch("sys.stdin")
+    @patch("sys.stdout")
+    def test_get_password_with_asterisks(self, mock_stdout, mock_stdin):
+        mock_stdin.fileno.return_value = 0
+        mock_stdin.read = MagicMock(side_effect=list("secret\n"))
+        pwd = self.setup_instance.get_password_with_asterisks("Enter password: ")
+        self.assertEqual(pwd, "secret")
+
+    @patch("builtins.input", side_effect=["2", "", "no", "2", ""])
+    def test_setup_configuration_open_source_no_auth(self, mock_input):
+        self.setup_instance.setup_configuration()
+        config = self.setup_instance.config
+        self.assertEqual(config["service_type"], "open-source")
+        self.assertEqual(config["opensearch_username"], "")
+        self.assertEqual(config["opensearch_password"], "")
+
+    @patch("boto3.client")
+    def test_initialize_clients_managed(self, mock_boto_client):
+        self.setup_instance.service_type = "managed"
+        self.setup_instance.aws_region = "us-west-2"
+        mock_boto_client.return_value = MagicMock()
+        result = self.setup_instance.initialize_clients()
+        self.assertTrue(result)
+
+    def test_initialize_clients_open_source(self):
+        self.setup_instance.service_type = "open-source"
+        result = self.setup_instance.initialize_clients()
+        self.assertTrue(result)
 
-    def test_load_config_existing(self):
-        with patch('os.path.exists', return_value=True):
-            self.mock_configparser.read.return_value = None
-            self.mock_configparser.__getitem__.return_value = self.sample_config
-            config = self.setup_instance.load_config()
-            self.assertEqual(config, self.sample_config)
+    def test_get_opensearch_domain_name(self):
+        self.setup_instance.opensearch_endpoint = (
+            "https://search-my-domain-name-abc123.us-west-2.es.amazonaws.com"
+        )
+        domain_name = self.setup_instance.get_opensearch_domain_name()
+        self.assertEqual(domain_name, "my-domain-name")
+
+    @patch("boto3.client")
+    def test_get_opensearch_domain_info(self, mock_boto_client):
+        mock_client = MagicMock()
+        mock_boto_client.return_value = mock_client
+        mock_client.describe_domain.return_value = {
+            "DomainStatus": {"Endpoint": "search-endpoint", "ARN": "test-arn"}
+        }
+        endpoint, arn = self.setup_instance.get_opensearch_domain_info(
+            "us-west-2", "mydomain"
+        )
+        self.assertEqual(endpoint, "search-endpoint")
+        self.assertEqual(arn, "test-arn")
 
-    def test_load_config_no_file(self):
-        with patch('os.path.exists', return_value=False):
-            self.mock_configparser.read.return_value = None
-            config = self.setup_instance.load_config()
-            self.assertEqual(config, {})
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.rag_setup.OpenSearch")
+    def test_initialize_opensearch_client_managed(self, mock_opensearch):
+        self.setup_instance.service_type = "managed"
+        self.setup_instance.opensearch_endpoint = "https://test-domain:443"
+        self.setup_instance.opensearch_username = "admin"
+        self.setup_instance.opensearch_password = "pass"
+        result = self.setup_instance.initialize_opensearch_client()
+        self.assertTrue(result)
+        mock_opensearch.assert_called_once()
+
+    @patch("opensearch_py_ml.ml_commons.rag_pipeline.rag.rag_setup.OpenSearch")
+    def test_initialize_opensearch_client_open_source_no_auth(self, mock_opensearch):
+        self.setup_instance.service_type = "open-source"
+        self.setup_instance.opensearch_endpoint = "http://localhost:9200"
+        self.setup_instance.opensearch_username = ""
+        self.setup_instance.opensearch_password = ""
+        result = self.setup_instance.initialize_opensearch_client()
+        self.assertTrue(result)
+        mock_opensearch.assert_called_once()
+
+    @patch("builtins.input", side_effect=["", "", "", "", "", "", "", ""])
+    def test_get_knn_index_details_all_defaults(self, mock_input):
+        details = self.setup_instance.get_knn_index_details()
+        self.assertEqual(
+            details,
+            (
+                768,
+                "l2",
+                512,
+                1,
+                2,
+                "passage_text",
+                "passage_chunk",
+                "passage_embedding",
+            ),
+        )
 
     def test_save_config(self):
-        with patch('builtins.open', unittest.mock.mock_open()) as mock_file:
-            self.setup_instance.save_config(self.sample_config)
-            mock_file.assert_called_with(self.setup_instance.CONFIG_FILE, 'w')
-            self.mock_configparser.write.assert_called()
+        config = {"key": "value", "another_key": "another_value"}
+        self.setup_instance.save_config(config)
+        parser = configparser.ConfigParser()
+        parser.read(Setup.CONFIG_FILE)
+        self.assertEqual(parser["DEFAULT"]["key"], "value")
+        self.assertEqual(parser["DEFAULT"]["another_key"], "another_value")
 
-    def test_get_opensearch_domain_name(self):
-        with patch.object(Setup, 'load_config', return_value=self.sample_config.copy()):
-            domain_name = self.setup_instance.get_opensearch_domain_name()
-            self.assertEqual(domain_name, 'hashim-test5')
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.rag_setup.OpenSearch')
-    def test_initialize_opensearch_client_managed(self, mock_opensearch):
-        with patch.object(Setup, 'load_config', return_value=self.sample_config.copy()):
-            self.setup_instance = Setup()
-            self.setup_instance.opensearch_username = '*****'
-            self.setup_instance.opensearch_password = 'password'
-            result = self.setup_instance.initialize_opensearch_client()
-            self.assertTrue(result)
-            mock_opensearch.assert_called_once()
-
-    def test_initialize_opensearch_client_no_endpoint(self):
-        self.setup_instance.opensearch_endpoint = ''
-        with patch('builtins.print') as mock_print:
-            result = self.setup_instance.initialize_opensearch_client()
-            self.assertFalse(result)
-            mock_print.assert_called_with(f"{Fore.RED}OpenSearch endpoint not set. Please run setup first.{Style.RESET_ALL}\n")
-
-    def test_verify_and_create_index_exists(self):
-        self.setup_instance.index_name = self.sample_config['index_name']
-        self.mock_opensearch_client.indices.exists.return_value = True
-        with patch('builtins.print') as mock_print:
-            result = self.setup_instance.verify_and_create_index(768, 'cosinesimil', 512)
-            self.assertTrue(result)
-            mock_print.assert_called_with(f"{Fore.GREEN}KNN index '{self.setup_instance.index_name}' already exists.{Style.RESET_ALL}\n")
-
-    def test_verify_and_create_index_create(self):
-        self.setup_instance.index_name = self.sample_config['index_name']
-        self.mock_opensearch_client.indices.exists.return_value = False
-        self.setup_instance.create_index = MagicMock()
-        with patch('builtins.print') as mock_print:
-            result = self.setup_instance.verify_and_create_index(768, 'cosinesimil', 512)
-            self.assertTrue(result)
-            self.setup_instance.create_index.assert_called_with(768, 'cosinesimil', 512)
-
-    def test_create_index_success(self):
-        with patch('builtins.print') as mock_print:
-            self.setup_instance.create_index(768, 'cosinesimil', 512)
-            self.mock_opensearch_client.indices.create.assert_called_once()
-            mock_print.assert_called_with(f"\n{Fore.GREEN}KNN index '{self.setup_instance.index_name}' created successfully with dimension 768, space type cosinesimil, and ef_construction 512.{Style.RESET_ALL}\n")
-
-    def test_create_index_already_exists(self):
-        self.mock_opensearch_client.indices.create.side_effect = Exception('resource_already_exists_exception')
-        with patch('builtins.print') as mock_print:
-            self.setup_instance.create_index(768, 'cosinesimil', 512)
-            mock_print.assert_called_with(f"\n{Fore.YELLOW}Index '{self.setup_instance.index_name}' already exists.{Style.RESET_ALL}\n")
-
-    def test_get_knn_index_details_default(self):
-        with patch('builtins.input', side_effect=['', '', '']):
-            with patch('builtins.print'):
-                embedding_dimension, space_type, ef_construction = self.setup_instance.get_knn_index_details()
-                self.assertEqual(embedding_dimension, 768)
-                self.assertEqual(space_type, 'l2')
-                self.assertEqual(ef_construction, 512)
-
-    def test_get_truncated_name_within_limit(self):
-        name = 'short-name'
-        truncated_name = self.setup_instance.get_truncated_name(name, max_length=32)
-        self.assertEqual(truncated_name, name)
-
-    def test_get_truncated_name_exceeds_limit(self):
-        name = 'a' * 35
-        truncated_name = self.setup_instance.get_truncated_name(name, max_length=32)
-        self.assertEqual(truncated_name, 'a' * 29 + '...')
-
-    def test_initialize_clients_success(self):
-        with patch.object(Setup, 'load_config', return_value=self.sample_config.copy()):
-            self.setup_instance = Setup()
-            self.setup_instance.service_type = 'managed'
-            with patch('boto3.client') as mock_boto_client:
-                mock_boto_client.return_value = MagicMock()
-                with patch('time.sleep'):
-                    with patch('builtins.print') as mock_print:
-                        result = self.setup_instance.initialize_clients()
-                        self.assertTrue(result)
-                        mock_print.assert_called_with(f"{Fore.GREEN}AWS clients initialized successfully.{Style.RESET_ALL}\n")
-
-    def test_initialize_clients_failure(self):
-        self.setup_instance.service_type = 'managed'
-        with patch('boto3.client', side_effect=Exception('Initialization failed')):
-            with patch('builtins.print') as mock_print:
-                result = self.setup_instance.initialize_clients()
-                self.assertFalse(result)
-                mock_print.assert_called_with(f"{Fore.RED}Failed to initialize AWS clients: Initialization failed{Style.RESET_ALL}")
-
-    def test_check_and_configure_aws_already_configured(self):
-        with patch('boto3.Session') as mock_session:
-            mock_session.return_value.get_credentials.return_value = MagicMock()
-            with patch('builtins.input', return_value='no'):
-                with patch('builtins.print') as mock_print:
-                    self.setup_instance.check_and_configure_aws()
-                    mock_print.assert_called_with("AWS credentials are already configured.")
-
-    def test_check_and_configure_aws_not_configured(self):
-        with patch('boto3.Session') as mock_session:
-            mock_session.return_value.get_credentials.return_value = None
-            self.setup_instance.configure_aws = MagicMock()
-            with patch('builtins.print'):
-                self.setup_instance.check_and_configure_aws()
-                self.setup_instance.configure_aws.assert_called_once()
-
-    def test_configure_aws(self):
-        with patch('builtins.input', side_effect=['AKIA...', 'SECRET...', 'us-west-2']):
-            with patch('subprocess.run') as mock_subprocess_run:
-                with patch('builtins.print') as mock_print:
-                    self.setup_instance.configure_aws()
-                    self.assertEqual(mock_subprocess_run.call_count, 3)
-                    mock_print.assert_called_with(f"{Fore.GREEN}AWS credentials have been successfully configured.{Style.RESET_ALL}")
-
-if __name__ == '__main__':
+if __name__ == "__main__":
     unittest.main()
diff --git a/tests/rag/test_serverless.py b/tests/rag/test_serverless.py
index 1792484a..c1ac97cd 100644
--- a/tests/rag/test_serverless.py
+++ b/tests/rag/test_serverless.py
@@ -6,16 +6,19 @@
 # GitHub history for details.
 
 import unittest
-from unittest.mock import patch, MagicMock, Mock
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless import Serverless
+from unittest.mock import MagicMock, patch
+
 from colorama import Fore, Style
 
+from opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless import Serverless
+
+
 class TestServerless(unittest.TestCase):
     def setUp(self):
         # Sample data
-        self.collection_name = 'test-collection'
-        self.iam_principal = 'arn:aws:iam::123456789012:user/test-user'
-        self.aws_region = 'us-east-1'
+        self.collection_name = "test-collection"
+        self.iam_principal = "arn:aws:iam::123456789012:user/test-user"
+        self.aws_region = "us-east-1"
 
         # Mock aoss_client
         self.aoss_client = MagicMock()
@@ -33,19 +36,25 @@ class ConflictException(Exception):
             aoss_client=self.aoss_client,
             collection_name=self.collection_name,
             iam_principal=self.iam_principal,
-            aws_region=self.aws_region
+            aws_region=self.aws_region,
         )
 
         # Mock sleep to speed up tests
-        self.sleep_patcher = patch('time.sleep', return_value=None)
+        self.sleep_patcher = patch("time.sleep", return_value=None)
         self.mock_sleep = self.sleep_patcher.start()
 
     def tearDown(self):
         self.sleep_patcher.stop()
 
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless.Serverless.create_access_policy')
-    @patch('opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless.Serverless.create_security_policy')
-    def test_create_security_policies_success(self, mock_create_security_policy, mock_create_access_policy):
+    @patch(
+        "opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless.Serverless.create_access_policy"
+    )
+    @patch(
+        "opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless.Serverless.create_security_policy"
+    )
+    def test_create_security_policies_success(
+        self, mock_create_security_policy, mock_create_access_policy
+    ):
         self.serverless.create_security_policies()
         # Check that create_security_policy is called twice (encryption and network)
         self.assertEqual(mock_create_security_policy.call_count, 2)
@@ -53,164 +62,191 @@ def test_create_security_policies_success(self, mock_create_security_policy, moc
         mock_create_access_policy.assert_called_once()
 
     def test_create_security_policy_success(self):
-        policy_type = 'encryption'
-        name = 'test-enc-policy'
-        description = 'Test encryption policy'
-        policy_body = '{}'
+        policy_type = "encryption"
+        name = "test-enc-policy"
+        description = "Test encryption policy"
+        policy_body = "{}"
         self.aoss_client.create_security_policy.return_value = {}
-        with patch('builtins.print') as mock_print:
-            self.serverless.create_security_policy(policy_type, name, description, policy_body)
+        with patch("builtins.print") as mock_print:
+            self.serverless.create_security_policy(
+                policy_type, name, description, policy_body
+            )
             self.aoss_client.create_security_policy.assert_called_with(
-                description=description,
-                name=name,
-                policy=policy_body,
-                type=policy_type
+                description=description, name=name, policy=policy_body, type=policy_type
+            )
+            mock_print.assert_called_with(
+                f"{Fore.GREEN}Encryption Policy '{name}' created successfully.{Style.RESET_ALL}"
             )
-            mock_print.assert_called_with(f"{Fore.GREEN}Encryption Policy '{name}' created successfully.{Style.RESET_ALL}")
 
     def test_create_security_policy_conflict(self):
-        policy_type = 'network'
-        name = 'test-net-policy'
-        description = 'Test network policy'
-        policy_body = '{}'
+        policy_type = "network"
+        name = "test-net-policy"
+        description = "Test network policy"
+        policy_body = "{}"
         # Simulate ConflictException
         conflict_exception = self.aoss_client.exceptions.ConflictException()
         self.aoss_client.create_security_policy.side_effect = conflict_exception
-        with patch('builtins.print') as mock_print:
-            self.serverless.create_security_policy(policy_type, name, description, policy_body)
-            mock_print.assert_called_with(f"{Fore.YELLOW}Network Policy '{name}' already exists.{Style.RESET_ALL}")
+        with patch("builtins.print") as mock_print:
+            self.serverless.create_security_policy(
+                policy_type, name, description, policy_body
+            )
+            mock_print.assert_called_with(
+                f"{Fore.YELLOW}Network Policy '{name}' already exists.{Style.RESET_ALL}"
+            )
 
     def test_create_security_policy_exception(self):
-        policy_type = 'invalid'
-        name = 'test-policy'
-        description = 'Test policy'
-        policy_body = '{}'
-        with patch('builtins.print') as mock_print:
-            self.serverless.create_security_policy(policy_type, name, description, policy_body)
-            mock_print.assert_called_with(f"{Fore.RED}Error creating {policy_type} policy '{name}': Invalid policy type specified.{Style.RESET_ALL}")
+        policy_type = "invalid"
+        name = "test-policy"
+        description = "Test policy"
+        policy_body = "{}"
+        with patch("builtins.print") as mock_print:
+            self.serverless.create_security_policy(
+                policy_type, name, description, policy_body
+            )
+            mock_print.assert_called_with(
+                f"{Fore.RED}Error creating {policy_type} policy '{name}': Invalid policy type specified.{Style.RESET_ALL}"
+            )
 
     def test_create_access_policy_success(self):
-        name = 'test-access-policy'
-        description = 'Test access policy'
-        policy_body = '{}'
+        name = "test-access-policy"
+        description = "Test access policy"
+        policy_body = "{}"
         self.aoss_client.create_access_policy.return_value = {}
-        with patch('builtins.print') as mock_print:
+        with patch("builtins.print") as mock_print:
             self.serverless.create_access_policy(name, description, policy_body)
             self.aoss_client.create_access_policy.assert_called_with(
-                description=description,
-                name=name,
-                policy=policy_body,
-                type='data'
+                description=description, name=name, policy=policy_body, type="data"
+            )
+            mock_print.assert_called_with(
+                f"{Fore.GREEN}Data Access Policy '{name}' created successfully.{Style.RESET_ALL}\n"
             )
-            mock_print.assert_called_with(f"{Fore.GREEN}Data Access Policy '{name}' created successfully.{Style.RESET_ALL}\n")
 
     def test_create_access_policy_conflict(self):
-        name = 'test-access-policy'
-        description = 'Test access policy'
-        policy_body = '{}'
+        name = "test-access-policy"
+        description = "Test access policy"
+        policy_body = "{}"
         # Simulate ConflictException
         conflict_exception = self.aoss_client.exceptions.ConflictException()
         self.aoss_client.create_access_policy.side_effect = conflict_exception
-        with patch('builtins.print') as mock_print:
+        with patch("builtins.print") as mock_print:
             self.serverless.create_access_policy(name, description, policy_body)
-            mock_print.assert_called_with(f"{Fore.YELLOW}Data Access Policy '{name}' already exists.{Style.RESET_ALL}\n")
+            mock_print.assert_called_with(
+                f"{Fore.YELLOW}Data Access Policy '{name}' already exists.{Style.RESET_ALL}\n"
+            )
 
     def test_create_collection_success(self):
         self.aoss_client.create_collection.return_value = {
-            'createCollectionDetail': {'id': 'collection-id-123'}
+            "createCollectionDetail": {"id": "collection-id-123"}
         }
-        with patch('builtins.print') as mock_print:
+        with patch("builtins.print") as mock_print:
             collection_id = self.serverless.create_collection(self.collection_name)
-            self.assertEqual(collection_id, 'collection-id-123')
-            mock_print.assert_called_with(f"{Fore.GREEN}Collection '{self.collection_name}' creation initiated.{Style.RESET_ALL}")
+            self.assertEqual(collection_id, "collection-id-123")
+            mock_print.assert_called_with(
+                f"{Fore.GREEN}Collection '{self.collection_name}' creation initiated.{Style.RESET_ALL}"
+            )
 
     def test_create_collection_conflict(self):
         # Simulate ConflictException
         conflict_exception = self.aoss_client.exceptions.ConflictException()
         self.aoss_client.create_collection.side_effect = conflict_exception
-        self.serverless.get_collection_id = MagicMock(return_value='existing-collection-id')
-        with patch('builtins.print') as mock_print:
+        self.serverless.get_collection_id = MagicMock(
+            return_value="existing-collection-id"
+        )
+        with patch("builtins.print") as mock_print:
             collection_id = self.serverless.create_collection(self.collection_name)
-            self.assertEqual(collection_id, 'existing-collection-id')
-            mock_print.assert_called_with(f"{Fore.YELLOW}Collection '{self.collection_name}' already exists.{Style.RESET_ALL}")
+            self.assertEqual(collection_id, "existing-collection-id")
+            mock_print.assert_called_with(
+                f"{Fore.YELLOW}Collection '{self.collection_name}' already exists.{Style.RESET_ALL}"
+            )
 
     def test_create_collection_exception_retry(self):
         # Simulate Exception on first two attempts, success on third
         self.aoss_client.create_collection.side_effect = [
-            Exception('Temporary error'),
-            Exception('Temporary error'),
-            {'createCollectionDetail': {'id': 'collection-id-123'}}
+            Exception("Temporary error"),
+            Exception("Temporary error"),
+            {"createCollectionDetail": {"id": "collection-id-123"}},
         ]
-        with patch('builtins.print'):
-            collection_id = self.serverless.create_collection(self.collection_name, max_retries=3)
-            self.assertEqual(collection_id, 'collection-id-123')
+        with patch("builtins.print"):
+            collection_id = self.serverless.create_collection(
+                self.collection_name, max_retries=3
+            )
+            self.assertEqual(collection_id, "collection-id-123")
             self.assertEqual(self.aoss_client.create_collection.call_count, 3)
 
     def test_get_collection_id_success(self):
         self.aoss_client.list_collections.return_value = {
-            'collectionSummaries': [
-                {'name': 'other-collection', 'id': 'other-id'},
-                {'name': self.collection_name, 'id': 'collection-id-123'}
+            "collectionSummaries": [
+                {"name": "other-collection", "id": "other-id"},
+                {"name": self.collection_name, "id": "collection-id-123"},
             ]
         }
         collection_id = self.serverless.get_collection_id(self.collection_name)
-        self.assertEqual(collection_id, 'collection-id-123')
+        self.assertEqual(collection_id, "collection-id-123")
 
     def test_get_collection_id_not_found(self):
         self.aoss_client.list_collections.return_value = {
-            'collectionSummaries': [
-                {'name': 'other-collection', 'id': 'other-id'}
-            ]
+            "collectionSummaries": [{"name": "other-collection", "id": "other-id"}]
         }
         collection_id = self.serverless.get_collection_id(self.collection_name)
         self.assertIsNone(collection_id)
 
     def test_wait_for_collection_active_success(self):
-        collection_id = 'collection-id-123'
+        collection_id = "collection-id-123"
         # Simulate 'CREATING' status, then 'ACTIVE'
         self.aoss_client.batch_get_collection.side_effect = [
-            {'collectionDetails': [{'status': 'CREATING'}]},
-            {'collectionDetails': [{'status': 'ACTIVE'}]}
+            {"collectionDetails": [{"status": "CREATING"}]},
+            {"collectionDetails": [{"status": "ACTIVE"}]},
         ]
-        with patch('builtins.print'):
-            result = self.serverless.wait_for_collection_active(collection_id, max_wait_minutes=1)
+        with patch("builtins.print"):
+            result = self.serverless.wait_for_collection_active(
+                collection_id, max_wait_minutes=1
+            )
             self.assertTrue(result)
             self.assertEqual(self.aoss_client.batch_get_collection.call_count, 2)
 
     def test_wait_for_collection_active_timeout(self):
-        collection_id = 'collection-id-123'
+        collection_id = "collection-id-123"
         # Simulate 'CREATING' status indefinitely
-        self.aoss_client.batch_get_collection.return_value = {'collectionDetails': [{'status': 'CREATING'}]}
-        with patch('builtins.print'):
-            result = self.serverless.wait_for_collection_active(collection_id, max_wait_minutes=0.01)
+        self.aoss_client.batch_get_collection.return_value = {
+            "collectionDetails": [{"status": "CREATING"}]
+        }
+        with patch("builtins.print"):
+            result = self.serverless.wait_for_collection_active(
+                collection_id, max_wait_minutes=0.01
+            )
             self.assertFalse(result)
 
     def test_get_collection_endpoint_success(self):
-        collection_id = 'collection-id-123'
+        collection_id = "collection-id-123"
         self.serverless.get_collection_id = MagicMock(return_value=collection_id)
         self.aoss_client.batch_get_collection.return_value = {
-            'collectionDetails': [{'collectionEndpoint': 'https://example-endpoint.com'}]
+            "collectionDetails": [
+                {"collectionEndpoint": "https://example-endpoint.com"}
+            ]
         }
-        with patch('builtins.print'):
+        with patch("builtins.print"):
             endpoint = self.serverless.get_collection_endpoint()
-            self.assertEqual(endpoint, 'https://example-endpoint.com')
+            self.assertEqual(endpoint, "https://example-endpoint.com")
 
     def test_get_collection_endpoint_collection_not_found(self):
         self.serverless.get_collection_id = MagicMock(return_value=None)
-        with patch('builtins.print') as mock_print:
+        with patch("builtins.print") as mock_print:
             endpoint = self.serverless.get_collection_endpoint()
             self.assertIsNone(endpoint)
-            mock_print.assert_called_with(f"{Fore.RED}Collection '{self.collection_name}' not found.{Style.RESET_ALL}\n")
+            mock_print.assert_called_with(
+                f"{Fore.RED}Collection '{self.collection_name}' not found.{Style.RESET_ALL}\n"
+            )
 
     def test_get_truncated_name_within_limit(self):
-        name = 'short-name'
+        name = "short-name"
         truncated_name = self.serverless.get_truncated_name(name, max_length=32)
         self.assertEqual(truncated_name, name)
 
     def test_get_truncated_name_exceeds_limit(self):
-        name = 'a' * 35
+        name = "a" * 35
         truncated_name = self.serverless.get_truncated_name(name, max_length=32)
-        self.assertEqual(truncated_name, 'a' * 29 + '...')
+        self.assertEqual(truncated_name, "a" * 29 + "...")
+
 
-if __name__ == '__main__':
-    unittest.main()
\ No newline at end of file
+if __name__ == "__main__":
+    unittest.main()

From 6a846ce2c349633918c499d77b479ef8fea8f27f Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Wed, 11 Dec 2024 15:38:22 -0600
Subject: [PATCH 35/42] Deleted serverless.py from rag functionality as we are
 not using it

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 .../ml_commons/rag_pipeline/rag/serverless.py | 302 ------------------
 1 file changed, 302 deletions(-)
 delete mode 100644 opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py

diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py
deleted file mode 100644
index cfcb2352..00000000
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/serverless.py
+++ /dev/null
@@ -1,302 +0,0 @@
-# SPDX-License-Identifier: Apache-2.0
-# The OpenSearch Contributors require contributions made to
-# this file be licensed under the Apache-2.0 license or a
-# compatible open source license.
-# Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
-
-import json
-import time
-
-from colorama import Fore, Style
-
-
-class Serverless:
-    def __init__(self, aoss_client, collection_name, iam_principal, aws_region):
-        """
-        Initialize the Serverless class with necessary AWS clients and configuration.
-
-        :param aoss_client: Boto3 client for OpenSearch Serverless
-        :param collection_name: Name of the OpenSearch collection
-        :param iam_principal: IAM Principal ARN
-        :param aws_region: AWS Region
-        """
-        self.aoss_client = aoss_client
-        self.collection_name = collection_name
-        self.iam_principal = iam_principal
-        self.aws_region = aws_region
-
-    def create_security_policies(self):
-        """
-        Create security policies for serverless OpenSearch.
-        """
-        encryption_policy = json.dumps(
-            {
-                "Rules": [
-                    {
-                        "Resource": [f"collection/{self.collection_name}"],
-                        "ResourceType": "collection",
-                    }
-                ],
-                "AWSOwnedKey": True,
-            }
-        )
-
-        network_policy = json.dumps(
-            [
-                {
-                    "Rules": [
-                        {
-                            "Resource": [f"collection/{self.collection_name}"],
-                            "ResourceType": "collection",
-                        }
-                    ],
-                    "AllowFromPublic": True,
-                }
-            ]
-        )
-
-        data_access_policy = json.dumps(
-            [
-                {
-                    "Rules": [
-                        {
-                            "Resource": ["collection/*"],
-                            "Permission": ["aoss:*"],
-                            "ResourceType": "collection",
-                        },
-                        {
-                            "Resource": ["index/*/*"],
-                            "Permission": ["aoss:*"],
-                            "ResourceType": "index",
-                        },
-                    ],
-                    "Principal": [self.iam_principal],
-                    "Description": f"Data access policy for {self.collection_name}",
-                }
-            ]
-        )
-
-        encryption_policy_name = self.get_truncated_name(
-            f"{self.collection_name}-enc-policy"
-        )
-        self.create_security_policy(
-            "encryption",
-            encryption_policy_name,
-            f"{self.collection_name} encryption security policy",
-            encryption_policy,
-        )
-        self.create_security_policy(
-            "network",
-            f"{self.collection_name}-net-policy",
-            f"{self.collection_name} network security policy",
-            network_policy,
-        )
-        self.create_access_policy(
-            self.get_truncated_name(f"{self.collection_name}-access-policy"),
-            f"{self.collection_name} data access policy",
-            data_access_policy,
-        )
-
-    def create_security_policy(self, policy_type, name, description, policy_body):
-        """
-        Create a specific security policy (encryption or network).
-
-        :param policy_type: Type of policy ('encryption' or 'network')
-        :param name: Name of the policy
-        :param description: Description of the policy
-        :param policy_body: JSON string of the policy
-        """
-        try:
-            if policy_type.lower() == "encryption":
-                self.aoss_client.create_security_policy(
-                    description=description,
-                    name=name,
-                    policy=policy_body,
-                    type="encryption",
-                )
-            elif policy_type.lower() == "network":
-                self.aoss_client.create_security_policy(
-                    description=description,
-                    name=name,
-                    policy=policy_body,
-                    type="network",
-                )
-            else:
-                raise ValueError("Invalid policy type specified.")
-            print(
-                f"{Fore.GREEN}{policy_type.capitalize()} Policy '{name}' created successfully.{Style.RESET_ALL}"
-            )
-        except self.aoss_client.exceptions.ConflictException:
-            print(
-                f"{Fore.YELLOW}{policy_type.capitalize()} Policy '{name}' already exists.{Style.RESET_ALL}"
-            )
-        except Exception as ex:
-            print(
-                f"{Fore.RED}Error creating {policy_type} policy '{name}': {ex}{Style.RESET_ALL}"
-            )
-
-    def create_access_policy(self, name, description, policy_body):
-        """
-        Create a data access policy.
-
-        :param name: Name of the access policy
-        :param description: Description of the access policy
-        :param policy_body: JSON string of the access policy
-        """
-        try:
-            self.aoss_client.create_access_policy(
-                description=description, name=name, policy=policy_body, type="data"
-            )
-            print(
-                f"{Fore.GREEN}Data Access Policy '{name}' created successfully.{Style.RESET_ALL}\n"
-            )
-        except self.aoss_client.exceptions.ConflictException:
-            print(
-                f"{Fore.YELLOW}Data Access Policy '{name}' already exists.{Style.RESET_ALL}\n"
-            )
-        except Exception as ex:
-            print(
-                f"{Fore.RED}Error creating data access policy '{name}': {ex}{Style.RESET_ALL}\n"
-            )
-
-    def create_collection(self, collection_name, max_retries=3):
-        """
-        Create an OpenSearch serverless collection.
-
-        :param collection_name: Name of the collection to create
-        :param max_retries: Maximum number of retries for creation
-        :return: Collection ID if successful, None otherwise
-        """
-        for attempt in range(max_retries):
-            try:
-                response = self.aoss_client.create_collection(
-                    description=f"{collection_name} collection",
-                    name=collection_name,
-                    type="VECTORSEARCH",
-                )
-                print(
-                    f"{Fore.GREEN}Collection '{collection_name}' creation initiated.{Style.RESET_ALL}"
-                )
-                return response["createCollectionDetail"]["id"]
-            except self.aoss_client.exceptions.ConflictException:
-                print(
-                    f"{Fore.YELLOW}Collection '{collection_name}' already exists.{Style.RESET_ALL}"
-                )
-                return self.get_collection_id(collection_name)
-            except Exception as ex:
-                print(
-                    f"{Fore.RED}Error creating collection '{collection_name}' (Attempt {attempt+1}/{max_retries}): {ex}{Style.RESET_ALL}"
-                )
-                if attempt == max_retries - 1:
-                    return None
-                time.sleep(5)
-        return None
-
-    def get_collection_id(self, collection_name):
-        """
-        Retrieve the ID of an existing collection.
-
-        :param collection_name: Name of the collection
-        :return: Collection ID if found, None otherwise
-        """
-        try:
-            response = self.aoss_client.list_collections()
-            for collection in response.get("collectionSummaries", []):
-                if collection.get("name") == collection_name:
-                    return collection.get("id")
-        except Exception as ex:
-            print(f"{Fore.RED}Error getting collection ID: {ex}{Style.RESET_ALL}")
-        return None
-
-    def wait_for_collection_active(self, collection_id, max_wait_minutes=30):
-        """
-        Wait for the collection to become active.
-
-        :param collection_id: ID of the collection
-        :param max_wait_minutes: Maximum wait time in minutes
-        :return: True if active, False otherwise
-        """
-        print(f"Waiting for collection '{self.collection_name}' to become active...")
-        start_time = time.time()
-        while time.time() - start_time < max_wait_minutes * 60:
-            try:
-                response = self.aoss_client.batch_get_collection(ids=[collection_id])
-                status = response["collectionDetails"][0]["status"]
-                if status == "ACTIVE":
-                    print(
-                        f"{Fore.GREEN}Collection '{self.collection_name}' is now active.{Style.RESET_ALL}\n"
-                    )
-                    return True
-                elif status in ["FAILED", "DELETED"]:
-                    print(
-                        f"{Fore.RED}Collection creation failed or was deleted. Status: {status}{Style.RESET_ALL}\n"
-                    )
-                    return False
-                else:
-                    print(f"Collection status: {status}. Waiting...")
-                    time.sleep(30)
-            except Exception as ex:
-                print(
-                    f"{Fore.RED}Error checking collection status: {ex}{Style.RESET_ALL}"
-                )
-                time.sleep(30)
-        print(
-            f"{Fore.RED}Timed out waiting for collection to become active after {max_wait_minutes} minutes.{Style.RESET_ALL}\n"
-        )
-        return False
-
-    def get_collection_endpoint(self):
-        """
-        Retrieve the endpoint URL for the OpenSearch collection.
-
-        :return: Collection endpoint URL if available, None otherwise
-        """
-        try:
-            collection_id = self.get_collection_id(self.collection_name)
-            if not collection_id:
-                print(
-                    f"{Fore.RED}Collection '{self.collection_name}' not found.{Style.RESET_ALL}\n"
-                )
-                return None
-
-            batch_get_response = self.aoss_client.batch_get_collection(
-                ids=[collection_id]
-            )
-            collection_details = batch_get_response.get("collectionDetails", [])
-
-            if not collection_details:
-                print(
-                    f"{Fore.RED}No details found for collection ID '{collection_id}'.{Style.RESET_ALL}\n"
-                )
-                return None
-
-            endpoint = collection_details[0].get("collectionEndpoint")
-            if endpoint:
-                print(
-                    f"Collection '{self.collection_name}' has endpoint URL: {endpoint}\n"
-                )
-                return endpoint
-            else:
-                print(
-                    f"{Fore.RED}No endpoint URL found in collection '{self.collection_name}'.{Style.RESET_ALL}\n"
-                )
-                return None
-        except Exception as ex:
-            print(
-                f"{Fore.RED}Error retrieving collection endpoint: {ex}{Style.RESET_ALL}\n"
-            )
-            return None
-
-    @staticmethod
-    def get_truncated_name(base_name, max_length=32):
-        """
-        Truncate a name to fit within a specified length.
-
-        :param base_name: Original name
-        :param max_length: Maximum allowed length
-        :return: Truncated name
-        """
-        if len(base_name) <= max_length:
-            return base_name
-        return base_name[: max_length - 3] + "..."

From 6f17670713b5330a61288412b1c5bc6e12339750 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Thu, 12 Dec 2024 11:12:23 -0600
Subject: [PATCH 36/42] deleted unused dependcies, and test.py for serverless

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 tests/rag/test_serverless.py | 252 -----------------------------------
 1 file changed, 252 deletions(-)
 delete mode 100644 tests/rag/test_serverless.py

diff --git a/tests/rag/test_serverless.py b/tests/rag/test_serverless.py
deleted file mode 100644
index c1ac97cd..00000000
--- a/tests/rag/test_serverless.py
+++ /dev/null
@@ -1,252 +0,0 @@
-# SPDX-License-Identifier: Apache-2.0
-# The OpenSearch Contributors require contributions made to
-# this file be licensed under the Apache-2.0 license or a
-# compatible open source license.
-# Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
-
-import unittest
-from unittest.mock import MagicMock, patch
-
-from colorama import Fore, Style
-
-from opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless import Serverless
-
-
-class TestServerless(unittest.TestCase):
-    def setUp(self):
-        # Sample data
-        self.collection_name = "test-collection"
-        self.iam_principal = "arn:aws:iam::123456789012:user/test-user"
-        self.aws_region = "us-east-1"
-
-        # Mock aoss_client
-        self.aoss_client = MagicMock()
-
-        # Define a custom ConflictException class
-        class ConflictException(Exception):
-            pass
-
-        # Mock exceptions
-        self.aoss_client.exceptions = MagicMock()
-        self.aoss_client.exceptions.ConflictException = ConflictException
-
-        # Initialize the Serverless instance
-        self.serverless = Serverless(
-            aoss_client=self.aoss_client,
-            collection_name=self.collection_name,
-            iam_principal=self.iam_principal,
-            aws_region=self.aws_region,
-        )
-
-        # Mock sleep to speed up tests
-        self.sleep_patcher = patch("time.sleep", return_value=None)
-        self.mock_sleep = self.sleep_patcher.start()
-
-    def tearDown(self):
-        self.sleep_patcher.stop()
-
-    @patch(
-        "opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless.Serverless.create_access_policy"
-    )
-    @patch(
-        "opensearch_py_ml.ml_commons.rag_pipeline.rag.serverless.Serverless.create_security_policy"
-    )
-    def test_create_security_policies_success(
-        self, mock_create_security_policy, mock_create_access_policy
-    ):
-        self.serverless.create_security_policies()
-        # Check that create_security_policy is called twice (encryption and network)
-        self.assertEqual(mock_create_security_policy.call_count, 2)
-        # Check that create_access_policy is called once
-        mock_create_access_policy.assert_called_once()
-
-    def test_create_security_policy_success(self):
-        policy_type = "encryption"
-        name = "test-enc-policy"
-        description = "Test encryption policy"
-        policy_body = "{}"
-        self.aoss_client.create_security_policy.return_value = {}
-        with patch("builtins.print") as mock_print:
-            self.serverless.create_security_policy(
-                policy_type, name, description, policy_body
-            )
-            self.aoss_client.create_security_policy.assert_called_with(
-                description=description, name=name, policy=policy_body, type=policy_type
-            )
-            mock_print.assert_called_with(
-                f"{Fore.GREEN}Encryption Policy '{name}' created successfully.{Style.RESET_ALL}"
-            )
-
-    def test_create_security_policy_conflict(self):
-        policy_type = "network"
-        name = "test-net-policy"
-        description = "Test network policy"
-        policy_body = "{}"
-        # Simulate ConflictException
-        conflict_exception = self.aoss_client.exceptions.ConflictException()
-        self.aoss_client.create_security_policy.side_effect = conflict_exception
-        with patch("builtins.print") as mock_print:
-            self.serverless.create_security_policy(
-                policy_type, name, description, policy_body
-            )
-            mock_print.assert_called_with(
-                f"{Fore.YELLOW}Network Policy '{name}' already exists.{Style.RESET_ALL}"
-            )
-
-    def test_create_security_policy_exception(self):
-        policy_type = "invalid"
-        name = "test-policy"
-        description = "Test policy"
-        policy_body = "{}"
-        with patch("builtins.print") as mock_print:
-            self.serverless.create_security_policy(
-                policy_type, name, description, policy_body
-            )
-            mock_print.assert_called_with(
-                f"{Fore.RED}Error creating {policy_type} policy '{name}': Invalid policy type specified.{Style.RESET_ALL}"
-            )
-
-    def test_create_access_policy_success(self):
-        name = "test-access-policy"
-        description = "Test access policy"
-        policy_body = "{}"
-        self.aoss_client.create_access_policy.return_value = {}
-        with patch("builtins.print") as mock_print:
-            self.serverless.create_access_policy(name, description, policy_body)
-            self.aoss_client.create_access_policy.assert_called_with(
-                description=description, name=name, policy=policy_body, type="data"
-            )
-            mock_print.assert_called_with(
-                f"{Fore.GREEN}Data Access Policy '{name}' created successfully.{Style.RESET_ALL}\n"
-            )
-
-    def test_create_access_policy_conflict(self):
-        name = "test-access-policy"
-        description = "Test access policy"
-        policy_body = "{}"
-        # Simulate ConflictException
-        conflict_exception = self.aoss_client.exceptions.ConflictException()
-        self.aoss_client.create_access_policy.side_effect = conflict_exception
-        with patch("builtins.print") as mock_print:
-            self.serverless.create_access_policy(name, description, policy_body)
-            mock_print.assert_called_with(
-                f"{Fore.YELLOW}Data Access Policy '{name}' already exists.{Style.RESET_ALL}\n"
-            )
-
-    def test_create_collection_success(self):
-        self.aoss_client.create_collection.return_value = {
-            "createCollectionDetail": {"id": "collection-id-123"}
-        }
-        with patch("builtins.print") as mock_print:
-            collection_id = self.serverless.create_collection(self.collection_name)
-            self.assertEqual(collection_id, "collection-id-123")
-            mock_print.assert_called_with(
-                f"{Fore.GREEN}Collection '{self.collection_name}' creation initiated.{Style.RESET_ALL}"
-            )
-
-    def test_create_collection_conflict(self):
-        # Simulate ConflictException
-        conflict_exception = self.aoss_client.exceptions.ConflictException()
-        self.aoss_client.create_collection.side_effect = conflict_exception
-        self.serverless.get_collection_id = MagicMock(
-            return_value="existing-collection-id"
-        )
-        with patch("builtins.print") as mock_print:
-            collection_id = self.serverless.create_collection(self.collection_name)
-            self.assertEqual(collection_id, "existing-collection-id")
-            mock_print.assert_called_with(
-                f"{Fore.YELLOW}Collection '{self.collection_name}' already exists.{Style.RESET_ALL}"
-            )
-
-    def test_create_collection_exception_retry(self):
-        # Simulate Exception on first two attempts, success on third
-        self.aoss_client.create_collection.side_effect = [
-            Exception("Temporary error"),
-            Exception("Temporary error"),
-            {"createCollectionDetail": {"id": "collection-id-123"}},
-        ]
-        with patch("builtins.print"):
-            collection_id = self.serverless.create_collection(
-                self.collection_name, max_retries=3
-            )
-            self.assertEqual(collection_id, "collection-id-123")
-            self.assertEqual(self.aoss_client.create_collection.call_count, 3)
-
-    def test_get_collection_id_success(self):
-        self.aoss_client.list_collections.return_value = {
-            "collectionSummaries": [
-                {"name": "other-collection", "id": "other-id"},
-                {"name": self.collection_name, "id": "collection-id-123"},
-            ]
-        }
-        collection_id = self.serverless.get_collection_id(self.collection_name)
-        self.assertEqual(collection_id, "collection-id-123")
-
-    def test_get_collection_id_not_found(self):
-        self.aoss_client.list_collections.return_value = {
-            "collectionSummaries": [{"name": "other-collection", "id": "other-id"}]
-        }
-        collection_id = self.serverless.get_collection_id(self.collection_name)
-        self.assertIsNone(collection_id)
-
-    def test_wait_for_collection_active_success(self):
-        collection_id = "collection-id-123"
-        # Simulate 'CREATING' status, then 'ACTIVE'
-        self.aoss_client.batch_get_collection.side_effect = [
-            {"collectionDetails": [{"status": "CREATING"}]},
-            {"collectionDetails": [{"status": "ACTIVE"}]},
-        ]
-        with patch("builtins.print"):
-            result = self.serverless.wait_for_collection_active(
-                collection_id, max_wait_minutes=1
-            )
-            self.assertTrue(result)
-            self.assertEqual(self.aoss_client.batch_get_collection.call_count, 2)
-
-    def test_wait_for_collection_active_timeout(self):
-        collection_id = "collection-id-123"
-        # Simulate 'CREATING' status indefinitely
-        self.aoss_client.batch_get_collection.return_value = {
-            "collectionDetails": [{"status": "CREATING"}]
-        }
-        with patch("builtins.print"):
-            result = self.serverless.wait_for_collection_active(
-                collection_id, max_wait_minutes=0.01
-            )
-            self.assertFalse(result)
-
-    def test_get_collection_endpoint_success(self):
-        collection_id = "collection-id-123"
-        self.serverless.get_collection_id = MagicMock(return_value=collection_id)
-        self.aoss_client.batch_get_collection.return_value = {
-            "collectionDetails": [
-                {"collectionEndpoint": "https://example-endpoint.com"}
-            ]
-        }
-        with patch("builtins.print"):
-            endpoint = self.serverless.get_collection_endpoint()
-            self.assertEqual(endpoint, "https://example-endpoint.com")
-
-    def test_get_collection_endpoint_collection_not_found(self):
-        self.serverless.get_collection_id = MagicMock(return_value=None)
-        with patch("builtins.print") as mock_print:
-            endpoint = self.serverless.get_collection_endpoint()
-            self.assertIsNone(endpoint)
-            mock_print.assert_called_with(
-                f"{Fore.RED}Collection '{self.collection_name}' not found.{Style.RESET_ALL}\n"
-            )
-
-    def test_get_truncated_name_within_limit(self):
-        name = "short-name"
-        truncated_name = self.serverless.get_truncated_name(name, max_length=32)
-        self.assertEqual(truncated_name, name)
-
-    def test_get_truncated_name_exceeds_limit(self):
-        name = "a" * 35
-        truncated_name = self.serverless.get_truncated_name(name, max_length=32)
-        self.assertEqual(truncated_name, "a" * 29 + "...")
-
-
-if __name__ == "__main__":
-    unittest.main()

From 120169f2eddb0477edec9e6508cebb2679cce1e5 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 13 Dec 2024 09:23:16 -0600
Subject: [PATCH 37/42] Fixed failing test

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 setup.py                    | 2 --
 tests/rag/test_rag_setup.py | 5 ++++-
 2 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/setup.py b/setup.py
index 4130e165..13810501 100644
--- a/setup.py
+++ b/setup.py
@@ -88,8 +88,6 @@
         "numpy>=1.24.0,<2",
         "deprecated>=1.2.14,<2",
         # Additional dependencies for the RAG pipeline
-        "torch>=2.0.1,<2.1.0",
-        "onnx>=1.15.0",
         "accelerate>=0.27",
         "sentence_transformers>=2.5.0,<2.6",
         "tqdm>=4.66.0,<5",
diff --git a/tests/rag/test_rag_setup.py b/tests/rag/test_rag_setup.py
index 0f98d567..81de8952 100644
--- a/tests/rag/test_rag_setup.py
+++ b/tests/rag/test_rag_setup.py
@@ -49,10 +49,13 @@ def test_load_config_with_file(self):
         self.assertEqual(config.get("region"), "us-east-1")
         self.assertEqual(config.get("service_type"), "managed")
 
+    @patch("termios.tcsetattr")
+    @patch("termios.tcgetattr", return_value=[0,0,0,0,0,0])
     @patch("sys.stdin")
     @patch("sys.stdout")
-    def test_get_password_with_asterisks(self, mock_stdout, mock_stdin):
+    def test_get_password_with_asterisks(self, mock_stdout, mock_stdin, mock_tcgetattr, mock_tcsetattr):
         mock_stdin.fileno.return_value = 0
+        mock_stdin.isatty = MagicMock(return_value=True)
         mock_stdin.read = MagicMock(side_effect=list("secret\n"))
         pwd = self.setup_instance.get_password_with_asterisks("Enter password: ")
         self.assertEqual(pwd, "secret")

From 91c9af0a4e3d0db79f79371322139f8f190790ad Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 13 Dec 2024 10:11:47 -0600
Subject: [PATCH 38/42] Fixed tests

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 tests/rag/test_rag_setup.py | 10 ----------
 1 file changed, 10 deletions(-)

diff --git a/tests/rag/test_rag_setup.py b/tests/rag/test_rag_setup.py
index 81de8952..1db779ec 100644
--- a/tests/rag/test_rag_setup.py
+++ b/tests/rag/test_rag_setup.py
@@ -49,16 +49,6 @@ def test_load_config_with_file(self):
         self.assertEqual(config.get("region"), "us-east-1")
         self.assertEqual(config.get("service_type"), "managed")
 
-    @patch("termios.tcsetattr")
-    @patch("termios.tcgetattr", return_value=[0,0,0,0,0,0])
-    @patch("sys.stdin")
-    @patch("sys.stdout")
-    def test_get_password_with_asterisks(self, mock_stdout, mock_stdin, mock_tcgetattr, mock_tcsetattr):
-        mock_stdin.fileno.return_value = 0
-        mock_stdin.isatty = MagicMock(return_value=True)
-        mock_stdin.read = MagicMock(side_effect=list("secret\n"))
-        pwd = self.setup_instance.get_password_with_asterisks("Enter password: ")
-        self.assertEqual(pwd, "secret")
 
     @patch("builtins.input", side_effect=["2", "", "no", "2", ""])
     def test_setup_configuration_open_source_no_auth(self, mock_input):

From 82e69f56f5947b42e72dff5bbc1d405e9298db26 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Fri, 13 Dec 2024 14:58:31 -0600
Subject: [PATCH 39/42] Fixed tests

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 tests/rag/test_rag_setup.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/tests/rag/test_rag_setup.py b/tests/rag/test_rag_setup.py
index 1db779ec..fc210995 100644
--- a/tests/rag/test_rag_setup.py
+++ b/tests/rag/test_rag_setup.py
@@ -49,7 +49,6 @@ def test_load_config_with_file(self):
         self.assertEqual(config.get("region"), "us-east-1")
         self.assertEqual(config.get("service_type"), "managed")
 
-
     @patch("builtins.input", side_effect=["2", "", "no", "2", ""])
     def test_setup_configuration_open_source_no_auth(self, mock_input):
         self.setup_instance.setup_configuration()

From c0114c355e68898d78bdd0fd65e06f32e460709b Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Tue, 7 Jan 2025 14:25:55 -0800
Subject: [PATCH 40/42] Addressed comments like making code less redudent, and
 combining methods

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 opensearch_py_ml/ml_commons/IAMRoleHelper.py  | 234 ++++++++----------
 opensearch_py_ml/ml_commons/SecretsHelper.py  |  86 +++----
 .../ml_commons/rag_pipeline/__init__.py       |   7 -
 .../ml_commons/rag_pipeline/rag/__init__.py   |   7 -
 .../ml_commons/rag_pipeline/rag/rag_setup.py  |  35 +++
 setup.py                                      |   1 +
 6 files changed, 174 insertions(+), 196 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/IAMRoleHelper.py b/opensearch_py_ml/ml_commons/IAMRoleHelper.py
index 53feb1a8..1530b914 100644
--- a/opensearch_py_ml/ml_commons/IAMRoleHelper.py
+++ b/opensearch_py_ml/ml_commons/IAMRoleHelper.py
@@ -2,10 +2,13 @@
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
-# Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
+# Any modifications Copyright OpenSearch Contributors.
+# See GitHub history for details.
 
 import json
+import logging
+import uuid
+from datetime import datetime
 
 import boto3
 import requests
@@ -23,9 +26,6 @@ def __init__(
         opensearch_domain_url=None,
         opensearch_domain_username=None,
         opensearch_domain_password=None,
-        aws_user_name=None,
-        aws_role_name=None,
-        opensearch_domain_arn=None,
     ):
         """
         Initialize the IAMRoleHelper with AWS and OpenSearch configurations.
@@ -34,17 +34,14 @@ def __init__(
         :param opensearch_domain_url: URL of the OpenSearch domain.
         :param opensearch_domain_username: Username for OpenSearch domain authentication.
         :param opensearch_domain_password: Password for OpenSearch domain authentication.
-        :param aws_user_name: AWS IAM user name.
-        :param aws_role_name: AWS IAM role name.
-        :param opensearch_domain_arn: ARN of the OpenSearch domain.
         """
         self.region = region
         self.opensearch_domain_url = opensearch_domain_url
         self.opensearch_domain_username = opensearch_domain_username
         self.opensearch_domain_password = opensearch_domain_password
-        self.aws_user_name = aws_user_name
-        self.aws_role_name = aws_role_name
-        self.opensearch_domain_arn = opensearch_domain_arn
+
+        self.iam_client = boto3.client("iam", region_name=self.region)
+        self.sts_client = boto3.client("sts", region_name=self.region)
 
     def role_exists(self, role_name):
         """
@@ -53,17 +50,15 @@ def role_exists(self, role_name):
         :param role_name: Name of the IAM role.
         :return: True if the role exists, False otherwise.
         """
-        iam_client = boto3.client("iam")
-
         try:
-            iam_client.get_role(RoleName=role_name)
+            self.iam_client.get_role(RoleName=role_name)
             return True
         except ClientError as e:
             if e.response["Error"]["Code"] == "NoSuchEntity":
-                return False
+                print(f"The requested role '{role_name}' does not exist.")
             else:
                 print(f"An error occurred: {e}")
-                return False
+            return False
 
     def delete_role(self, role_name):
         """
@@ -71,53 +66,56 @@ def delete_role(self, role_name):
 
         :param role_name: Name of the IAM role to delete.
         """
-        iam_client = boto3.client("iam")
-
         try:
-            # Detach managed policies from the role
-            policies = iam_client.list_attached_role_policies(RoleName=role_name)[
+            # Detach any managed policies from the role
+            policies = self.iam_client.list_attached_role_policies(RoleName=role_name)[
                 "AttachedPolicies"
             ]
             for policy in policies:
-                iam_client.detach_role_policy(
+                self.iam_client.detach_role_policy(
                     RoleName=role_name, PolicyArn=policy["PolicyArn"]
                 )
-            print(f"All managed policies detached from role {role_name}.")
+            print(f"All managed policies detached from role '{role_name}'.")
 
             # Delete inline policies associated with the role
-            inline_policies = iam_client.list_role_policies(RoleName=role_name)[
+            inline_policies = self.iam_client.list_role_policies(RoleName=role_name)[
                 "PolicyNames"
             ]
             for policy_name in inline_policies:
-                iam_client.delete_role_policy(
+                self.iam_client.delete_role_policy(
                     RoleName=role_name, PolicyName=policy_name
                 )
-            print(f"All inline policies deleted from role {role_name}.")
+            print(f"All inline policies deleted from role '{role_name}'.")
 
             # Finally, delete the IAM role
-            iam_client.delete_role(RoleName=role_name)
-            print(f"Role {role_name} deleted.")
+            self.iam_client.delete_role(RoleName=role_name)
+            print(f"Role '{role_name}' deleted.")
 
         except ClientError as e:
             if e.response["Error"]["Code"] == "NoSuchEntity":
-                print(f"Role {role_name} does not exist.")
+                print(f"Role '{role_name}' does not exist.")
             else:
                 print(f"An error occurred: {e}")
 
-    def create_iam_role(self, role_name, trust_policy_json, inline_policy_json):
+    def create_iam_role(
+        self,
+        role_name,
+        trust_policy_json,
+        inline_policy_json,
+        policy_name=None,
+    ):
         """
         Create a new IAM role with specified trust and inline policies.
 
         :param role_name: Name of the IAM role to create.
         :param trust_policy_json: Trust policy document in JSON format.
         :param inline_policy_json: Inline policy document in JSON format.
+        :param policy_name: Optional. If not provided, a unique one will be generated.
         :return: ARN of the created role or None if creation failed.
         """
-        iam_client = boto3.client("iam")
-
         try:
             # Create the role with the provided trust policy
-            create_role_response = iam_client.create_role(
+            create_role_response = self.iam_client.create_role(
                 RoleName=role_name,
                 AssumeRolePolicyDocument=json.dumps(trust_policy_json),
                 Description="Role with custom trust and inline policies",
@@ -126,84 +124,75 @@ def create_iam_role(self, role_name, trust_policy_json, inline_policy_json):
             # Retrieve the ARN of the newly created role
             role_arn = create_role_response["Role"]["Arn"]
 
+            # If policy_name is not provided, generate a unique one
+            if not policy_name:
+                timestamp = datetime.utcnow().strftime('%Y%m%d%H%M%S')
+                policy_name = f"InlinePolicy-{role_name}-{timestamp}"
+
             # Attach the inline policy to the role
-            iam_client.put_role_policy(
+            self.iam_client.put_role_policy(
                 RoleName=role_name,
-                PolicyName="InlinePolicy",  # Replace with preferred policy name if needed
+                PolicyName=policy_name,
                 PolicyDocument=json.dumps(inline_policy_json),
             )
 
-            print(f"Created role: {role_name}")
+            print(f"Created role: {role_name} with inline policy: {policy_name}")
             return role_arn
 
         except ClientError as e:
             print(f"Error creating the role: {e}")
             return None
 
-    def get_role_arn(self, role_name):
+    def get_role_info(self, role_name, include_details=False):
         """
-        Retrieve the ARN of an IAM role.
+        Retrieve information about an IAM role.
 
         :param role_name: Name of the IAM role.
-        :return: ARN of the role or None if not found.
+        :param include_details: If False, returns only the role's ARN.
+                               If True, returns a dictionary with full role details.
+        :return: ARN or dict of role details. Returns None if not found.
         """
         if not role_name:
             return None
-        iam_client = boto3.client("iam")
-        try:
-            response = iam_client.get_role(RoleName=role_name)
-            return response["Role"]["Arn"]
-        except ClientError as e:
-            if e.response["Error"]["Code"] == "NoSuchEntity":
-                print(f"The requested role {role_name} does not exist")
-                return None
-            else:
-                print(f"An error occurred: {e}")
-                return None
-
-    def get_role_details(self, role_name):
-        """
-        Print detailed information about an IAM role.
-
-        :param role_name: Name of the IAM role.
-        """
-        iam = boto3.client("iam")
 
         try:
-            response = iam.get_role(RoleName=role_name)
+            response = self.iam_client.get_role(RoleName=role_name)
             role = response["Role"]
-
-            print(f"Role Name: {role['RoleName']}")
-            print(f"Role ID: {role['RoleId']}")
-            print(f"ARN: {role['Arn']}")
-            print(f"Creation Date: {role['CreateDate']}")
-            print("Assume Role Policy Document:")
-            print(
-                json.dumps(role["AssumeRolePolicyDocument"], indent=4, sort_keys=True)
+            role_arn = role["Arn"]
+
+            if not include_details:
+                return role_arn
+
+            # Build a detailed dictionary
+            role_details = {
+                "RoleName": role["RoleName"],
+                "RoleId": role["RoleId"],
+                "Arn": role_arn,
+                "CreationDate": role["CreateDate"],
+                "AssumeRolePolicyDocument": role["AssumeRolePolicyDocument"],
+                "InlinePolicies": {},
+            }
+
+            # List and retrieve any inline policies
+            list_role_policies_response = self.iam_client.list_role_policies(
+                RoleName=role_name
             )
-
-            # List and print all inline policies attached to the role
-            list_role_policies_response = iam.list_role_policies(RoleName=role_name)
-
             for policy_name in list_role_policies_response["PolicyNames"]:
-                get_role_policy_response = iam.get_role_policy(
+                get_role_policy_response = self.iam_client.get_role_policy(
                     RoleName=role_name, PolicyName=policy_name
                 )
-                print(f"Role Policy Name: {get_role_policy_response['PolicyName']}")
-                print("Role Policy Document:")
-                print(
-                    json.dumps(
-                        get_role_policy_response["PolicyDocument"],
-                        indent=4,
-                        sort_keys=True,
-                    )
-                )
+                role_details["InlinePolicies"][policy_name] = get_role_policy_response[
+                    "PolicyDocument"
+                ]
+
+            return role_details
 
         except ClientError as e:
             if e.response["Error"]["Code"] == "NoSuchEntity":
-                print(f"Role {role_name} does not exist.")
+                print(f"Role '{role_name}' does not exist.")
             else:
                 print(f"An error occurred: {e}")
+            return None
 
     def get_user_arn(self, username):
         """
@@ -214,29 +203,34 @@ def get_user_arn(self, username):
         """
         if not username:
             return None
-        iam_client = boto3.client("iam")
-
         try:
-            response = iam_client.get_user(UserName=username)
-            user_arn = response["User"]["Arn"]
-            return user_arn
+            response = self.iam_client.get_user(UserName=username)
+            return response["User"]["Arn"]
         except ClientError as e:
             if e.response["Error"]["Code"] == "NoSuchEntity":
                 print(f"IAM user '{username}' not found.")
-                return None
             else:
                 print(f"An error occurred: {e}")
-                return None
+            return None
 
-    def assume_role(self, role_arn, role_session_name="your_session_name"):
+    def assume_role(self, role_arn, role_session_name=None, session=None):
         """
         Assume an IAM role and obtain temporary security credentials.
 
         :param role_arn: ARN of the IAM role to assume.
         :param role_session_name: Identifier for the assumed role session.
-        :return: Temporary security credentials or None if the operation fails.
+        :param session: Optional boto3 session object. Defaults to the class-level sts_client.
+        :return: Dictionary with temporary security credentials and metadata, or None on failure.
         """
-        sts_client = boto3.client("sts")
+        if not role_arn:
+            logging.error("Role ARN is required.")
+            return None
+
+        # Use the provided session's STS client or fall back to the class-level sts_client
+        sts_client = session.client("sts") if session else self.sts_client
+
+        # Generate a default session name if none is provided
+        role_session_name = role_session_name or f"session-{uuid.uuid4()}"
 
         try:
             assumed_role_object = sts_client.assume_role(
@@ -244,48 +238,27 @@ def assume_role(self, role_arn, role_session_name="your_session_name"):
                 RoleSessionName=role_session_name,
             )
 
-            # Extract temporary credentials from the assumed role
             temp_credentials = assumed_role_object["Credentials"]
+            expiration = temp_credentials["Expiration"]
 
-            return temp_credentials
-        except ClientError as e:
-            print(f"Error assuming role: {e}")
-            return None
-
-    def map_iam_role_to_backend_role(self, iam_role_arn):
-        """
-        Map an IAM role to an OpenSearch backend role for access control.
-
-        :param iam_role_arn: ARN of the IAM role to map.
-        """
-        os_security_role = (
-            "ml_full_access"  # Defines the OpenSearch security role to map to
-        )
-        url = f"{self.opensearch_domain_url}/_plugins/_security/api/rolesmapping/{os_security_role}"
-
-        payload = {"backend_roles": [iam_role_arn]}
-        headers = {"Content-Type": "application/json"}
-
-        try:
-            response = requests.put(
-                url,
-                auth=(self.opensearch_domain_username, self.opensearch_domain_password),
-                json=payload,
-                headers=headers,
-                verify=True,
+            logging.info(
+                f"Assumed role: {role_arn}. Temporary credentials valid until: {expiration}"
             )
 
-            if response.status_code == 200:
-                print(
-                    f"Successfully mapped IAM role to OpenSearch role '{os_security_role}'."
-                )
-            else:
-                print(
-                    f"Failed to map IAM role to OpenSearch role '{os_security_role}'. Status code: {response.status_code}"
-                )
-                print(f"Response: {response.text}")
-        except requests.exceptions.RequestException as e:
-            print(f"HTTP request failed: {e}")
+            return {
+                "credentials": {
+                    "AccessKeyId": temp_credentials["AccessKeyId"],
+                    "SecretAccessKey": temp_credentials["SecretAccessKey"],
+                    "SessionToken": temp_credentials["SessionToken"],
+                },
+                "expiration": expiration,
+                "session_name": role_session_name,
+            }
+
+        except ClientError as e:
+            error_code = e.response["Error"]["Code"]
+            logging.error(f"Error assuming role {role_arn}: {error_code} - {e}")
+            return None
 
     def get_iam_user_name_from_arn(self, iam_principal_arn):
         """
@@ -297,5 +270,4 @@ def get_iam_user_name_from_arn(self, iam_principal_arn):
         # IAM user ARN format: arn:aws:iam::123456789012:user/user-name
         if iam_principal_arn and ":user/" in iam_principal_arn:
             return iam_principal_arn.split(":user/")[-1]
-        else:
-            return None
+        return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/SecretsHelper.py b/opensearch_py_ml/ml_commons/SecretsHelper.py
index bd3303e0..a828c80a 100644
--- a/opensearch_py_ml/ml_commons/SecretsHelper.py
+++ b/opensearch_py_ml/ml_commons/SecretsHelper.py
@@ -2,8 +2,8 @@
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
-# Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
+# Any modifications Copyright OpenSearch
+# Contributors. See GitHub history for details.
 
 import json
 import logging
@@ -18,29 +18,27 @@
 class SecretHelper:
     """
     Helper class for managing secrets in AWS Secrets Manager.
-    Provides methods to check existence, retrieve ARN, get secret values, and create new secrets.
+    Provides methods to check existence, retrieve details, and create secrets.
     """
 
     def __init__(self, region: str):
         """
         Initialize the SecretHelper with the specified AWS region.
-
         :param region: AWS region where the Secrets Manager is located.
         """
         self.region = region
+        # Create the Secrets Manager client once at the class level
+        self.secretsmanager = boto3.client("secretsmanager", region_name=self.region)
 
     def secret_exists(self, secret_name: str) -> bool:
         """
         Check if a secret with the given name exists in AWS Secrets Manager.
-
         :param secret_name: Name of the secret to check.
         :return: True if the secret exists, False otherwise.
         """
-        # Initialize the Secrets Manager client
-        secretsmanager = boto3.client("secretsmanager", region_name=self.region)
         try:
             # Attempt to retrieve the secret value
-            secretsmanager.get_secret_value(SecretId=secret_name)
+            self.secretsmanager.get_secret_value(SecretId=secret_name)
             return True
         except ClientError as e:
             # If the secret does not exist, return False
@@ -51,72 +49,58 @@ def secret_exists(self, secret_name: str) -> bool:
                 logger.error(f"An error occurred: {e}")
                 return False
 
-    def get_secret_arn(self, secret_name: str) -> str:
+    def get_secret_details(self, secret_name: str, fetch_value: bool = False) -> dict:
         """
-        Retrieve the ARN of a secret in AWS Secrets Manager.
+        Retrieve details of a secret from AWS Secrets Manager.
+        Optionally fetch the secret value as well.
 
         :param secret_name: Name of the secret.
-        :return: ARN of the secret if found, None otherwise.
+        :param fetch_value: Whether to also fetch the secret value (default is False).
+        :return: A dictionary with secret details (ARN and optionally the secret value)
+                 or an error dictionary if something went wrong.
         """
-        # Initialize the Secrets Manager client
-        secretsmanager = boto3.client("secretsmanager", region_name=self.region)
         try:
-            # Describe the secret to get its details
-            response = secretsmanager.describe_secret(SecretId=secret_name)
-            return response["ARN"]
-        except ClientError as e:
-            # Handle the case where the secret does not exist
-            if e.response["Error"]["Code"] == "ResourceNotFoundException":
-                logger.warning(f"The requested secret {secret_name} was not found")
-                return None
-            else:
-                # Log other client errors and return None
-                logger.error(f"An error occurred: {e}")
-                return None
+            # Describe the secret to get its ARN and metadata
+            describe_response = self.secretsmanager.describe_secret(SecretId=secret_name)
 
-    def get_secret(self, secret_name: str) -> str:
-        """
-        Retrieve the secret value from AWS Secrets Manager.
+            secret_details = {
+                "ARN": describe_response["ARN"],
+                # You can add more fields from `describe_response` if needed
+            }
+
+            # Fetch the secret value if requested
+            if fetch_value:
+                value_response = self.secretsmanager.get_secret_value(SecretId=secret_name)
+                secret_details["SecretValue"] = value_response.get("SecretString")
+
+            return secret_details
 
-        :param secret_name: Name of the secret.
-        :return: Secret value as a string if found, None otherwise.
-        """
-        # Initialize the Secrets Manager client
-        secretsmanager = boto3.client("secretsmanager", region_name=self.region)
-        try:
-            # Get the secret value
-            response = secretsmanager.get_secret_value(SecretId=secret_name)
-            return response.get("SecretString")
         except ClientError as e:
-            # Handle the case where the secret does not exist
-            if e.response["Error"]["Code"] == "ResourceNotFoundException":
-                logger.warning("The requested secret was not found")
-                return None
+            error_code = e.response["Error"]["Code"]
+            if error_code == "ResourceNotFoundException":
+                logger.warning(f"The requested secret '{secret_name}' was not found")
             else:
-                # Log other client errors and return None
-                logger.error(f"An error occurred: {e}")
-                return None
+                logger.error(f"An error occurred while fetching secret '{secret_name}': {e}")
+            # Return a dictionary with error details
+            return {"error": str(e), "error_code": error_code}
 
     def create_secret(self, secret_name: str, secret_value: dict) -> str:
         """
         Create a new secret in AWS Secrets Manager.
-
         :param secret_name: Name of the secret to create.
         :param secret_value: Dictionary containing the secret data.
         :return: ARN of the created secret if successful, None otherwise.
         """
-        # Initialize the Secrets Manager client
-        secretsmanager = boto3.client("secretsmanager", region_name=self.region)
         try:
             # Create the secret with the provided name and value
-            response = secretsmanager.create_secret(
+            response = self.secretsmanager.create_secret(
                 Name=secret_name,
                 SecretString=json.dumps(secret_value),
             )
             # Log success and return the secret's ARN
-            logger.info(f"Secret {secret_name} created successfully.")
+            logger.info(f"Secret '{secret_name}' created successfully.")
             return response["ARN"]
         except ClientError as e:
             # Log errors during secret creation and return None
-            logger.error(f"Error creating secret: {e}")
-            return None
+            logger.error(f"Error creating secret '{secret_name}': {e}")
+            return None
\ No newline at end of file
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py b/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py
index 3a3fa0f8..8d89f258 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/__init__.py
@@ -4,10 +4,3 @@
 # compatible open source license.
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
-
-# SPDX-License-Identifier: Apache-2.0
-# The OpenSearch Contributors require contributions made to
-# this file be licensed under the Apache-2.0 license or a
-# compatible open source license.
-# Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py
index 3a3fa0f8..8d89f258 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/__init__.py
@@ -4,10 +4,3 @@
 # compatible open source license.
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
-
-# SPDX-License-Identifier: Apache-2.0
-# The OpenSearch Contributors require contributions made to
-# this file be licensed under the Apache-2.0 license or a
-# compatible open source license.
-# Any modifications Copyright OpenSearch Contributors. See
-# GitHub history for details.
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index 906abdf1..2ca32daf 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -18,6 +18,7 @@
 from botocore.config import Config
 from colorama import Fore, Style, init
 from opensearchpy import OpenSearch, RequestsHttpConnection
+import requests
 
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register import ModelRegister
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import (
@@ -832,3 +833,37 @@ def setup_command(self):
             print(
                 f"\n{Fore.RED}Failed to initialize OpenSearch client. Setup incomplete.{Style.RESET_ALL}\n"
             )
+
+    def map_iam_role_to_backend_role(self, iam_role_arn):
+        """
+        Map an IAM role to an OpenSearch backend role for access control.
+
+        :param iam_role_arn: ARN of the IAM role to map.
+        """
+        os_security_role = "ml_full_access"  # Example OpenSearch security role
+        url = f"{self.opensearch_domain_url}/_plugins/_security/api/rolesmapping/{os_security_role}"
+
+        payload = {"backend_roles": [iam_role_arn]}
+        headers = {"Content-Type": "application/json"}
+
+        try:
+            response = requests.put(
+                url,
+                auth=(self.opensearch_domain_username, self.opensearch_domain_password),
+                json=payload,
+                headers=headers,
+                verify=True,
+            )
+
+            if response.status_code == 200:
+                print(
+                    f"Successfully mapped IAM role to OpenSearch role '{os_security_role}'."
+                )
+            else:
+                print(
+                    f"Failed to map IAM role to OpenSearch role '{os_security_role}'. "
+                    f"Status code: {response.status_code}"
+                )
+                print(f"Response: {response.text}")
+        except requests.exceptions.RequestException as e:
+            print(f"HTTP request failed: {e}")
\ No newline at end of file
diff --git a/setup.py b/setup.py
index 13810501..d9d4d468 100644
--- a/setup.py
+++ b/setup.py
@@ -88,6 +88,7 @@
         "numpy>=1.24.0,<2",
         "deprecated>=1.2.14,<2",
         # Additional dependencies for the RAG pipeline
+
         "accelerate>=0.27",
         "sentence_transformers>=2.5.0,<2.6",
         "tqdm>=4.66.0,<5",

From 197a134744eade8b4c7c1fe9d910349e9876fcef Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Tue, 7 Jan 2025 14:37:11 -0800
Subject: [PATCH 41/42] Addressed code comments, making code less redundent,
 and combining existing methods

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 opensearch_py_ml/ml_commons/IAMRoleHelper.py   |  9 ++++-----
 opensearch_py_ml/ml_commons/SecretsHelper.py   | 18 ++++++++++++------
 .../ml_commons/rag_pipeline/rag/rag_setup.py   |  4 ++--
 setup.py                                       |  1 -
 4 files changed, 18 insertions(+), 14 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/IAMRoleHelper.py b/opensearch_py_ml/ml_commons/IAMRoleHelper.py
index 1530b914..9c8103c0 100644
--- a/opensearch_py_ml/ml_commons/IAMRoleHelper.py
+++ b/opensearch_py_ml/ml_commons/IAMRoleHelper.py
@@ -2,8 +2,8 @@
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
-# Any modifications Copyright OpenSearch Contributors.
-# See GitHub history for details.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
 
 import json
 import logging
@@ -11,7 +11,6 @@
 from datetime import datetime
 
 import boto3
-import requests
 from botocore.exceptions import ClientError
 
 
@@ -126,7 +125,7 @@ def create_iam_role(
 
             # If policy_name is not provided, generate a unique one
             if not policy_name:
-                timestamp = datetime.utcnow().strftime('%Y%m%d%H%M%S')
+                timestamp = datetime.utcnow().strftime("%Y%m%d%H%M%S")
                 policy_name = f"InlinePolicy-{role_name}-{timestamp}"
 
             # Attach the inline policy to the role
@@ -270,4 +269,4 @@ def get_iam_user_name_from_arn(self, iam_principal_arn):
         # IAM user ARN format: arn:aws:iam::123456789012:user/user-name
         if iam_principal_arn and ":user/" in iam_principal_arn:
             return iam_principal_arn.split(":user/")[-1]
-        return None
\ No newline at end of file
+        return None
diff --git a/opensearch_py_ml/ml_commons/SecretsHelper.py b/opensearch_py_ml/ml_commons/SecretsHelper.py
index a828c80a..e35d6ff3 100644
--- a/opensearch_py_ml/ml_commons/SecretsHelper.py
+++ b/opensearch_py_ml/ml_commons/SecretsHelper.py
@@ -2,8 +2,8 @@
 # The OpenSearch Contributors require contributions made to
 # this file be licensed under the Apache-2.0 license or a
 # compatible open source license.
-# Any modifications Copyright OpenSearch
-# Contributors. See GitHub history for details.
+# Any modifications Copyright OpenSearch Contributors. See
+# GitHub history for details.
 
 import json
 import logging
@@ -61,7 +61,9 @@ def get_secret_details(self, secret_name: str, fetch_value: bool = False) -> dic
         """
         try:
             # Describe the secret to get its ARN and metadata
-            describe_response = self.secretsmanager.describe_secret(SecretId=secret_name)
+            describe_response = self.secretsmanager.describe_secret(
+                SecretId=secret_name
+            )
 
             secret_details = {
                 "ARN": describe_response["ARN"],
@@ -70,7 +72,9 @@ def get_secret_details(self, secret_name: str, fetch_value: bool = False) -> dic
 
             # Fetch the secret value if requested
             if fetch_value:
-                value_response = self.secretsmanager.get_secret_value(SecretId=secret_name)
+                value_response = self.secretsmanager.get_secret_value(
+                    SecretId=secret_name
+                )
                 secret_details["SecretValue"] = value_response.get("SecretString")
 
             return secret_details
@@ -80,7 +84,9 @@ def get_secret_details(self, secret_name: str, fetch_value: bool = False) -> dic
             if error_code == "ResourceNotFoundException":
                 logger.warning(f"The requested secret '{secret_name}' was not found")
             else:
-                logger.error(f"An error occurred while fetching secret '{secret_name}': {e}")
+                logger.error(
+                    f"An error occurred while fetching secret '{secret_name}': {e}"
+                )
             # Return a dictionary with error details
             return {"error": str(e), "error_code": error_code}
 
@@ -103,4 +109,4 @@ def create_secret(self, secret_name: str, secret_value: dict) -> str:
         except ClientError as e:
             # Log errors during secret creation and return None
             logger.error(f"Error creating secret '{secret_name}': {e}")
-            return None
\ No newline at end of file
+            return None
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
index 2ca32daf..b69779b7 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/rag_setup.py
@@ -15,10 +15,10 @@
 from urllib.parse import urlparse
 
 import boto3
+import requests
 from botocore.config import Config
 from colorama import Fore, Style, init
 from opensearchpy import OpenSearch, RequestsHttpConnection
-import requests
 
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.model_register import ModelRegister
 from opensearch_py_ml.ml_commons.rag_pipeline.rag.opensearch_connector import (
@@ -866,4 +866,4 @@ def map_iam_role_to_backend_role(self, iam_role_arn):
                 )
                 print(f"Response: {response.text}")
         except requests.exceptions.RequestException as e:
-            print(f"HTTP request failed: {e}")
\ No newline at end of file
+            print(f"HTTP request failed: {e}")
diff --git a/setup.py b/setup.py
index d9d4d468..13810501 100644
--- a/setup.py
+++ b/setup.py
@@ -88,7 +88,6 @@
         "numpy>=1.24.0,<2",
         "deprecated>=1.2.14,<2",
         # Additional dependencies for the RAG pipeline
-
         "accelerate>=0.27",
         "sentence_transformers>=2.5.0,<2.6",
         "tqdm>=4.66.0,<5",

From 220e9ee620a20081ce96e73e404246d82d9a3137 Mon Sep 17 00:00:00 2001
From: hmumtazz <hashimkmumtaz@gmail.com>
Date: Tue, 21 Jan 2025 00:00:27 -0800
Subject: [PATCH 42/42] Fixed methods at UT's, adressed comments

Signed-off-by: hmumtazz <hashimkmumtaz@gmail.com>
---
 opensearch_py_ml/ml_commons/IAMRoleHelper.py  |  20 +-
 .../rag_pipeline/rag/AIConnectorHelper.py     |  18 +-
 tests/rag/test_AiConnectorClass.py            |  10 +-
 tests/rag/test_IAMRoleHelper.py               | 440 +++++++++---------
 tests/rag/test_SecretsHelper.py               | 145 ++++--
 5 files changed, 361 insertions(+), 272 deletions(-)

diff --git a/opensearch_py_ml/ml_commons/IAMRoleHelper.py b/opensearch_py_ml/ml_commons/IAMRoleHelper.py
index 9c8103c0..538297f4 100644
--- a/opensearch_py_ml/ml_commons/IAMRoleHelper.py
+++ b/opensearch_py_ml/ml_commons/IAMRoleHelper.py
@@ -39,7 +39,7 @@ def __init__(
         self.opensearch_domain_username = opensearch_domain_username
         self.opensearch_domain_password = opensearch_domain_password
 
-        self.iam_client = boto3.client("iam", region_name=self.region)
+        self.iam_client = boto3.client("iam")
         self.sts_client = boto3.client("sts", region_name=self.region)
 
     def role_exists(self, role_name):
@@ -225,10 +225,8 @@ def assume_role(self, role_arn, role_session_name=None, session=None):
             logging.error("Role ARN is required.")
             return None
 
-        # Use the provided session's STS client or fall back to the class-level sts_client
         sts_client = session.client("sts") if session else self.sts_client
 
-        # Generate a default session name if none is provided
         role_session_name = role_session_name or f"session-{uuid.uuid4()}"
 
         try:
@@ -263,10 +261,16 @@ def get_iam_user_name_from_arn(self, iam_principal_arn):
         """
         Extract the IAM user name from an IAM principal ARN.
 
-        :param iam_principal_arn: ARN of the IAM principal.
-        :return: IAM user name or None if extraction fails.
+        :param iam_principal_arn: ARN of the IAM principal. Expected format: arn:aws:iam::<account-id>:user/<user-name>
+        :return: IAM user name if extraction is successful, None otherwise.
         """
-        # IAM user ARN format: arn:aws:iam::123456789012:user/user-name
-        if iam_principal_arn and ":user/" in iam_principal_arn:
-            return iam_principal_arn.split(":user/")[-1]
+        try:
+            if (
+                iam_principal_arn
+                and iam_principal_arn.startswith("arn:aws:iam::")
+                and ":user/" in iam_principal_arn
+            ):
+                return iam_principal_arn.split(":user/")[-1]
+        except Exception as e:
+            print(f"Error extracting IAM user name: {e}")
         return None
diff --git a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
index 8d3d93de..5fe20939 100644
--- a/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
+++ b/opensearch_py_ml/ml_commons/rag_pipeline/rag/AIConnectorHelper.py
@@ -167,14 +167,17 @@ def create_connector(self, create_connector_role_name, payload):
         connector_id = response.get("connector_id")
         return connector_id
 
-    def get_task(self, task_id, create_connector_role_name):
+    def get_task(self, task_id, create_connector_role_name, wait_until_task_done=False):
         """
         Retrieve the status of a specific task using its ID.
-        Reusing the get_task_info method from MLCommonClient.
+        Reusing the get_task_info method from MLCommonClient and allowing
+        optional wait until the task completes.
         """
         try:
-            # No need to authenticate here again, ml_commons_client uses self.opensearch_client
-            task_response = self.ml_commons_client.get_task_info(task_id)
+            # No need to re-authenticate here; ml_commons_client uses self.opensearch_client
+            task_response = self.ml_commons_client.get_task_info(
+                task_id, wait_until_task_done
+            )
             print("Get Task Response:", json.dumps(task_response))
             return task_response
         except Exception as e:
@@ -232,10 +235,11 @@ def create_model(
             if "model_id" in response_data:
                 return response_data["model_id"]
             elif "task_id" in response_data:
-                # Handle asynchronous task
-                time.sleep(2)  # Wait for task to complete
+                # Handle asynchronous task by leveraging wait_until_task_done
                 task_response = self.get_task(
-                    response_data["task_id"], create_connector_role_name
+                    response_data["task_id"],
+                    create_connector_role_name,
+                    wait_until_task_done=True,
                 )
                 print("Task Response:", json.dumps(task_response))
                 if "model_id" in task_response:
diff --git a/tests/rag/test_AiConnectorClass.py b/tests/rag/test_AiConnectorClass.py
index e4776da5..65b08993 100644
--- a/tests/rag/test_AiConnectorClass.py
+++ b/tests/rag/test_AiConnectorClass.py
@@ -261,7 +261,9 @@ def test_create_model(self, mock_get_task, mock_get_ml_auth, mock_requests_post)
         # Instantiate helper
         with patch.object(AIConnectorHelper, "__init__", return_value=None):
             helper = AIConnectorHelper()
-            helper.opensearch_domain_url = f"https://{self.domain_endpoint}"
+            helper.opensearch_domain_url = (
+                "https://search-test-domain.us-east-1.es.amazonaws.com"
+            )
             helper.model_access_control = MagicMock()
             helper.model_access_control.get_model_group_id_by_name.return_value = (
                 "test-model-group-id"
@@ -276,7 +278,7 @@ def test_create_model(self, mock_get_task, mock_get_ml_auth, mock_requests_post)
                 deploy=True,
             )
 
-            # Assert that the correct URL was used
+            # Assert correct URL
             expected_url = f"{helper.opensearch_domain_url}/_plugins/_ml/models/_register?deploy=true"
             mock_requests_post.assert_called_once_with(
                 expected_url,
@@ -291,9 +293,9 @@ def test_create_model(self, mock_get_task, mock_get_ml_auth, mock_requests_post)
                 headers={"Content-Type": "application/json"},
             )
 
-            # Assert that get_task was called
+            # **Updated assertion** (include wait_until_task_done=True)
             mock_get_task.assert_called_once_with(
-                "test-task-id", "test-create-connector-role"
+                "test-task-id", "test-create-connector-role", wait_until_task_done=True
             )
 
             # Assert that model_id is returned
diff --git a/tests/rag/test_IAMRoleHelper.py b/tests/rag/test_IAMRoleHelper.py
index f0366dbd..7ae0e231 100644
--- a/tests/rag/test_IAMRoleHelper.py
+++ b/tests/rag/test_IAMRoleHelper.py
@@ -5,9 +5,8 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
-import json
-import logging
 import unittest
+from datetime import datetime, timedelta
 from unittest.mock import MagicMock, patch
 
 from botocore.exceptions import ClientError
@@ -16,290 +15,307 @@
 
 
 class TestIAMRoleHelper(unittest.TestCase):
-
     def setUp(self):
+        """
+        Create an IAMRoleHelper instance with mock configurations.
+        Patching boto3 clients so that no real AWS calls are made.
+        """
         self.region = "us-east-1"
-        self.iam_helper = IAMRoleHelper(region=self.region)
 
-        # Configure logging to suppress error logs during tests
-        logger = logging.getLogger("opensearch_py_ml.ml_commons.IAMRoleHelper")
-        logger.setLevel(logging.CRITICAL)  # Suppress logs below CRITICAL during tests
+        # Patches for the boto3 clients
+        self.patcher_iam = patch("boto3.client")
+        self.mock_boto_client = self.patcher_iam.start()
 
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_role_exists_true(self, mock_boto_client):
-        mock_iam_client = MagicMock()
-        mock_boto_client.return_value = mock_iam_client
+        # Mock the IAM client and STS client
+        self.mock_iam_client = MagicMock()
+        self.mock_sts_client = MagicMock()
 
-        mock_iam_client.get_role.return_value = {"Role": {"RoleName": "test-role"}}
+        # Configure the mock_boto_client to return the respective mocks
+        self.mock_boto_client.side_effect = lambda service_name, region_name=None: {
+            "iam": self.mock_iam_client,
+            "sts": self.mock_sts_client,
+        }[service_name]
 
-        result = self.iam_helper.role_exists("test-role")
+        # Instantiate our class under test
+        self.helper = IAMRoleHelper(region=self.region)
 
-        self.assertTrue(result)
-        mock_iam_client.get_role.assert_called_with(RoleName="test-role")
+    def tearDown(self):
+        self.patcher_iam.stop()
 
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_role_exists_false(self, mock_boto_client):
-        mock_iam_client = MagicMock()
-        mock_boto_client.return_value = mock_iam_client
+    def test_role_exists_found(self):
+        """Test role_exists returns True when role is found."""
+        # Mock successful get_role call
+        self.mock_iam_client.get_role.return_value = {
+            "Role": {"RoleName": "my-test-role"}
+        }
+
+        result = self.helper.role_exists("my-test-role")
+        self.assertTrue(result)
+        self.mock_iam_client.get_role.assert_called_once_with(RoleName="my-test-role")
 
+    def test_role_exists_not_found(self):
+        """Test role_exists returns False when role is not found."""
+        # Mock get_role call to raise NoSuchEntity
         error_response = {
-            "Error": {"Code": "NoSuchEntity", "Message": "Role does not exist"}
+            "Error": {"Code": "NoSuchEntity", "Message": "Role not found"}
         }
-        mock_iam_client.get_role.side_effect = ClientError(error_response, "GetRole")
-
-        result = self.iam_helper.role_exists("nonexistent-role")
+        self.mock_iam_client.get_role.side_effect = ClientError(
+            error_response, "GetRole"
+        )
 
+        result = self.helper.role_exists("non-existent-role")
         self.assertFalse(result)
-        mock_iam_client.get_role.assert_called_with(RoleName="nonexistent-role")
 
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_delete_role_success(self, mock_boto_client):
-        mock_iam_client = MagicMock()
-        mock_boto_client.return_value = mock_iam_client
+    def test_role_exists_other_error(self):
+        """Test role_exists returns False (and prints error) when another ClientError occurs."""
+        error_response = {
+            "Error": {"Code": "SomeOtherError", "Message": "Unexpected error"}
+        }
+        self.mock_iam_client.get_role.side_effect = ClientError(
+            error_response, "GetRole"
+        )
+
+        result = self.helper.role_exists("some-role")
+        self.assertFalse(result)
 
-        # Mock responses for list_attached_role_policies and list_role_policies
-        mock_iam_client.list_attached_role_policies.return_value = {
-            "AttachedPolicies": [{"PolicyArn": "arn:aws:iam::aws:policy/ExamplePolicy"}]
+    def test_delete_role_happy_path(self):
+        """Test delete_role successfully detaches and deletes a role."""
+        # Mock listing attached policies
+        self.mock_iam_client.list_attached_role_policies.return_value = {
+            "AttachedPolicies": [
+                {"PolicyArn": "arn:aws:iam::123456789012:policy/testPolicy"}
+            ]
         }
-        mock_iam_client.list_role_policies.return_value = {
-            "PolicyNames": ["InlinePolicy"]
+        # Mock listing inline policies
+        self.mock_iam_client.list_role_policies.return_value = {
+            "PolicyNames": ["InlinePolicyTest"]
         }
 
-        self.iam_helper.delete_role("test-role")
+        self.helper.delete_role("my-test-role")
 
-        mock_iam_client.detach_role_policy.assert_called_with(
-            RoleName="test-role", PolicyArn="arn:aws:iam::aws:policy/ExamplePolicy"
+        # Verify detach calls
+        self.mock_iam_client.detach_role_policy.assert_called_once_with(
+            RoleName="my-test-role",
+            PolicyArn="arn:aws:iam::123456789012:policy/testPolicy",
         )
-        mock_iam_client.delete_role_policy.assert_called_with(
-            RoleName="test-role", PolicyName="InlinePolicy"
+        # Verify delete inline policy call
+        self.mock_iam_client.delete_role_policy.assert_called_once_with(
+            RoleName="my-test-role", PolicyName="InlinePolicyTest"
+        )
+        # Verify delete_role call
+        self.mock_iam_client.delete_role.assert_called_once_with(
+            RoleName="my-test-role"
         )
-        mock_iam_client.delete_role.assert_called_with(RoleName="test-role")
-
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_delete_role_not_exist(self, mock_boto_client):
-        mock_iam_client = MagicMock()
-        mock_boto_client.return_value = mock_iam_client
 
+    def test_delete_role_no_such_entity(self):
+        """Test delete_role prints message if role does not exist."""
         error_response = {
-            "Error": {"Code": "NoSuchEntity", "Message": "Role does not exist"}
+            "Error": {"Code": "NoSuchEntity", "Message": "Role not found"}
         }
-        mock_iam_client.list_attached_role_policies.side_effect = ClientError(
+        self.mock_iam_client.list_attached_role_policies.side_effect = ClientError(
             error_response, "ListAttachedRolePolicies"
         )
 
-        self.iam_helper.delete_role("nonexistent-role")
+        self.helper.delete_role("non-existent-role")
+        # We expect it to print a message, and not raise. The method should handle it.
 
-        mock_iam_client.list_attached_role_policies.assert_called_with(
-            RoleName="nonexistent-role"
+    def test_delete_role_other_error(self):
+        """Test delete_role prints error for unexpected ClientError."""
+        error_response = {
+            "Error": {"Code": "SomeOtherError", "Message": "Unexpected error"}
+        }
+        self.mock_iam_client.list_attached_role_policies.side_effect = ClientError(
+            error_response, "ListAttachedRolePolicies"
         )
 
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_create_iam_role_success(self, mock_boto_client):
-        mock_iam_client = MagicMock()
-        mock_boto_client.return_value = mock_iam_client
+        self.helper.delete_role("some-role")
 
+    def test_create_iam_role_happy_path(self):
+        """Test create_iam_role creates a role with trust and inline policy."""
+        # Mock create_role response
+        self.mock_iam_client.create_role.return_value = {
+            "Role": {
+                "Arn": "arn:aws:iam::123456789012:role/my-test-role",
+                "RoleName": "my-test-role",
+            }
+        }
         trust_policy = {"Version": "2012-10-17", "Statement": []}
         inline_policy = {"Version": "2012-10-17", "Statement": []}
 
-        mock_iam_client.create_role.return_value = {
-            "Role": {"Arn": "arn:aws:iam::123456789012:role/test-role"}
-        }
-
-        role_arn = self.iam_helper.create_iam_role(
-            "test-role", trust_policy, inline_policy
+        role_arn = self.helper.create_iam_role(
+            role_name="my-test-role",
+            trust_policy_json=trust_policy,
+            inline_policy_json=inline_policy,
+            policy_name="myInlinePolicy",
         )
 
-        self.assertEqual(role_arn, "arn:aws:iam::123456789012:role/test-role")
-        mock_iam_client.create_role.assert_called_with(
-            RoleName="test-role",
-            AssumeRolePolicyDocument=json.dumps(trust_policy),
-            Description="Role with custom trust and inline policies",
-        )
-        mock_iam_client.put_role_policy.assert_called_with(
-            RoleName="test-role",
-            PolicyName="InlinePolicy",
-            PolicyDocument=json.dumps(inline_policy),
-        )
-
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_create_iam_role_error(self, mock_boto_client):
-        mock_iam_client = MagicMock()
-        mock_boto_client.return_value = mock_iam_client
-
-        trust_policy = {"Version": "2012-10-17", "Statement": []}
-        inline_policy = {"Version": "2012-10-17", "Statement": []}
+        # Verify calls
+        self.mock_iam_client.create_role.assert_called_once()
+        self.mock_iam_client.put_role_policy.assert_called_once()
+        self.assertEqual(role_arn, "arn:aws:iam::123456789012:role/my-test-role")
 
+    def test_create_iam_role_failure(self):
+        """Test create_iam_role returns None if creation fails."""
         error_response = {
-            "Error": {"Code": "EntityAlreadyExists", "Message": "Role already exists"}
+            "Error": {"Code": "SomeOtherError", "Message": "Role creation failure"}
         }
-        mock_iam_client.create_role.side_effect = ClientError(
+        self.mock_iam_client.create_role.side_effect = ClientError(
             error_response, "CreateRole"
         )
 
-        role_arn = self.iam_helper.create_iam_role(
-            "existing-role", trust_policy, inline_policy
-        )
+        trust_policy = {"Version": "2012-10-17", "Statement": []}
+        inline_policy = {"Version": "2012-10-17", "Statement": []}
 
-        self.assertIsNone(role_arn)
-        mock_iam_client.create_role.assert_called_with(
-            RoleName="existing-role",
-            AssumeRolePolicyDocument=json.dumps(trust_policy),
-            Description="Role with custom trust and inline policies",
+        role_arn = self.helper.create_iam_role(
+            role_name="my-test-role",
+            trust_policy_json=trust_policy,
+            inline_policy_json=inline_policy,
         )
 
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_get_role_arn_success(self, mock_boto_client):
-        mock_iam_client = MagicMock()
-        mock_boto_client.return_value = mock_iam_client
-
-        mock_iam_client.get_role.return_value = {
-            "Role": {"Arn": "arn:aws:iam::123456789012:role/test-role"}
+        self.assertIsNone(role_arn)
+        self.mock_iam_client.put_role_policy.assert_not_called()
+
+    def test_get_role_info_arn_only(self):
+        """Test get_role_info returns role ARN only when include_details=False."""
+        self.mock_iam_client.get_role.return_value = {
+            "Role": {
+                "RoleName": "my-test-role",
+                "Arn": "arn:aws:iam::123456789012:role/my-test-role",
+            }
         }
 
-        role_arn = self.iam_helper.get_role_arn("test-role")
-
-        self.assertEqual(role_arn, "arn:aws:iam::123456789012:role/test-role")
-        mock_iam_client.get_role.assert_called_with(RoleName="test-role")
+        arn = self.helper.get_role_info("my-test-role", include_details=False)
+        self.assertEqual(arn, "arn:aws:iam::123456789012:role/my-test-role")
+
+    def test_get_role_info_details(self):
+        """Test get_role_info returns detailed info when include_details=True."""
+        # Mock get_role
+        self.mock_iam_client.get_role.return_value = {
+            "Role": {
+                "RoleName": "my-test-role",
+                "RoleId": "AIDA12345EXAMPLE",
+                "Arn": "arn:aws:iam::123456789012:role/my-test-role",
+                "CreateDate": datetime(2020, 1, 1),
+                "AssumeRolePolicyDocument": {"Version": "2012-10-17", "Statement": []},
+            }
+        }
+        # Mock list_role_policies
+        self.mock_iam_client.list_role_policies.return_value = {
+            "PolicyNames": ["inlinePolicyTest"]
+        }
+        # Mock get_role_policy
+        self.mock_iam_client.get_role_policy.return_value = {
+            "PolicyDocument": {"Version": "2012-10-17", "Statement": []}
+        }
 
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_get_role_arn_not_found(self, mock_boto_client):
-        mock_iam_client = MagicMock()
-        mock_boto_client.return_value = mock_iam_client
+        details = self.helper.get_role_info("my-test-role", include_details=True)
+        self.assertIsInstance(details, dict)
+        self.assertEqual(details["RoleName"], "my-test-role")
+        self.assertEqual(details["InlinePolicies"].keys(), {"inlinePolicyTest"})
 
+    def test_get_role_info_not_found(self):
+        """Test get_role_info returns None if role is not found."""
         error_response = {
-            "Error": {"Code": "NoSuchEntity", "Message": "Role does not exist"}
+            "Error": {"Code": "NoSuchEntity", "Message": "Role not found"}
         }
-        mock_iam_client.get_role.side_effect = ClientError(error_response, "GetRole")
-
-        role_arn = self.iam_helper.get_role_arn("nonexistent-role")
+        self.mock_iam_client.get_role.side_effect = ClientError(
+            error_response, "GetRole"
+        )
 
-        self.assertIsNone(role_arn)
-        mock_iam_client.get_role.assert_called_with(RoleName="nonexistent-role")
+        details = self.helper.get_role_info("non-existent-role", include_details=True)
+        self.assertIsNone(details)
 
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_get_user_arn_success(self, mock_boto_client):
-        mock_iam_client = MagicMock()
-        mock_boto_client.return_value = mock_iam_client
+    def test_get_role_info_no_role_name(self):
+        """Test get_role_info returns None if role_name not provided."""
+        details = self.helper.get_role_info("", include_details=True)
+        self.assertIsNone(details)
 
-        mock_iam_client.get_user.return_value = {
-            "User": {"Arn": "arn:aws:iam::123456789012:user/test-user"}
+    def test_get_user_arn_success(self):
+        """Test get_user_arn returns ARN if user is found."""
+        self.mock_iam_client.get_user.return_value = {
+            "User": {
+                "Arn": "arn:aws:iam::123456789012:user/TestUser",
+                "UserName": "TestUser",
+            }
         }
 
-        user_arn = self.iam_helper.get_user_arn("test-user")
-
-        self.assertEqual(user_arn, "arn:aws:iam::123456789012:user/test-user")
-        mock_iam_client.get_user.assert_called_with(UserName="test-user")
-
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_get_user_arn_not_found(self, mock_boto_client):
-        mock_iam_client = MagicMock()
-        mock_boto_client.return_value = mock_iam_client
+        arn = self.helper.get_user_arn("TestUser")
+        self.assertEqual(arn, "arn:aws:iam::123456789012:user/TestUser")
 
+    def test_get_user_arn_not_found(self):
+        """Test get_user_arn returns None if user does not exist."""
         error_response = {
-            "Error": {"Code": "NoSuchEntity", "Message": "User does not exist"}
+            "Error": {"Code": "NoSuchEntity", "Message": "User not found"}
         }
-        mock_iam_client.get_user.side_effect = ClientError(error_response, "GetUser")
-
-        user_arn = self.iam_helper.get_user_arn("nonexistent-user")
-
-        self.assertIsNone(user_arn)
-        mock_iam_client.get_user.assert_called_with(UserName="nonexistent-user")
-
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_assume_role_success(self, mock_boto_client):
-        mock_sts_client = MagicMock()
-        mock_boto_client.return_value = mock_sts_client
+        self.mock_iam_client.get_user.side_effect = ClientError(
+            error_response, "GetUser"
+        )
 
-        mock_sts_client.assume_role.return_value = {
-            "Credentials": {
-                "AccessKeyId": "ASIA...",
-                "SecretAccessKey": "secret",
-                "SessionToken": "token",
-            }
+        arn = self.helper.get_user_arn("NonExistentUser")
+        self.assertIsNone(arn)
+
+    def test_get_user_arn_no_username(self):
+        """Test get_user_arn returns None if username not provided."""
+        arn = self.helper.get_user_arn("")
+        self.assertIsNone(arn)
+
+    def test_assume_role_happy_path(self):
+        """Test assume_role returns credentials on success."""
+        # Mock assume_role response
+        mock_credentials = {
+            "AccessKeyId": "AKIAEXAMPLE",
+            "SecretAccessKey": "SECRET",
+            "SessionToken": "TOKEN",
+            "Expiration": datetime.utcnow() + timedelta(hours=1),
+        }
+        self.mock_sts_client.assume_role.return_value = {
+            "Credentials": mock_credentials
         }
 
-        role_arn = "arn:aws:iam::123456789012:role/test-role"
-        credentials = self.iam_helper.assume_role(role_arn, "test-session")
-
-        self.assertIsNotNone(credentials)
-        self.assertEqual(credentials["AccessKeyId"], "ASIA...")
-        mock_sts_client.assume_role.assert_called_with(
-            RoleArn=role_arn,
-            RoleSessionName="test-session",
-        )
+        role_arn = "arn:aws:iam::123456789012:role/my-test-role"
+        response = self.helper.assume_role(role_arn, "test-session")
+        self.assertIsNotNone(response)
+        self.assertIn("credentials", response)
+        self.assertEqual(response["credentials"]["AccessKeyId"], "AKIAEXAMPLE")
 
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.boto3.client")
-    def test_assume_role_failure(self, mock_boto_client):
-        mock_sts_client = MagicMock()
-        mock_boto_client.return_value = mock_sts_client
+    def test_assume_role_no_arn(self):
+        """Test assume_role returns None if no ARN is provided."""
+        response = self.helper.assume_role(None, "test-session")
+        self.assertIsNone(response)
+        self.mock_sts_client.assume_role.assert_not_called()
 
+    def test_assume_role_failure(self):
+        """Test assume_role returns None if STS call fails."""
         error_response = {
             "Error": {
                 "Code": "AccessDenied",
-                "Message": "User is not authorized to perform: sts:AssumeRole",
+                "Message": "Not authorized to assume role",
             }
         }
-        mock_sts_client.assume_role.side_effect = ClientError(
+        self.mock_sts_client.assume_role.side_effect = ClientError(
             error_response, "AssumeRole"
         )
 
-        role_arn = "arn:aws:iam::123456789012:role/unauthorized-role"
-        credentials = self.iam_helper.assume_role(role_arn, "test-session")
-
-        self.assertIsNone(credentials)
-        mock_sts_client.assume_role.assert_called_with(
-            RoleArn=role_arn,
-            RoleSessionName="test-session",
-        )
-
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.requests.put")
-    def test_map_iam_role_to_backend_role_success(self, mock_put):
-        mock_response = MagicMock()
-        mock_response.status_code = 200
-        mock_put.return_value = mock_response
-
-        self.iam_helper.opensearch_domain_url = "https://search-domain"
-        self.iam_helper.opensearch_domain_username = "user"
-        self.iam_helper.opensearch_domain_password = "pass"
-
-        iam_role_arn = "arn:aws:iam::123456789012:role/test-role"
-
-        self.iam_helper.map_iam_role_to_backend_role(iam_role_arn)
-
-        mock_put.assert_called_once()
-        args, kwargs = mock_put.call_args
-        self.assertIn("/_plugins/_security/api/rolesmapping/ml_full_access", args[0])
-        self.assertEqual(kwargs["auth"], ("user", "pass"))
-        self.assertEqual(kwargs["json"], {"backend_roles": [iam_role_arn]})
-
-    @patch("opensearch_py_ml.ml_commons.IAMRoleHelper.requests.put")
-    def test_map_iam_role_to_backend_role_failure(self, mock_put):
-        mock_response = MagicMock()
-        mock_response.status_code = 403
-        mock_response.text = "Forbidden"
-        mock_put.return_value = mock_response
-
-        self.iam_helper.opensearch_domain_url = "https://search-domain"
-        self.iam_helper.opensearch_domain_username = "user"
-        self.iam_helper.opensearch_domain_password = "pass"
-
-        iam_role_arn = "arn:aws:iam::123456789012:role/test-role"
-
-        self.iam_helper.map_iam_role_to_backend_role(iam_role_arn)
-
-        mock_put.assert_called_once()
-        args, kwargs = mock_put.call_args
-        self.assertIn("/_plugins/_security/api/rolesmapping/ml_full_access", args[0])
+        role_arn = "arn:aws:iam::123456789012:role/my-test-role"
+        response = self.helper.assume_role(role_arn, "test-session")
+        self.assertIsNone(response)
 
     def test_get_iam_user_name_from_arn_valid(self):
-        iam_principal_arn = "arn:aws:iam::123456789012:user/test-user"
-        user_name = self.iam_helper.get_iam_user_name_from_arn(iam_principal_arn)
-        self.assertEqual(user_name, "test-user")
-
-    def test_get_iam_user_name_from_arn_invalid(self):
-        iam_principal_arn = "arn:aws:iam::123456789012:role/test-role"
-        user_name = self.iam_helper.get_iam_user_name_from_arn(iam_principal_arn)
-        self.assertIsNone(user_name)
+        """Test get_iam_user_name_from_arn returns the username part of the ARN."""
+        arn = "arn:aws:iam::123456789012:user/MyUser"
+        username = self.helper.get_iam_user_name_from_arn(arn)
+        self.assertEqual(username, "MyUser")
+
+    def test_get_iam_user_name_from_arn_invalid_format(self):
+        """Test get_iam_user_name_from_arn returns None for invalid format."""
+        arn = "arn:aws:iam::123456789012:role/MyRole"
+        username = self.helper.get_iam_user_name_from_arn(arn)
+        self.assertIsNone(username)
+
+    def test_get_iam_user_name_from_arn_none_input(self):
+        """Test get_iam_user_name_from_arn returns None if input is None."""
+        username = self.helper.get_iam_user_name_from_arn(None)
+        self.assertIsNone(username)
 
 
 if __name__ == "__main__":
diff --git a/tests/rag/test_SecretsHelper.py b/tests/rag/test_SecretsHelper.py
index 9f2454e3..e671a465 100644
--- a/tests/rag/test_SecretsHelper.py
+++ b/tests/rag/test_SecretsHelper.py
@@ -5,6 +5,7 @@
 # Any modifications Copyright OpenSearch Contributors. See
 # GitHub history for details.
 
+
 import json
 import logging
 import unittest
@@ -22,6 +23,9 @@ def setUpClass(cls):
         # Suppress logging below ERROR level during tests
         logging.basicConfig(level=logging.ERROR)
 
+    # ------------------------------------------------------------------
+    # Test: create_secret
+    # ------------------------------------------------------------------
     @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
     def test_create_secret_error_logging(self, mock_boto_client):
         mock_secretsmanager = MagicMock()
@@ -38,74 +42,84 @@ def test_create_secret_error_logging(self, mock_boto_client):
         )
 
         secret_helper = SecretHelper(region="us-east-1")
+        # Capture logs with a context manager
         with self.assertLogs(
             "opensearch_py_ml.ml_commons.SecretsHelper", level="ERROR"
         ) as cm:
             result = secret_helper.create_secret("new-secret", {"key": "value"})
             self.assertIsNone(result)
-        self.assertIn("Error creating secret", cm.output[0])
+        # Confirm the error message was logged
+        self.assertIn("Error creating secret 'new-secret'", cm.output[0])
 
     @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
-    def test_get_secret_arn_success(self, mock_boto_client):
+    def test_create_secret_success(self, mock_boto_client):
         mock_secretsmanager = MagicMock()
         mock_boto_client.return_value = mock_secretsmanager
 
-        mock_secretsmanager.describe_secret.return_value = {
-            "ARN": "arn:aws:secretsmanager:us-east-1:123456789012:secret:my-secret"
+        mock_secretsmanager.create_secret.return_value = {
+            "ARN": "arn:aws:secretsmanager:us-east-1:123456789012:secret:new-secret"
         }
 
         secret_helper = SecretHelper(region="us-east-1")
-        result = secret_helper.get_secret_arn("my-secret")
+        result = secret_helper.create_secret("new-secret", {"key": "value"})
         self.assertEqual(
-            result, "arn:aws:secretsmanager:us-east-1:123456789012:secret:my-secret"
+            result, "arn:aws:secretsmanager:us-east-1:123456789012:secret:new-secret"
+        )
+        mock_secretsmanager.create_secret.assert_called_with(
+            Name="new-secret", SecretString=json.dumps({"key": "value"})
         )
-        mock_secretsmanager.describe_secret.assert_called_with(SecretId="my-secret")
 
+    # ------------------------------------------------------------------
+    # Test: secret_exists
+    # ------------------------------------------------------------------
     @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
-    def test_get_secret_arn_not_found(self, mock_boto_client):
+    def test_secret_exists_true(self, mock_boto_client):
+        """Test that secret_exists returns True if secret is found."""
         mock_secretsmanager = MagicMock()
         mock_boto_client.return_value = mock_secretsmanager
 
-        error_response = {
-            "Error": {
-                "Code": "ResourceNotFoundException",
-                "Message": "Secret not found",
-            }
+        # If get_secret_value doesn't raise ResourceNotFoundException, assume secret exists
+        mock_secretsmanager.get_secret_value.return_value = {
+            "SecretString": "some-value"
         }
-        mock_secretsmanager.describe_secret.side_effect = ClientError(
-            error_response, "DescribeSecret"
-        )
 
         secret_helper = SecretHelper(region="us-east-1")
-        result = secret_helper.get_secret_arn("nonexistent-secret")
-        self.assertIsNone(result)
-        mock_secretsmanager.describe_secret.assert_called_with(
-            SecretId="nonexistent-secret"
+        exists = secret_helper.secret_exists("my-existing-secret")
+        self.assertTrue(exists)
+        mock_secretsmanager.get_secret_value.assert_called_with(
+            SecretId="my-existing-secret"
         )
 
     @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
-    def test_get_secret_success(self, mock_boto_client):
+    def test_secret_exists_false(self, mock_boto_client):
+        """Test that secret_exists returns False if secret is not found."""
         mock_secretsmanager = MagicMock()
         mock_boto_client.return_value = mock_secretsmanager
 
-        mock_secretsmanager.get_secret_value.return_value = {
-            "SecretString": "my-secret-value"
+        error_response = {
+            "Error": {
+                "Code": "ResourceNotFoundException",
+                "Message": "Secret not found",
+            }
         }
+        mock_secretsmanager.get_secret_value.side_effect = ClientError(
+            error_response, "GetSecretValue"
+        )
 
         secret_helper = SecretHelper(region="us-east-1")
-        result = secret_helper.get_secret("my-secret")
-        self.assertEqual(result, "my-secret-value")
-        mock_secretsmanager.get_secret_value.assert_called_with(SecretId="my-secret")
+        exists = secret_helper.secret_exists("nonexistent-secret")
+        self.assertFalse(exists)
 
     @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
-    def test_get_secret_not_found(self, mock_boto_client):
+    def test_secret_exists_other_error(self, mock_boto_client):
+        """Test that secret_exists returns False on unexpected ClientError."""
         mock_secretsmanager = MagicMock()
         mock_boto_client.return_value = mock_secretsmanager
 
         error_response = {
             "Error": {
-                "Code": "ResourceNotFoundException",
-                "Message": "Secret not found",
+                "Code": "InternalServiceError",
+                "Message": "An unspecified error occurred",
             }
         }
         mock_secretsmanager.get_secret_value.side_effect = ClientError(
@@ -113,28 +127,77 @@ def test_get_secret_not_found(self, mock_boto_client):
         )
 
         secret_helper = SecretHelper(region="us-east-1")
-        result = secret_helper.get_secret("nonexistent-secret")
-        self.assertIsNone(result)
-        mock_secretsmanager.get_secret_value.assert_called_with(
-            SecretId="nonexistent-secret"
-        )
+        exists = secret_helper.secret_exists("problem-secret")
+        self.assertFalse(exists)
 
+    # ------------------------------------------------------------------
+    # Test: get_secret_details
+    # ------------------------------------------------------------------
     @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
-    def test_create_secret_success(self, mock_boto_client):
+    def test_get_secret_details_arn_only_success(self, mock_boto_client):
+        """Test get_secret_details returns ARN if fetch_value=False."""
         mock_secretsmanager = MagicMock()
         mock_boto_client.return_value = mock_secretsmanager
 
-        mock_secretsmanager.create_secret.return_value = {
-            "ARN": "arn:aws:secretsmanager:us-east-1:123456789012:secret:new-secret"
+        mock_secretsmanager.describe_secret.return_value = {
+            "ARN": "arn:aws:secretsmanager:us-east-1:123456789012:secret:my-secret"
         }
 
         secret_helper = SecretHelper(region="us-east-1")
-        result = secret_helper.create_secret("new-secret", {"key": "value"})
+        details = secret_helper.get_secret_details("my-secret", fetch_value=False)
+        self.assertIn("ARN", details)
         self.assertEqual(
-            result, "arn:aws:secretsmanager:us-east-1:123456789012:secret:new-secret"
+            details["ARN"],
+            "arn:aws:secretsmanager:us-east-1:123456789012:secret:my-secret",
         )
-        mock_secretsmanager.create_secret.assert_called_with(
-            Name="new-secret", SecretString=json.dumps({"key": "value"})
+        self.assertNotIn("SecretValue", details)
+        mock_secretsmanager.describe_secret.assert_called_with(SecretId="my-secret")
+
+    @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
+    def test_get_secret_details_with_value_success(self, mock_boto_client):
+        """Test get_secret_details returns ARN and SecretValue if fetch_value=True."""
+        mock_secretsmanager = MagicMock()
+        mock_boto_client.return_value = mock_secretsmanager
+
+        mock_secretsmanager.describe_secret.return_value = {
+            "ARN": "arn:aws:secretsmanager:us-east-1:123456789012:secret:my-secret"
+        }
+        mock_secretsmanager.get_secret_value.return_value = {
+            "SecretString": "my-secret-value"
+        }
+
+        secret_helper = SecretHelper(region="us-east-1")
+        details = secret_helper.get_secret_details("my-secret", fetch_value=True)
+        self.assertIn("ARN", details)
+        self.assertIn("SecretValue", details)
+        self.assertEqual(details["SecretValue"], "my-secret-value")
+        mock_secretsmanager.describe_secret.assert_called_with(SecretId="my-secret")
+        mock_secretsmanager.get_secret_value.assert_called_with(SecretId="my-secret")
+
+    @patch("opensearch_py_ml.ml_commons.SecretsHelper.boto3.client")
+    def test_get_secret_details_not_found(self, mock_boto_client):
+        """Test get_secret_details returns an error dict if secret is not found."""
+        mock_secretsmanager = MagicMock()
+        mock_boto_client.return_value = mock_secretsmanager
+
+        error_response = {
+            "Error": {
+                "Code": "ResourceNotFoundException",
+                "Message": "Secret not found",
+            }
+        }
+        mock_secretsmanager.describe_secret.side_effect = ClientError(
+            error_response, "DescribeSecret"
+        )
+
+        secret_helper = SecretHelper(region="us-east-1")
+        details = secret_helper.get_secret_details(
+            "nonexistent-secret", fetch_value=True
+        )
+        self.assertIn("error", details)
+        self.assertEqual(details["error_code"], "ResourceNotFoundException")
+        mock_secretsmanager.describe_secret.assert_called_with(
+            SecretId="nonexistent-secret"
         )