rootflo · vishnurk6247 · Dec 19, 2025 · Dec 16, 2025 · Dec 16, 2025 · Dec 16, 2025
diff --git a/wavefront/client/src/pages/apps/[appId]/llm-inference/CreateLLMInferenceDialog.tsx b/wavefront/client/src/pages/apps/[appId]/llm-inference/CreateLLMInferenceDialog.tsx
@@ -71,6 +71,7 @@ const createLLMInferenceSchema = z.object({
   displayName: z.string().min(1, 'Display name is required'),
   llmModel: z.string().min(1, 'LLM model name is required'),
   type: z.enum(['openai', 'anthropic', 'gemini', 'azure_openai', 'ollama', 'vllm', 'groq']),
+  modelType: z.enum(['llm', 'embedding']),
   apiKey: z.string().optional(),
   baseUrl: z.string().optional(),
 });
@@ -103,6 +104,7 @@ const CreateLLMInferenceDialog: React.FC<CreateLLMInferenceDialogProps> = ({
       displayName: '',
       llmModel: '',
       type: 'openai',
+      modelType: 'llm',
       apiKey: '',
       baseUrl: getDefaultBaseUrl('openai'),
     },
@@ -131,6 +133,7 @@ const CreateLLMInferenceDialog: React.FC<CreateLLMInferenceDialogProps> = ({
         displayName: '',
         llmModel: '',
         type: defaultType,
+        modelType: 'llm',
         apiKey: '',
         baseUrl: getDefaultBaseUrl(defaultType),
       });
@@ -171,6 +174,7 @@ const CreateLLMInferenceDialog: React.FC<CreateLLMInferenceDialogProps> = ({
         llm_model: data.llmModel.trim(),
         api_key: data.apiKey?.trim() || undefined,
         type: data.type,
+        model_type: data.modelType,
         base_url: data.baseUrl?.trim() || undefined,
         parameters: Object.keys(cleanedParams).length > 0 ? cleanedParams : undefined,
       });
@@ -366,6 +370,31 @@ const CreateLLMInferenceDialog: React.FC<CreateLLMInferenceDialogProps> = ({
                   </FormItem>
                 )}
               />
+
+              <FormField
+                control={form.control}
+                name="modelType"
+                render={({ field }) => (
+                  <FormItem>
+                    <FormLabel>
+                      Model Type<span className="text-red-500">*</span>
+                    </FormLabel>
+                    <Select onValueChange={field.onChange} value={field.value}>
+                      <FormControl>
+                        <SelectTrigger>
+                          <SelectValue placeholder="Select model type" />
+                        </SelectTrigger>
+                      </FormControl>
+                      <SelectContent>
+                        <SelectItem value="llm">LLM</SelectItem>
+                        <SelectItem value="embedding">Embedding</SelectItem>
+                      </SelectContent>
+                    </Select>
+                    <FormDescription>Choose whether this is an LLM or embedding model</FormDescription>
+                    <FormMessage />
+                  </FormItem>
+                )}
+              />
             </div>
 
             <div className="grid grid-cols-2 gap-6">

diff --git a/wavefront/client/src/pages/apps/[appId]/llm-inference/[configId].tsx b/wavefront/client/src/pages/apps/[appId]/llm-inference/[configId].tsx
@@ -48,6 +48,7 @@ const llmConfigFormSchema = z.object({
   llm_model: z.string().min(1, 'LLM model is required'),
   type: z.enum(['openai', 'anthropic', 'gemini', 'azure_openai', 'ollama', 'vllm', 'groq']),
   api_key: z.string().optional(),
+  model_type: z.enum(['llm', 'embedding']),
   base_url: z.string().optional(),
   parameters: z.record(z.any()).optional(),
 });
@@ -74,6 +75,7 @@ const LLMInferenceConfigDetail: React.FC = () => {
       display_name: '',
       llm_model: '',
       type: 'openai',
+      model_type: 'llm',
       api_key: '',
       base_url: '',
       parameters: {},
@@ -91,6 +93,7 @@ const LLMInferenceConfigDetail: React.FC = () => {
         display_name: config.display_name,
         llm_model: config.llm_model,
         type: config.type,
+        model_type: (config.model_type as 'llm' | 'embedding') || 'llm',
         api_key: '', // API key is never returned for security
         base_url: config.base_url || '',
         parameters: mergedParams,
@@ -134,6 +137,7 @@ const LLMInferenceConfigDetail: React.FC = () => {
         display_name: data.display_name.trim(),
         llm_model: data.llm_model.trim(),
         type: data.type,
+        model_type: data.model_type,
         parameters: Object.keys(cleanedParams).length > 0 ? cleanedParams : null,
       };
 
@@ -244,6 +248,7 @@ const LLMInferenceConfigDetail: React.FC = () => {
                         display_name: config.display_name,
                         llm_model: config.llm_model,
                         type: config.type,
+                        model_type: (config.model_type as 'llm' | 'embedding') || 'llm',
                         api_key: '',
                         base_url: config.base_url || '',
                         parameters: mergedParams,
@@ -369,6 +374,28 @@ const LLMInferenceConfigDetail: React.FC = () => {
                       )}
                     />
                   )}
+
+                  <FormField
+                    control={form.control}
+                    name="model_type"
+                    render={({ field }) => (
+                      <FormItem>
+                        <FormLabel>Model Type</FormLabel>
+                        <Select onValueChange={field.onChange} value={field.value} disabled={!editing}>
+                          <FormControl>
+                            <SelectTrigger>
+                              <SelectValue placeholder="Select model type" />
+                            </SelectTrigger>
+                          </FormControl>
+                          <SelectContent>
+                            <SelectItem value="llm">LLM</SelectItem>
+                            <SelectItem value="embedding">Embedding</SelectItem>
+                          </SelectContent>
+                        </Select>
+                        <FormMessage />
+                      </FormItem>
+                    )}
+                  />
                 </div>
               </form>
             </Form>

diff --git a/wavefront/client/src/types/llm-inference-config.ts b/wavefront/client/src/types/llm-inference-config.ts
@@ -7,6 +7,7 @@ export interface LLMInferenceConfig {
   llm_model: string;
   display_name: string;
   type: InferenceEngineType;
+  model_type?: string;
   base_url?: string;
   parameters?: Record<string, any> | null;
   is_deleted: boolean;
@@ -19,6 +20,7 @@ export interface CreateLLMConfigRequest {
   display_name: string;
   api_key?: string;
   type: InferenceEngineType;
+  model_type?: string;
   base_url?: string;
   parameters?: Record<string, any> | null;
 }
@@ -28,6 +30,7 @@ export interface UpdateLLMConfigRequest {
   display_name?: string;
   api_key?: string | null;
   type?: InferenceEngineType;
+  model_type?: string;
   base_url?: string | null;
   parameters?: Record<string, any> | null;
 }

diff --git a/wavefront/server/background_jobs/rag_ingestion/rag_ingestion/models/doc_content.py b/wavefront/server/background_jobs/rag_ingestion/rag_ingestion/models/doc_content.py
@@ -1,10 +1,11 @@
 from dataclasses import dataclass
 from typing import Union
+from rag_ingestion.processors.file_processor import DocumentType
 
 
 @dataclass
 class DocContent:
     """Model representing the extracted content from a document file"""
 
     content: Union[str, bytes]
-    parse_type: str
+    document_type: DocumentType
diff --git a/wavefront/server/background_jobs/rag_ingestion/rag_ingestion/processors/file_processor.py b/wavefront/server/background_jobs/rag_ingestion/rag_ingestion/processors/file_processor.py
@@ -1,48 +1,94 @@
 import os
 import tempfile
 import textract
-from typing import Union
+from typing import Tuple
+from enum import Enum
+from common_module.log.logger import logger
 
 
-class FileProcessor:
-    def process_file(self, file_content: bytes, file_type: str) -> Union[str, bytes]:
-        mime_type = file_type
+class DocumentType(Enum):
+    """Document categories that a MIME type can be classified into."""
+
+    PDF = 'pdf'
+    IMAGE = 'image'
+    TEXT = 'text'
 
-        if mime_type.startswith('text/plain'):
-            return file_content.decode('utf-8')
 
-        if mime_type.startswith('image/'):
-            return file_content
+class FileProcessor:
+    """Classifies a file by MIME type and extracts its content."""
+
+    def process_file(
+        self, file_content: bytes, file_type: str
+    ) -> Tuple[str | bytes, DocumentType]:
+        """
+        Extract the content of a file according to its MIME type.
+
+        Args:
+            file_content: Raw bytes of the file.
+            file_type: MIME type of the file, e.g. 'application/pdf'.
+
+        Returns:
+            A (content, document_type) tuple: decoded UTF-8 text for plain
+            text, the untouched bytes for images, and the text extracted by
+            textract for PDFs.
+
+        Raises:
+            ValueError: If the MIME type is not supported.
+            UnicodeDecodeError: If plain-text content is not valid UTF-8.
+            RuntimeError: If text extraction from a PDF fails.
+        """
+        mime_type = file_type
+        document_type = self.extract_document_type(mime_type)
+        if document_type == DocumentType.TEXT:
+            return file_content.decode('utf-8'), DocumentType.TEXT
 
-        if mime_type.startswith('application/'):
-            try:
-                sub_type = mime_type.split('/')[1]
-            except IndexError:
-                raise ValueError(
-                    f'Unsupported file type: Malformed MIME type "{mime_type}"'
-                )
+        if document_type == DocumentType.IMAGE:
+            return file_content, DocumentType.IMAGE
 
+        if document_type == DocumentType.PDF:
             # Set delete=False to keep the file until we manually call os.unlink
             with tempfile.NamedTemporaryFile(
-                mode='w+b', delete=False, suffix=f'.{sub_type}'
+                mode='w+b', delete=False, suffix='.pdf'
             ) as temp_file:
                 temp_file.write(file_content)
-                temp_file.flush()  # Ensure data is written to disk before processing
+                temp_file.flush()
                 temp_file_path = temp_file.name
 
             try:
-                # Process the file using its path
                 text_content = textract.process(
                     temp_file_path, method='pdfminer'
                 ).decode('utf-8')
-                return text_content
+                return text_content, DocumentType.PDF
 
             except Exception as e:
-                # Re-raise processing errors
-                raise RuntimeError(f'Text extraction failed for {mime_type}: {e}')
+                logger.error(f'Text extraction failed for {mime_type}: {e}')
+                # Chain the cause so the original traceback is preserved.
+                raise RuntimeError(
+                    f'Text extraction failed for {mime_type}: {e}'
+                ) from e
 
             finally:
                 os.unlink(temp_file_path)
 
+        # Explicit raise to prevent implicit None return.
+        raise RuntimeError(f'Unsupported or unknown document type: {document_type}')
+
+    def extract_document_type(self, file_type: str) -> DocumentType:
+        """
+        Map a MIME type to a DocumentType.
+
+        The media type is compared case-insensitively and any parameters
+        (e.g. '; charset=utf-8') are ignored.
+
+        Raises:
+            ValueError: If the MIME type is not supported.
+        """
+        normalized = file_type.split(';', 1)[0].strip().lower()
+        if normalized.startswith('text/plain'):
+            return DocumentType.TEXT
+        if normalized.startswith('image/'):
+            return DocumentType.IMAGE
+        if normalized in ('application/pdf', 'application/x-pdf'):
+            return DocumentType.PDF
         else:
-            raise ValueError(f'Unsupported file type: {mime_type}')
+            raise ValueError(f'Unsupported file type: {file_type}')
diff --git a/...ont/server/background_jobs/rag_ingestion/rag_ingestion/processors/kb_storage_processor.py b/...ont/server/background_jobs/rag_ingestion/rag_ingestion/processors/kb_storage_processor.py
@@ -1,14 +1,14 @@
 from flo_cloud.cloud_storage import CloudStorageManager
 from dataclasses import dataclass
-from typing import List, Union
+from typing import List
 from flo_utils.utils.log import logger
 from rag_ingestion.service.kb_rag_storage import KBRagStorage
 from rag_ingestion.embeddings.embed import EmbeddingFunc
 from rag_ingestion.models.doc_content import DocContent
 from rag_ingestion.stream.queue_message import QueueMessage
 from flo_cloud.kms import FloKmsService
 from flo_utils.streaming.message_processor import MessageProcessor, ProcessingResult
-from rag_ingestion.processors.file_processor import FileProcessor
+from rag_ingestion.processors.file_processor import FileProcessor, DocumentType
 from rag_ingestion.embeddings.image_embed import ImageEmbedding
 from rag_ingestion.models.knowledge_base_embeddings import KnowledgeBaseEmbeddingObject
 from rag_ingestion.models.rag_message import RagEventMessage
@@ -20,7 +20,7 @@ class KbStorageInsights:
     doc_id: str
     doc_content: DocContent
     kb_id: str
-    file_type: str
+    file_type: DocumentType
 
 
 class KbStorageProcessor(MessageProcessor):
@@ -36,7 +36,7 @@ def __init__(
         self.file_processor = FileProcessor()
         self.image_embedding = ImageEmbedding()
 
-    async def _extract_text_from_message(
+    async def _extract_content(
         self, message: QueueMessage, file_content: bytes
     ) -> DocContent:
         """
@@ -49,12 +49,10 @@ async def _extract_text_from_message(
         Returns:
-            A DocContent object with extracted content and parse_type.
+            A DocContent object with extracted content and document_type.
         """
-        if message.parse_type != 'kb_insertion':
-            return DocContent(content='', parse_type=message.parse_type)
-        content: Union[str, bytes] = self.file_processor.process_file(
+        (content, document_type) = self.file_processor.process_file(
             file_content, str(message.file_type)
         )
-        return DocContent(content=content, parse_type=message.parse_type)
+        return DocContent(content=content, document_type=document_type)
 
     def __insert_kb_from_message(
         self, insights: List[ProcessingResult[KbStorageInsights]]
@@ -74,27 +72,29 @@ def __insert_kb_from_message(
             for kb_insight in insights:
                 kb_id = kb_insight.insights.kb_id
                 doc_id = kb_insight.insights.doc_id
-                file_type = kb_insight.insights.file_type
+                document_type = kb_insight.insights.doc_content.document_type
 
                 logger.info('Embeddings storing process is started')
-                if file_type and file_type.lower() in ('pdf', 'application/pdf'):
+                if (
+                    document_type == DocumentType.PDF
+                    or document_type == DocumentType.TEXT
+                ):
                     extracted_docs = [kb_insight.insights.doc_content.content]
                     docs: List[KnowledgeBaseEmbeddingObject] = (
                         self.kb_rag_storage.process_document(extracted_docs)
                     )
-                else:
+                elif document_type == DocumentType.IMAGE:
                     image_data = [kb_insight.insights.doc_content.content]
                     docs: List[KnowledgeBaseEmbeddingObject] = [
                         self.image_embedding.embed_image(image_data)
                         for image_data in image_data
                     ]
-
                 embeddings.append(
                     EmbeddingsToStore(
                         kb_embeddings=docs,
                         doc_id=doc_id,
                         kb_id=kb_id,
-                        file_type=file_type,
+                        file_type=document_type,
                     )
                 )
 
@@ -126,14 +126,14 @@ async def process(
             if self.encryption_service
             else file_content_encrypt
         )
-        doc_content = await self._extract_text_from_message(message, file_content)
+        doc_content = await self._extract_content(message, file_content)
         return ProcessingResult[KbStorageInsights](
             success=True,
             insights=KbStorageInsights(
                 doc_id=message.doc_id,
                 doc_content=doc_content,
                 kb_id=message.kb_id,
-                file_type=message.file_type,
+                file_type=doc_content.document_type,
             ),
         )
 

diff --git a/wavefront/server/background_jobs/rag_ingestion/rag_ingestion/service/kb_rag_storage.py b/wavefront/server/background_jobs/rag_ingestion/rag_ingestion/service/kb_rag_storage.py
@@ -1,29 +1,30 @@
-from typing import Any, List, Dict, Tuple, Optional
 import logging
-import numpy as np
 import tiktoken
-from datetime import datetime
 import uuid
-from rag_ingestion.embeddings.embed import EmbeddingFunc
 import httpx
 import time
+import ast
+import numpy as np
+from flo_utils.utils.log import logger
+from datetime import datetime
 from dataclasses import dataclass
 from rag_ingestion.env import FLOWARE_SERVICE_URL, APP_ENV, PASSTHROUGH_SECRET
 from rag_ingestion.constants.auth import RootfloHeaders
 from rag_ingestion.models.knowledge_base_embeddings import (
     KnowledgeBaseEmbeddingObject,
     RetrieveParams,
 )
-from flo_utils.utils.log import logger
-import ast
+from typing import Any, List, Dict, Tuple, Optional
+from rag_ingestion.embeddings.embed import EmbeddingFunc
+from rag_ingestion.processors.file_processor import DocumentType
 
 
 @dataclass
 class EmbeddingsToStore:
     kb_embeddings: List[KnowledgeBaseEmbeddingObject]
     doc_id: str
     kb_id: str
-    file_type: str
+    file_type: DocumentType
 
 
 class KBRagStorage: