About to trounce on system prompt
This commit is contained in:
parent 538caba9f4
commit bcb1e866cb
@ -5,8 +5,7 @@ Backstory is an AI Resume agent that provides context into a diverse career narr
* WIP: Through the use of several custom Language Processing Modules (LPM), develop a comprehensive set of test and validation data based on the input documents. While manual review of content should be performed to ensure accuracy, the LPM employs several LLM techniques to isolate and remove hallucinations and inaccuracies in the test and validation data.
* WIP: Utilizing quantized low-rank adaptation (QLoRA) and parameter-efficient fine-tuning (PEFT), provide a hyperparameter-tuned and customized LLM for use in chat and content creation scenarios with expert knowledge about the individual (a sketch of this step follows the list).
* Post-training, utilize additional RAG content to further enhance the information domain used in conversations and content generation.
* An integrated document publishing workflow that will transform a "Job Description" into a customized "Resume" for the person the LLM has been trained on.
* "Fact Check" the resulting resume against the RAG content directly provided by the user in order to remove hallucinations.
* An integrated document publishing workflow that will transform a "Job Description" into a customized "Resume" for the person the LLM has been trained on, incorporating a multi-stage "Fact Check" to reduce hallucination.
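The QLoRA/PEFT step above can be pictured with a short sketch. This is a minimal, illustrative setup using Hugging Face `transformers`, `bitsandbytes`, and `peft`; the base model name and every hyperparameter here are assumptions for the sketch, not Backstory's actual training configuration.

```python
# Hypothetical QLoRA + PEFT setup (illustrative hyperparameters).
import torch
from transformers import AutoModelForCausalLM, BitsAndBytesConfig
from peft import LoraConfig, get_peft_model, prepare_model_for_kbit_training

bnb_config = BitsAndBytesConfig(
    load_in_4bit=True,                       # quantize base weights: the "Q" in QLoRA
    bnb_4bit_quant_type="nf4",
    bnb_4bit_compute_dtype=torch.bfloat16,
)
model = AutoModelForCausalLM.from_pretrained(
    "Qwen/Qwen2.5-7B-Instruct",              # assumed base model
    quantization_config=bnb_config,
    device_map="auto",
)
model = prepare_model_for_kbit_training(model)

lora_config = LoraConfig(
    r=16, lora_alpha=32, lora_dropout=0.05,  # low-rank adapter hyperparameters
    target_modules=["q_proj", "k_proj", "v_proj", "o_proj"],
    task_type="CAUSAL_LM",
)
model = get_peft_model(model, lora_config)   # only the adapter weights train
model.print_trainable_parameters()
```

Training would then proceed with a standard supervised fine-tuning loop over the validated data produced by the LPM step.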
While it can run a variety of LLMs, Backstory is currently running Qwen2.5:7b. In addition to the standard model, the chat pipeline exposes several utility tools the LLM can call to obtain real-time data.
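As an illustration of how such a tool might be exposed, here is a minimal sketch; the tool name, schema shape, and dispatch table are assumptions for the example, not Backstory's actual tool registry.

```python
# Hypothetical real-time utility tool and its schema (illustrative only).
import datetime

def get_current_datetime() -> str:
    """Return the current date and time as an ISO-8601 string."""
    return datetime.datetime.now().isoformat()

# OpenAI-style tool schema passed to the model alongside the conversation.
TOOLS = [{
    "type": "function",
    "function": {
        "name": "get_current_datetime",
        "description": "Get the current date and time.",
        "parameters": {"type": "object", "properties": {}},
    },
}]

# When the model emits a tool call, the pipeline looks up the matching
# Python function, runs it, and feeds the result back for the next turn.
DISPATCH = {"get_current_datetime": get_current_datetime}
```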
@ -20,7 +19,7 @@ Before you spend too much time learning how to customize Backstory, you may want
The `./docs` directory has been seeded with an AI-generated persona. That directory is only used during development; actual content should be put into the `./docs-prod` directory.

Launching with the defaults, you can ask things like `Who is Eliza Morgan?`
Launching with the defaults (which includes the AI-generated persona), you can ask things like `Who is Eliza Morgan?`

If you want to seed your own data:
@ -22,22 +22,26 @@ flowchart TD
A1[Job Description Input] --> A2[Job Analysis LLM]
A2 --> A3[Job Requirements JSON]
end

subgraph "Stage 1B: Candidate Analysis"
B1[Resume & Context Input] --> B2[Candidate Analysis LLM]
B2 --> B3[Candidate Qualifications JSON]
B1[Resume Input] --> B5[Candidate Analysis LLM]
B5 --> B4[Candidate Qualifications JSON]
B2[Candidate Info] --> B3[RAG]
B3[RAG] --> B2[Candidate Info]
A3[Job Requirements JSON] --> B3[RAG]
B3[RAG] --> B5
end

subgraph "Stage 1C: Mapping Analysis"
C1[Job Requirements JSON] --> C2[Candidate Qualifications JSON]
C2 --> C3[Mapping Analysis LLM]
C1[Job Requirements JSON] --> C3[Mapping Analysis LLM]
C2[Candidate Qualifications JSON] --> C3
C3 --> C4[Skills Mapping JSON]
end
end

subgraph "Stage 2: Resume Generation"
D1[Skills Mapping JSON] --> D2[Original Resume Reference]
D2 --> D3[Resume Generation LLM]
D1[Skills Mapping JSON] --> D3[Resume Generation LLM]
D2[Original Resume Reference] --> D3
D3 --> D4[Tailored Resume Draft]
end

@ -52,12 +56,13 @@ flowchart TD
end

A3 --> C1
B3 --> C2
B4 --> C2
C4 --> D1
C4 --> E1
D4 --> E3

style A2 fill:#f9d77e,stroke:#333,stroke-width:2px
style B2 fill:#f9d77e,stroke:#333,stroke-width:2px
style B5 fill:#f9d77e,stroke:#333,stroke-width:2px
style C3 fill:#f9d77e,stroke:#333,stroke-width:2px
style D3 fill:#f9d77e,stroke:#333,stroke-width:2px
style E4 fill:#f9d77e,stroke:#333,stroke-width:2px
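Read top to bottom, the diagram is a staged pipeline: job analysis, RAG-augmented candidate analysis, skills mapping, generation, then verification. A minimal orchestration sketch follows; every function here is a hypothetical stand-in for the corresponding LLM call in the agent code further down.

```python
# Illustrative chaining of the flowchart stages; each stage function is a
# placeholder stand-in, not the project's real API.
import asyncio

async def analyze_job(job_description: str) -> dict:
    return {"technical_skills": {"required": ["python"]}}   # placeholder output

async def analyze_candidate(resume: str, job_requirements: dict) -> dict:
    return {"skills": ["python"]}                           # placeholder output

async def map_skills(job_requirements: dict, qualifications: dict) -> dict:
    return {"mapping": "..."}                               # placeholder output

async def generate_resume(skills_mapping: dict, resume: str) -> str:
    return resume                                           # placeholder output

async def verify_resume(draft: str, qualifications: dict) -> str:
    return draft                                            # placeholder output

async def build_tailored_resume(job_description: str, resume: str) -> str:
    job_requirements = await analyze_job(job_description)                # Stage 1A
    qualifications = await analyze_candidate(resume, job_requirements)   # Stage 1B
    skills_mapping = await map_skills(job_requirements, qualifications)  # Stage 1C
    draft = await generate_resume(skills_mapping, resume)                # Stage 2
    return await verify_resume(draft, qualifications)                    # Verification

print(asyncio.run(build_tailored_resume("...", "...")))
```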
@ -15,7 +15,6 @@ import Box from '@mui/material/Box';
import CssBaseline from '@mui/material/CssBaseline';
import MenuIcon from '@mui/icons-material/Menu';

import { Snack, SeverityType } from './Snack';
import { ConversationHandle } from './Conversation';
import { QueryOptions } from './ChatQuery';
@ -116,8 +115,8 @@ const App = () => {
        children: <AboutPage {...{ sessionId, setSnack, submitQuery: handleSubmitChatQuery, route: subRoute, setRoute: setSubRoute }} />
    };

    const settingsTab: BackstoryTabProps = {
        path: "settings",
    const controlsTab: BackstoryTabProps = {
        path: "controls",
        tabProps: {
            sx: { flexShrink: 1, flexGrow: 0, fontSize: '1rem' },
            icon: <SettingsIcon />
@ -145,7 +144,7 @@ const App = () => {
        resumeBuilderTab,
        contextVisualizerTab,
        aboutTab,
        settingsTab,
        controlsTab,
    ];
    }, [sessionId, setSnack, subRoute]);

@ -214,7 +213,7 @@ const App = () => {
    const path_session = pathParts.length < 2 ? pathParts[0] : pathParts[1];
    if (!isValidUUIDv4(path_session)) {
        console.log(`Invalid session id ${path_session}-- creating new session`);
        fetchSession([pathParts[0]]);
        fetchSession();
    } else {
        let tabIndex = tabs.findIndex((tab) => tab.path === currentPath);
        if (-1 === tabIndex) {
@ -84,7 +84,8 @@ const ResumeBuilderPage: React.FC<BackstoryPageProps> = ({
    }

    /* Filter out the 2nd and 3rd (0-based) */
    const filtered = messages.filter((m, i) => i !== 1 && i !== 2);
    const filtered = messages;//.filter((m, i) => i !== 1 && i !== 2);
    console.warn("Set filtering back on");

    return filtered;
}, [setHasResume, setHasFacts]);
@ -166,9 +166,9 @@ class JobDescription(Agent):
        if not self.context:
            raise ValueError("Context is not set for this agent.")

        async for message in super().prepare_message(message):
            if message.status != "done":
                yield message
        # async for message in super().prepare_message(message):
        #     if message.status != "done":
        #         yield message
        # Always add the job description, user resume, and question
        message.preamble["job_description"] = self.job_description
        message.preamble["resume"] = self.context.user_resume
@ -185,11 +185,47 @@ class JobDescription(Agent):
        original_prompt = message.prompt

        async for message in super().process_message(llm=llm, model=model, message=message):
            if message.status != "done":
        logger.info("TODO: Implement delay queuing; busy for same agent, otherwise return queue size and estimated wait time")
        spinner: List[str] = ['\\', '|', '/', '-']
        tick: int = 0
        while self.context.processing:
            message.status = "waiting"
            message.response = f"Busy processing another request. Please wait. {spinner[tick]}"
            tick = (tick + 1) % len(spinner)
            yield message
            if message.status == "error":
                return
            await asyncio.sleep(1)  # Allow the event loop to process the write

        self.context.processing = True

        original_message = message.model_copy()

        self.llm = llm
        self.model = model
        self.metrics.generate_count.labels(agent=self.agent_type).inc()
        with self.metrics.generate_duration.labels(agent=self.agent_type).time():
            job_description = message.preamble["job_description"]
            resume = message.preamble["resume"]

            try:
                async for message in self.generate_factual_tailored_resume(message=message, job_description=job_description, resume=resume):
                    if message.status != "done":
                        yield message
                message.prompt = original_message.prompt
                yield message

            except Exception as e:
                message.status = "error"
                logger.error(message.response)
                message.response = f"Error in resume generation process: {str(e)}"
                logger.error(message.response)
                logger.error(traceback.format_exc())
                yield message
                return

        # Done processing, add message to conversation
        message.status = "done"
        self.conversation.add(message)
        self.context.processing = False

        # Add the "Job requirements" message
        if "generate_factual_tailored_resume" in message.metadata and "job_requirements" in message.metadata["generate_factual_tailored_resume"]:
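A brief aside on the polling loop above: the `context.processing` flag implements a single-flight guard by busy-waiting with a spinner. For comparison only, here is a minimal sketch of the same idea using an `asyncio.Lock`; this is not the project's code.

```python
# Single-flight guard sketch with asyncio primitives (illustrative only).
import asyncio

processing_lock = asyncio.Lock()

async def guarded(run):
    """Run one request at a time; later callers wait for the lock."""
    if processing_lock.locked():
        print("Busy processing another request. Please wait.")
    async with processing_lock:
        return await run()

async def demo():
    async def work():
        await asyncio.sleep(0.1)
        return "done"
    results = await asyncio.gather(guarded(work), guarded(work))
    print(results)

asyncio.run(demo())
```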
@ -964,7 +1000,115 @@ Based on the reference data above, please create a corrected version of the resu
        metadata["results"] = message.response
        yield message

    async def generate_factual_tailored_resume(self, message: Message, job_description: str, resume: str, additional_context: str = "") -> AsyncGenerator[Message, None]:
    def process_job_requirements(self, job_requirements: Dict[str, Any]) -> List[Dict[str, Any]]:
        """
        Process job requirements JSON, gather RAG documents using find_similar, remove duplicates,
        and return the top 20 results.

        Args:
            job_requirements: Dictionary containing job requirements. The retriever
                (with its find_similar method) is obtained from self.context.file_watcher.

        Returns:
            List of up to 20 ChromaDB documents, sorted by combined importance and similarity score.
        """
        if self.context is None or self.context.file_watcher is None:
            raise ValueError(f"context or file_watcher is None on {self.agent_type}")

        retriever = self.context.file_watcher
        # Importance weights for each category
        importance_weights = {
            ("technical_skills", "required"): 1.0,
            ("technical_skills", "preferred"): 0.8,
            ("experience_requirements", "required"): 0.95,
            ("experience_requirements", "preferred"): 0.75,
            ("education_requirements", ""): 0.7,
            ("soft_skills", ""): 0.6,
            ("industry_knowledge", ""): 0.65,
            ("responsibilities", ""): 0.85,
            ("company_values", ""): 0.5
        }

        # Store all RAG results with metadata
        all_results = []

        def traverse_requirements(data: Any, category: str = "", subcategory: str = ""):
            """
            Recursively traverse the job requirements and gather RAG documents.
            """
            if isinstance(data, dict):
                for key, value in data.items():
                    new_subcategory = key if category else ""
                    traverse_requirements(value, category or key, new_subcategory)
            elif isinstance(data, list):
                for item in data:
                    # Determine the weight key
                    weight_key = (category, subcategory) if subcategory else (category, "")
                    weight = importance_weights.get(weight_key, 0.5)  # Default weight

                    # Call find_similar for the item
                    try:
                        rag_results = retriever.find_similar(item, top_k=10, threshold=0.7)
                        # Process each result
                        for doc_id, content, distance, metadata in zip(
                            rag_results["ids"],
                            rag_results["documents"],
                            rag_results["distances"],
                            rag_results["metadatas"]
                        ):
                            # Convert cosine distance to similarity score (higher is better)
                            similarity_score = 1 - distance  # Cosine distance to similarity
                            all_results.append({
                                "id": doc_id,
                                "content": content,
                                "score": similarity_score,
                                "weight": weight,
                                "context": item,
                                "category": category,
                                "subcategory": subcategory,
                                "metadata": metadata
                            })
                    except Exception as e:
                        logger.error(f"Error processing context '{item}': {e}")

        # Start traversal
        traverse_requirements(job_requirements)

        # Remove duplicates based on document ID
        unique_results = []
        seen_ids = set()
        for result in all_results:
            if result["id"] not in seen_ids:
                seen_ids.add(result["id"])
                unique_results.append(result)

        # Sort by combined score (weight * similarity score)
        sorted_results = sorted(
            unique_results,
            key=lambda x: x["weight"] * x["score"],
            reverse=True
        )

        # Return top 20 results
        return sorted_results[:20]

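    # Illustrative input for process_job_requirements (hypothetical data, not
    # from the project): requirement items are traversed per category, each
    # find_similar hit is scored as weight * (1 - cosine_distance), duplicates
    # are dropped by document ID, and the top 20 remain. For example:
    #
    #   job_requirements = {
    #       "technical_skills": {"required": ["Python", "LLM fine-tuning"],
    #                            "preferred": ["RAG pipelines"]},
    #       "soft_skills": ["communication"],
    #   }
    #   docs = agent.process_job_requirements(job_requirements=job_requirements)
    #   # A "required" hit at distance 0.2 scores 1.0 * 0.8 = 0.80, while a
    #   # "preferred" hit at the same distance scores 0.8 * 0.8 = 0.64.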
    async def generate_rag_content(self, message: Message, job_requirements: Dict[str, Any]) -> AsyncGenerator[Message, None]:
        results = self.process_job_requirements(job_requirements=job_requirements)
        message.response = f"Retrieved {len(results)} documents:\n"
        for result in results:
            message.response += f"""
ID: {result['id']}, Context: {result['context']}, \
Category: {result['category']}/{result['subcategory']}, \
Similarity Score: {result['score']:.3f}, \
Combined Score: {result['weight'] * result['score']:.3f}, \
Content: {result['content']}
"""
        message.status = "done"
        yield message
        return

    async def generate_factual_tailored_resume(self, message: Message, job_description: str, resume: str) -> AsyncGenerator[Message, None]:
        """
        Main function to generate a factually accurate tailored resume.

@ -976,6 +1120,9 @@ Based on the reference data above, please create a corrected version of the resu
        Yields:
            Message updates; the final message carries the generated resume and supporting analysis
        """
        if self.context is None:
            raise ValueError(f"context is None in {self.agent_type}")

        message.status = "thinking"
        logger.info(message.response)
        yield message
@ -999,6 +1146,17 @@ Based on the reference data above, please create a corrected version of the resu
        message.response = "Multi-stage RAG resume generation process: Stage 1B: Analyzing candidate qualifications"
        logger.info(message.response)
        yield message

        async for message in self.generate_rag_content(message, job_requirements):
            if message.status != "done":
                yield message
        if message.status == "error":
            return

        yield message
        return

        additional_context = message.preamble["context"]
        metadata["analyze_candidate_qualifications"] = {
            "additional_context": additional_context
        }
@ -1122,37 +1280,6 @@ Based on the reference data above, please create a corrected version of the resu
        logger.info("Resume generation process completed successfully")
        return

    # Main orchestration function
    async def generate_llm_response(self, llm: Any, model: str, message: Message, temperature=0.7) -> AsyncGenerator[Message, None]:
        logger.info(f"{self.agent_type} - {inspect.stack()[0].function}")

        original_message = message.model_copy()

        self.llm = llm
        self.model = model
        self.metrics.generate_count.labels(agent=self.agent_type).inc()
        with self.metrics.generate_duration.labels(agent=self.agent_type).time():
            job_description = message.preamble["job_description"]
            resume = message.preamble["resume"]
            additional_context = message.preamble["context"]

            try:
                async for message in self.generate_factual_tailored_resume(message=message, job_description=job_description, resume=resume, additional_context=additional_context):
                    if message.status != "done":
                        yield message
                message.prompt = original_message.prompt
                yield message
                return
            except Exception as e:
                message.status = "error"
                logger.error(message.response)
                message.response = f"Error in resume generation process: {str(e)}"
                logger.error(message.response)
                logger.error(traceback.format_exc())
                yield message
                return


# Register the base agent