Starting to work again

This commit is contained in:
James Ketr 2025-04-29 01:28:48 -07:00
parent dc55196311
commit 5806563777
8 changed files with 339 additions and 186 deletions

View File

@@ -24,6 +24,23 @@ interface ConversationHandle {
submitQuery: (query: string) => void;
}
interface BackstoryMessage {
prompt: string;
preamble: string;
content: string;
response: string;
metadata: {
rag: { documents: [] };
tools: string[];
eval_count: number;
eval_duration: number;
prompt_eval_count: number;
prompt_eval_duration: number;
};
actions: string[];
timestamp: string;
};
interface ConversationProps {
className?: string, // Override default className
type: ConversationMode, // Type of Conversation chat
@@ -168,7 +185,33 @@ const Conversation = forwardRef<ConversationHandle, ConversationProps>(({
setNoInteractions(true);
} else {
console.log(`History returned for ${type} from server with ${messages.length} entries:`, messages)
setConversation(messages);
const backstoryMessages: BackstoryMessage[] = messages;
// type MessageData = {
// role: MessageRoles,
// content: string,
// disableCopy?: boolean,
// user?: string,
// title?: string,
// origin?: string,
// display?: string, /* Messages generated on the server for filler should not be shown */
// id?: string,
// isProcessing?: boolean,
// metadata?: MessageMetaData
// };
setConversation(backstoryMessages.flatMap((message: BackstoryMessage) => [{
role: 'user',
content: message.prompt || "",
}, {
role: 'assistant',
prompt: message.prompt || "",
preamble: message.preamble || "",
full_content: message.content || "",
content: message.response || "",
metadata: message.metadata,
actions: message.actions,
}] as MessageList));
setNoInteractions(false);
}
setProcessingMessage(undefined);
@@ -372,10 +415,20 @@ const Conversation = forwardRef<ConversationHandle, ConversationProps>(({
update.message = onResponse(update.message);
}
setProcessingMessage(undefined);
const backstoryMessage: BackstoryMessage = update.message;
setConversation([
...conversationRef.current, {
role: 'user',
content: backstoryMessage.prompt || "",
}, {
role: 'assistant',
prompt: backstoryMessage.prompt || "",
preamble: backstoryMessage.preamble || "",
full_content: backstoryMessage.content || "",
content: backstoryMessage.response || "",
metadata: backstoryMessage.metadata,
actions: backstoryMessage.actions,
}] as MessageList);
// Add a small delay to ensure React has time to update the UI
await new Promise(resolve => setTimeout(resolve, 0));
@@ -414,10 +467,20 @@ const Conversation = forwardRef<ConversationHandle, ConversationProps>(({
update.message = onResponse(update.message);
}
setProcessingMessage(undefined);
const backstoryMessage: BackstoryMessage = update.message;
setConversation([
...conversationRef.current, {
role: 'user',
content: backstoryMessage.prompt || "",
}, {
role: 'assistant',
prompt: backstoryMessage.prompt || "",
preamble: backstoryMessage.preamble || "",
full_content: backstoryMessage.content || "",
content: backstoryMessage.response || "",
metadata: backstoryMessage.metadata,
actions: backstoryMessage.actions,
}] as MessageList);
}
} catch (e) {
setSnack("Error processing query", "error")

View File

@@ -224,8 +224,7 @@ const MessageMeta = (props: MessageMetaProps) => {
<AccordionDetails>
{Object.entries(props.messageProps.message)
.filter(([key, value]) => key !== undefined && value !== undefined)
.map(([key, value]) => (typeof (value) !== "string" || value?.trim() !== "") &&
{(typeof (value) !== "string" || value?.trim() !== "") &&
<Accordion key={key}>
<AccordionSummary sx={{ fontSize: "1rem", fontWeight: "bold" }} expandIcon={<ExpandMoreIcon />}>
{key}
@@ -235,7 +234,7 @@ const MessageMeta = (props: MessageMetaProps) => {
Object.entries(value)
.filter(([key, value]) => key !== undefined && value !== undefined)
.map(([key, value]) => (
<Accordion key={`metadata.${key}`}>
<AccordionSummary sx={{ fontSize: "1rem", fontWeight: "bold" }} expandIcon={<ExpandMoreIcon />}>
{key}
</AccordionSummary>
@@ -249,9 +248,6 @@ const MessageMeta = (props: MessageMetaProps) => {
}
</AccordionDetails>
</Accordion>
}
</>
)
)}
</AccordionDetails>
</Accordion>

src/kill-server.sh Executable file (57 lines)
View File

@@ -0,0 +1,57 @@
#!/bin/bash
# Ensure input was provided
if [[ -z "$1" ]]; then
echo "Usage: $0 <path/to/python_script.py>"
exit 1
fi
# Resolve user-supplied path to absolute path
TARGET=$(readlink -f "$1")
if [[ ! -f "$TARGET" ]]; then
echo "Target file '$TARGET' not found."
exit 1
fi
# Loop through python processes and resolve each script path
PID=""
for pid in $(pgrep -f python); do
if [[ -r "/proc/$pid/cmdline" ]]; then
# Get the full command line (null bytes replaced with spaces)
cmdline=$(tr '\0' ' ' < "/proc/$pid/cmdline")
# Extract the script argument (naively assumes it's the first non-option)
script_arg=$(echo "$cmdline" | awk '{for (i=2;i<=NF;i++) if ($i !~ /^-/) {print $i; exit}}')
# Try resolving the script path relative to the process's cwd
script_path=$(readlink -f "/proc/$pid/cwd/$script_arg" 2>/dev/null)
if [[ "$script_path" == "$TARGET" ]]; then
PID=$pid
break
fi
fi
done
if [[ -z "$PID" ]]; then
echo "No Python process found running '$TARGET'."
exit 1
fi
echo "Found process $PID running $TARGET"
# Get times
file_time=$(stat -c %Y "$TARGET")
proc_time=$(stat -c %Y "/proc/$PID")
# if (( file_time > proc_time )); then
# echo "Script '$TARGET' is newer than process $PID. Killing $PID"
kill -9 "$PID"
if [[ $? -ne 0 ]]; then
echo "Failed to kill process $PID."
exit 1
fi
echo "Process $PID killed."
# else
# echo "Script '$TARGET' is older than or same age as process $PID."
# fi

View File

@@ -44,7 +44,7 @@ from sklearn.preprocessing import MinMaxScaler
from utils import (
rag as Rag,
Context, Conversation, Session, Message, Chat, Resume, JobDescription, FactCheck,
defines
)
@@ -74,8 +74,8 @@ When answering queries, follow these steps:
- When both <|context|> and tool outputs are relevant, synthesize information from both sources to provide the most complete answer
- Always prioritize the most up-to-date and relevant information, whether it comes from <|context|> or tools
- If <|context|> and tool outputs contain conflicting information, prefer the tool outputs as they likely represent more current data
- If there is information in the <|context|> or <|job_description|> sections to enhance the answer, incorporate it seamlessly and refer to it as 'the latest information' or 'recent data' instead of mentioning '<|context|>' (etc.) or quoting it directly.
- Avoid phrases like 'According to the <|context|>' or similar references to the <|context|> or <|job_description|> tags.
Always use tools and <|context|> when possible. Be concise, and never make up information. If you do not know the answer, say so.
"""
@@ -83,21 +83,21 @@ Always use tools and <|context|> when possible. Be concise, and never make up in
system_generate_resume = f"""
Launched on {DateTime()}.
You are a professional resume writer. Your task is to write a concise, polished, and tailored resume for a specific job based only on the individual's <|context|>.
When answering queries, follow these steps:
- You must not invent or assume any information not explicitly present in the <|context|>.
- Analyze the <|job_description|> to identify skills required for the job.
- Use the <|job_description|> provided to guide the focus, tone, and relevant skills or experience to highlight from the <|context|>.
- Identify and emphasize the experiences, achievements, and responsibilities from the <|context|> that best align with the <|job_description|>.
- Only provide information from <|context|> items if it is relevant to the <|job_description|>.
- Do not list skills from the <|job_description|> unless they also appear in the <|context|>.
- Do not include any information unless it is provided in the <|context|>.
- Use the <|context|> to create a polished, professional resume.
- Do not list any locations or mailing addresses in the resume.
- If there is information in the <|context|>, <|job_description|>, or <|resume|> sections to enhance the answer, incorporate it seamlessly and refer to it using natural language instead of mentioning '<|job_description|>' (etc.) or quoting it directly.
- Avoid phrases like 'According to the <|context|>' or similar references to the <|context|> or <|job_description|> tags.
- Ensure the language is clear, concise, and aligned with industry standards for professional resumes.
Structure the resume professionally with the following sections where applicable:
@@ -105,7 +105,7 @@ Structure the resume professionally with the following sections where applicable
* Name: Use full name
* Professional Summary: A 2-4 sentence overview tailored to the job.
* Skills: A bullet list of key skills derived from the work history and relevant to the job.
* Professional Experience: A detailed list of roles, achievements, and responsibilities from <|context|> that relate to the <|job_description|>.
* Education: Include only if available in the work history.
* Notes: Indicate the initial draft of the resume was generated using the Backstory application.
@@ -114,17 +114,27 @@ Structure the resume professionally with the following sections where applicable
system_fact_check = f"""
Launched on {DateTime()}.
You are a professional resume fact checker. Your task is to identify any inaccuracies in the <|resume|> based on the individual's <|context|>.
If there are inaccuracies, list them in a bullet point format.
When answering queries, follow these steps:
- You must not invent or assume any information not explicitly present in the <|context|>.
- Analyze the <|resume|> to identify any discrepancies or inaccuracies based on the <|context|>.
- If there is information in the <|context|>, <|job_description|>, or <|resume|> sections to enhance the answer, incorporate it seamlessly and refer to it using natural language instead of mentioning '<|job_description|>' (etc.) or quoting it directly.
- Avoid phrases like 'According to the <|context|>' or similar references to the <|context|>, <|job_description|>, or <|resume|> tags.
""".strip()
system_fact_check_QA = f"""
Launched on {DateTime()}.
You are a professional resume fact checker.
You are provided with a <|resume|> which you generated, the <|context|> you used to generate that <|resume|>, and a <|fact_check|> you produced when you analyzed the <|context|> against the <|resume|> to identify discrepancies.
Your task is to answer questions about the <|fact_check|> you generated based on the <|resume|> and <|context|>.
"""
system_job_description = f"""
Launched on {DateTime()}.
@@ -133,8 +143,8 @@ You are a hiring and job placing specialist. Your task is to answer questions about a job
When answering queries, follow these steps:
- Analyze the <|job_description|> to provide insights for the asked question.
- If any financial information is requested, be sure to account for inflation.
- If there is information in the <|context|>, <|job_description|>, or <|resume|> sections to enhance the answer, incorporate it seamlessly and refer to it using natural language instead of mentioning '<|job_description|>' (etc.) or quoting it directly.
- Avoid phrases like 'According to the <|context|>' or similar references to the <|context|>, <|job_description|>, or <|resume|> tags.
""".strip()
def get_installed_ram():
@@ -263,7 +273,7 @@ def setup_logging(level):
# %%
async def AnalyzeSite(llm, model: str, url : str, question : str):
"""
Fetches content from a URL, extracts the text, and uses Ollama to summarize it.
@@ -273,7 +283,6 @@ async def AnalyzeSite(url, question):
Returns:
str: A summary of the website content
"""
global model, client
try:
# Fetch the webpage
headers = {
@@ -308,7 +317,7 @@ async def AnalyzeSite(url, question):
# Generate summary using Ollama
prompt = f"CONTENTS:\n\n{text}\n\n{question}"
response = llm.generate(model=model,
system=f"You are given the contents of {url}. Answer the question about the contents",
prompt=prompt)
@@ -344,68 +353,6 @@ def find_summarize_tool(tools):
def llm_tools(tools):
return [tool for tool in tools if tool.get("enabled", False) == True]
# %%
async def handle_tool_calls(message):
"""
Process tool calls and yield status updates along the way.
The last yielded item will be a tuple containing (tool_result, tools_used).
"""
tools_used = []
all_responses = []
for i, tool_call in enumerate(message["tool_calls"]):
arguments = tool_call["function"]["arguments"]
tool = tool_call["function"]["name"]
# Yield status update before processing each tool
yield {"status": "processing", "message": f"Processing tool {i+1}/{len(message['tool_calls'])}: {tool}..."}
# Process the tool based on its type
match tool:
case "TickerValue":
ticker = arguments.get("ticker")
if not ticker:
ret = None
else:
ret = TickerValue(ticker)
tools_used.append({ "tool": f"{tool}({ticker})", "result": ret})
case "AnalyzeSite":
url = arguments.get("url")
question = arguments.get("question", "what is the summary of this content?")
# Additional status update for long-running operations
yield {"status": "processing", "message": f"Retrieving and summarizing content from {url}..."}
ret = await AnalyzeSite(url, question)
tools_used.append({ "tool": f"{tool}('{url}', '{question}')", "result": ret })
case "DateTime":
tz = arguments.get("timezone")
ret = DateTime(tz)
tools_used.append({ "tool": f"{tool}('{tz}')", "result": ret })
case "WeatherForecast":
city = arguments.get("city")
state = arguments.get("state")
yield {"status": "processing", "message": f"Fetching weather data for {city}, {state}..."}
ret = WeatherForecast(city, state)
tools_used.append({ "tool": f"{tool}('{city}', '{state}')", "result": ret })
case _:
ret = None
# Build response for this tool
tool_response = {
"role": "tool",
"content": str(ret),
"name": tool_call["function"]["name"]
}
all_responses.append(tool_response)
# Yield the final result as the last item
final_result = all_responses[0] if len(all_responses) == 1 else all_responses
yield (final_result, tools_used)
@@ -562,11 +509,11 @@ class WebServer:
case "chat":
prompt = system_message
case "job_description":
prompt = system_generate_resume
case "resume":
prompt = system_generate_resume
case "fact_check":
prompt = system_message
session.system_prompt = prompt
response["system_prompt"] = { "system_prompt": prompt }
@@ -592,7 +539,7 @@ class WebServer:
if not tmp:
continue
logging.info(f"Resetting {reset_operation} for {mode}")
context.conversation = Conversation()
context.context_tokens = round(len(str(session.system_prompt)) * 3 / 4) # Estimate context usage
response["history"] = []
response["context_used"] = session.context_tokens
@@ -695,23 +642,27 @@ class WebServer:
@self.app.post("/api/chat/{context_id}/{session_type}")
async def post_chat_endpoint(context_id: str, session_type: str, request: Request):
logging.info(f"{request.method} {request.url.path}")
try:
if not is_valid_uuid(context_id):
logging.warning(f"Invalid context_id: {context_id}")
return JSONResponse({"error": "Invalid context_id"}, status_code=400)
context = self.upsert_context(context_id)
session = context.get_session(session_type)
if not session:
try:
session = context.create_session(session_type)
except Exception as e:
return JSONResponse({ "error": f"{session_type} is not recognized", "context": context.id }, status_code=404)
try:
data = await request.json()
session = context.get_session(session_type)
if not session and session_type == "job_description":
logging.info(f"Session {session_type} not found. Returning empty history.")
# Create a new session if it doesn't exist
session = context.get_or_create_session("job_description", system_prompt=system_generate_resume, job_description=data["content"])
except Exception as e:
logging.info(f"Attempt to create session type: {session_type} failed", e)
return JSONResponse({ "error": f"{session_type} is not recognized", "context": context.id }, status_code=404)
# Create a custom generator that ensures flushing
async def flush_generator():
async for message in self.generate_response(context=context, session=session, content=data["content"]):
# Convert to JSON and add newline
yield json.dumps(message) + "\n"
# Save the history as it's generated
@@ -729,6 +680,9 @@ class WebServer:
"X-Accel-Buffering": "no" # Prevents Nginx buffering if you're using it
}
)
except Exception as e:
logging.error(f"Error in post_chat_endpoint: {e}")
return JSONResponse({"error": str(e)}, status_code=500)
@self.app.post("/api/context") @self.app.post("/api/context")
async def create_context(): async def create_context():
@ -878,6 +832,69 @@ class WebServer:
ctx = round(context + len(str(messages)) * 3 / 4) ctx = round(context + len(str(messages)) * 3 / 4)
return max(defines.max_context, min(2048, ctx + ctx_buffer)) return max(defines.max_context, min(2048, ctx + ctx_buffer))
# %%
async def handle_tool_calls(self, message):
"""
Process tool calls and yield status updates along the way.
The last yielded item will be a tuple containing (tool_result, tools_used).
"""
tools_used = []
all_responses = []
for i, tool_call in enumerate(message["tool_calls"]):
arguments = tool_call["function"]["arguments"]
tool = tool_call["function"]["name"]
# Yield status update before processing each tool
yield {"status": "processing", "message": f"Processing tool {i+1}/{len(message['tool_calls'])}: {tool}..."}
# Process the tool based on its type
match tool:
case "TickerValue":
ticker = arguments.get("ticker")
if not ticker:
ret = None
else:
ret = TickerValue(ticker)
tools_used.append({ "tool": f"{tool}({ticker})", "result": ret})
case "AnalyzeSite":
url = arguments.get("url")
question = arguments.get("question", "what is the summary of this content?")
# Additional status update for long-running operations
yield {"status": "processing", "message": f"Retrieving and summarizing content from {url}..."}
ret = await AnalyzeSite(llm=self.llm, model=self.model, url=url, question=question)
tools_used.append({ "tool": f"{tool}('{url}', '{question}')", "result": ret })
case "DateTime":
tz = arguments.get("timezone")
ret = DateTime(tz)
tools_used.append({ "tool": f"{tool}('{tz}')", "result": ret })
case "WeatherForecast":
city = arguments.get("city")
state = arguments.get("state")
yield {"status": "processing", "message": f"Fetching weather data for {city}, {state}..."}
ret = WeatherForecast(city, state)
tools_used.append({ "tool": f"{tool}('{city}', '{state}')", "result": ret })
case _:
ret = None
# Build response for this tool
tool_response = {
"role": "tool",
"content": str(ret),
"name": tool_call["function"]["name"]
}
all_responses.append(tool_response)
# Yield the final result as the last item
final_result = all_responses[0] if len(all_responses) == 1 else all_responses
yield (final_result, tools_used)
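For reference, a minimal sketch of how a caller can consume this generator per the docstring's contract (hypothetical driver code, not part of the commit): status dicts stream out first, and the final yield is the (tool_result, tools_used) tuple.
async def drive_tool_calls(server, tool_message):
    # Interim yields are status dicts; the final yield is (tool_result, tools_used).
    tool_result, tools_used = None, []
    async for item in server.handle_tool_calls(tool_message):
        if isinstance(item, tuple) and len(item) == 2:
            tool_result, tools_used = item
        else:
            print(item["message"])  # e.g. "Processing tool 1/2: TickerValue..."
    return tool_result, tools_used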
def upsert_context(self, context_id = None) -> Context:
"""
Upsert a context based on the provided context_id.
@@ -956,7 +973,7 @@ class WebServer:
# * First message sets Fact Check and is Q&A
# * Has content
# * Then Q&A of Fact Check
async def generate_response(self, context : Context, session : Session, content : str):
if not self.file_watcher:
return
@@ -967,21 +984,6 @@ class WebServer:
self.processing = True
# Check if the session_type is valid
if not context.is_valid_session_type(session_type):
yield {"status": "error", "message": f"Session type {session_type} is not invalid."}
self.processing = False
return
session = context.get_session(session_type)
if session is None:
session = context.create_session(session_type)
if session is None:
yield {"status": "error", "message": f"Session type {session_type} is not invalid."}
self.processing = False
return
conversation : Conversation = session.conversation
message = Message(prompt=content)
@@ -997,17 +999,18 @@ class WebServer:
enable_rag = False
# RAG is disabled when asking questions about the resume
if session.session_type == "resume":
enable_rag = False
# The first time through each session type, a content_seed may be set for
# future chat sessions; use it once, then clear it
message.preamble = session.get_and_reset_content_seed()
system_prompt = session.system_prompt
# After the first time a particular session type is used, it is handled as a chat.
# The number of messages indicating the session is ready for chat varies based on
# the type of session
process_type = session.session_type
match process_type:
case "job_description":
logging.info(f"job_description user_history len: {len(conversation.messages)}")
@@ -1029,8 +1032,7 @@ class WebServer:
self.processing = False
return
enable_tools = True
#enable_tools = True
# Generate RAG content if enabled, based on the content
rag_context = ""
@@ -1069,8 +1071,7 @@ Use that information to respond to:"""
Use that information to respond to:"""
# Use the mode specific system_prompt instead of 'chat'
system_prompt = session.system_prompt
#system_prompt = context.get_session(session_type).system_prompt
# On first entry, a single job_description is provided ("user")
# Generate a resume to append to RESUME history
@@ -1109,8 +1110,11 @@ Use that information to respond to:"""
<|job_description|>
{message.prompt}
"""
tmp = context.get_session("job_description")
if not tmp:
raise Exception(f"Job description session not found.")
# Set the content seed for the job_description session
tmp.set_content_seed(message.preamble + "<|question|>\nUse the above information to respond to this prompt: ")
message.preamble += f""" message.preamble += f"""
<|rules|> <|rules|>
@ -1118,24 +1122,30 @@ Use that information to respond to:"""
2. Do not use content from the <|job_description|> in the response unless the <|context|> or <|resume|> mentions them. 2. Do not use content from the <|job_description|> in the response unless the <|context|> or <|resume|> mentions them.
<|question|> <|question|>
Respond to the above information to respond to this prompt: " Use to the above information to respond to this prompt:
""" """
# For all future calls to job_description, use the system_job_description
session.system_prompt = system_job_description
# Seed the history for job_description
stuffingMessage = Message(prompt=message.prompt)
stuffingMessage.response = "Job description stored to use in future queries."
stuffingMessage.metadata["origin"] = "job_description"
stuffingMessage.metadata["display"] = "hide"
conversation.add_message(stuffingMessage)
# Strip out the 'display' key when adding to llm_history
message.add_action("generate_resume")
logging.info("TODO: Convert these to generators, eg generate_resume() and then manually add results into session'resume'")
logging.info("TODO: For subsequent runs, have the Session handler generate the follow up prompts so they can have correct context preamble")
# Switch to resume session for LLM responses
# message.metadata["origin"] = "resume"
# session = context.get_or_create_session("resume")
# system_prompt = session.system_prompt
# llm_history = session.llm_history = []
# user_history = session.user_history = []
# Ignore the passed in content and invoke Fact Check
case "resume":
@@ -1203,12 +1213,22 @@ Use the above <|resume|> and <|job_description|> to answer this query:
"role": "assistant", "content": "Resume fact checked.", "origin": "resume", "display": "hide"
} ]
# Do not add this to the LLM history; it is only used for UI presentation
stuffingMessage = Message(prompt="Fact check resume")
stuffingMessage.response = "Resume fact checked."
stuffingMessage.metadata["origin"] = "resume"
stuffingMessage.metadata["display"] = "hide"
stuffingMessage.actions = [ "fact_check" ]
logging.info("TODO: Switch this to use actions to keep the UI from showingit")
conversation.add_message(stuffingMessage)
# For all future calls to job_description, use the system_job_description
logging.info("TODO: Create a system_resume_QA prompt to use for the resume session")
session.system_prompt = system_prompt
# Switch to fact_check session for LLM responses
message.metadata["origin"] = "fact_check"
session = context.get_or_create_session("fact_check", system_prompt=system_fact_check)
system_prompt = session.system_prompt
llm_history = session.llm_history = []
user_history = session.user_history = []
@@ -1220,7 +1240,8 @@ Use the above <|resume|> and <|job_description|> to answer this query:
# user_history.append({"role": "user", "content": content, "origin": message.metadata["origin"]})
# message.metadata["full_query"] = llm_history[-1]["content"]
# Uses cached system_prompt as session.system_prompt may have been updated for follow up questions
messages = create_system_message(system_prompt)
if context.message_history_length:
to_add = conversation.messages[-context.message_history_length:]
else:
@@ -1233,18 +1254,30 @@ Use the above <|resume|> and <|job_description|> to answer this query:
"role": "assistant",
"content": m.response,
} ])
message.content = message.preamble + message.prompt
# To send to the LLM
messages.append({
"role": "user",
"content": message.content
})
# Add the system message to the beginning of the messages list
message.content = f"""
<|system_prompt|>
{system_prompt}
{message.preamble}
{message.prompt}"""
# Estimate token length of new messages
ctx_size = self.get_optimal_ctx_size(context.get_or_create_session(process_type).context_tokens, messages=message.prompt)
if len(conversation.messages) > 2:
processing_message = f"Processing {'RAG augmented ' if enable_rag else ''}query..."
else:
match session.session_type:
case "job_description":
processing_message = f"Generating {'RAG augmented ' if enable_rag else ''}resume..."
case "resume":
@@ -1283,7 +1316,7 @@ Use the above <|resume|> and <|job_description|> to answer this query:
tool_result = None
# Process all yielded items from the handler
async for item in self.handle_tool_calls(tool_message):
if isinstance(item, tuple) and len(item) == 2:
# This is the final result tuple (tool_result, tools_used)
tool_result, tools_used = item
@@ -1326,7 +1359,7 @@ Use the above <|resume|> and <|job_description|> to answer this query:
reply = response["message"]["content"]
message.response = reply
message.metadata["origin"] = session.session_type
# final_message = {"role": "assistant", "content": reply }
# # history is provided to the LLM and should not have additional metadata
@@ -1341,9 +1374,7 @@ Use the above <|resume|> and <|job_description|> to answer this query:
yield {
"status": "done",
"message": {
**message.model_dump(mode='json'),
"content": message.response,
"metadata": message.metadata
}
}

View File

@@ -54,7 +54,7 @@ class Context(BaseModel):
# Find the matching subclass
for session_cls in Session.__subclasses__():
if session_cls.model_fields["session_type"].default == session_type:
# Create the session instance with provided kwargs
session = session_cls(session_type=session_type, **kwargs)
self.sessions.append(session)
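This lookup relies on each concrete Session subclass narrowing the session_type Literal and giving it a default; a minimal sketch of that pattern, assuming pydantic v2 (ResumeSession is a hypothetical example, not a class from this commit):
from typing import Literal
from pydantic import BaseModel

class Session(BaseModel):
    session_type: Literal["resume", "job_description", "fact_check", "chat"]
    system_prompt: str

class ResumeSession(Session):
    # create_session finds this class by comparing
    # model_fields["session_type"].default against the requested type.
    session_type: Literal["resume"] = "resume"
    system_prompt: str = "You are a professional resume writer."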

View File

@@ -1,6 +1,5 @@
from pydantic import BaseModel
from typing import List
from datetime import datetime, timezone
from .message import Message

class Conversation(BaseModel):

View File

@@ -18,6 +18,13 @@ class Message(BaseModel):
actions: List[str] = []
timestamp: datetime = datetime.now(timezone.utc)
def add_action(self, action: str | list[str]) -> None:
"""Add an action (or list of actions) to the message."""
if isinstance(action, str):
self.actions.append(action)
else:
self.actions.extend(action)
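Usage is then the same for a single action or a list (illustrative, hypothetical action names):
msg = Message(prompt="Generate a resume")
msg.add_action("generate_resume")           # append one action
msg.add_action(["fact_check", "render"])    # extend with several; names are hypothetical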
def get_summary(self) -> str:
"""Return a summary of the message."""
response_summary = (

View File

@@ -4,7 +4,7 @@ from .conversation import Conversation
class Session(BaseModel):
session_type: Literal["resume", "job_description", "fact_check", "chat"]
system_prompt: str # Mandatory
conversation: Conversation = Conversation()
context_tokens: int = 0