// goose/ui/desktop/src/hooks/useMessageStream.ts
import { useState, useCallback, useEffect, useRef, useId, useReducer } from 'react';
import useSWR from 'swr';
import { getSecretKey } from '../config';
import { Message, createUserMessage, hasCompletedToolCalls } from '../types/message';
import { getSessionHistory } from '../api';

let messageIdCounter = 0;

function generateMessageId(): string {
  return `msg-${Date.now()}-${++messageIdCounter}`;
}

// Use the TextDecoder implementation from the global scope
const TextDecoder = globalThis.TextDecoder;
type JsonValue = string | number | boolean | null | JsonValue[] | { [key: string]: JsonValue };

export interface SessionMetadata {
  workingDir: string;
  description: string;
  scheduleId: string | null;
  messageCount: number;
  totalTokens: number | null;
  inputTokens: number | null;
  outputTokens: number | null;
  accumulatedTotalTokens: number | null;
  accumulatedInputTokens: number | null;
  accumulatedOutputTokens: number | null;
}
export interface NotificationEvent {
  type: 'Notification';
  request_id: string;
  message: {
    method: string;
    params: {
      [key: string]: JsonValue;
    };
  };
}

// Event types for the SSE stream
type MessageEvent =
  | { type: 'Message'; message: Message }
  | { type: 'Error'; error: string }
  | { type: 'Finish'; reason: string }
  | { type: 'ModelChange'; model: string; mode: string }
  | NotificationEvent;
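
// Example of the wire format this hook parses: each SSE event is a 'data: '
// line terminated by a blank line (the payloads below are illustrative):
//
//   data: {"type":"Message","message":{"role":"assistant","content":[...]}}
//
//   data: {"type":"Finish","reason":"stop"}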
export interface UseMessageStreamOptions {
  /**
   * The API endpoint that accepts a `{ messages: Message[] }` object and returns
   * a stream of messages. Defaults to `/api/chat/reply`.
   */
  api?: string;
  /**
   * A unique identifier for the chat. If not provided, a random one will be
   * generated. When provided, hooks with the same `id` will share state
   * across components.
   */
  id?: string;
  /**
   * Initial messages of the chat. Useful for loading an existing chat history.
   */
  initialMessages?: Message[];
  /**
   * Initial input of the chat.
   */
  initialInput?: string;
  /**
   * Callback function to be called when a tool call is received.
   * You can optionally return a result for the tool call.
   */
  _onToolCall?: (toolCall: Record<string, unknown>) => void | Promise<unknown> | unknown;
  /**
   * Callback function to be called when the API response is received.
   */
  onResponse?: (response: Response) => void | Promise<void>;
  /**
   * Callback function to be called when the assistant message has finished streaming.
   */
  onFinish?: (message: Message, reason: string) => void;
  /**
   * Callback function to be called when an error is encountered.
   */
  onError?: (error: Error) => void;
  /**
   * HTTP headers to be sent with the API request.
   */
  headers?: Record<string, string> | HeadersInit;
  /**
   * Extra body object to be sent with the API request.
   */
  body?: object;
  /**
   * Maximum number of sequential LLM calls (steps), e.g. when you use tool calls.
   * Default is 1.
   */
  maxSteps?: number;
}
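
// Note: with maxSteps > 1 the hook auto-chains follow-up requests once all tool
// calls in the last assistant message have results (see sendRequest below);
// e.g. (illustrative) useMessageStream({ maxSteps: 3 }) permits up to three
// consecutive assistant steps before control returns to the caller.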
export interface UseMessageStreamHelpers {
  /** Current messages in the chat */
  messages: Message[];
  /** The error object of the API request */
  error: undefined | Error;
  /**
   * Append a user message to the chat list. This triggers the API call to fetch
   * the assistant's response.
   */
  append: (message: Message | string) => Promise<void>;
  /**
   * Reload the last AI chat response for the given chat history.
   */
  reload: () => Promise<void>;
  /**
   * Abort the current request immediately.
   */
  stop: () => void;
  /**
   * Update the `messages` state locally.
   */
  setMessages: (messages: Message[] | ((messages: Message[]) => Message[])) => void;
  /** The current value of the input */
  input: string;
  /** setState-powered method to update the input value */
  setInput: React.Dispatch<React.SetStateAction<string>>;
  /** An input/textarea-ready onChange handler to control the value of the input */
  handleInputChange: (
    e: React.ChangeEvent<HTMLInputElement> | React.ChangeEvent<HTMLTextAreaElement>
  ) => void;
  /** Form submission handler to automatically reset the input and append a user message */
  handleSubmit: (event?: { preventDefault?: () => void }) => void;
  /** Whether the API request is in progress */
  isLoading: boolean;
  /** Whether we're waiting for the first response from the LLM */
  isWaiting: boolean;
  /** Whether we're actively streaming response content */
  isStreaming: boolean;
  /** Add a tool result to a tool call */
  addToolResult: ({ toolCallId, result }: { toolCallId: string; result: unknown }) => void;
  /** Modify the request body (session id and/or working dir) mid-stream */
  updateMessageStreamBody?: (newBody: object) => void;
  /** Notifications received from the SSE stream */
  notifications: NotificationEvent[];
  /** Current model info from the backend */
  currentModelInfo: { model: string; mode: string } | null;
  /** Session metadata including token counts */
  sessionMetadata: SessionMetadata | null;
  /** Set or clear the error state */
  setError: (error: Error | undefined) => void;
}
/**
 * Hook for streaming messages directly from the server using the native Goose message format.
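 *
 * @example
 * // Minimal programmatic usage (the session id value is illustrative):
 * const { messages, append, stop, isStreaming } = useMessageStream({
 *   body: { session_id: 'demo-session' },
 *   onFinish: (_message, reason) => console.log('finished:', reason),
 * });
 * await append('Hello!');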
 */
export function useMessageStream({
  api = '/api/chat/reply',
  id,
  initialMessages = [],
  initialInput = '',
  onResponse,
  onFinish,
  onError,
  headers,
  body,
  maxSteps = 1,
}: UseMessageStreamOptions = {}): UseMessageStreamHelpers {
  // Generate a unique id for the chat if not provided
  const hookId = useId();
  const idKey = id ?? hookId;
  const chatKey = typeof api === 'string' ? [api, idKey] : idKey;

  // Store the chat state in SWR, using the chatKey to share state across
  // hook instances with the same id
  const { data: messages, mutate } = useSWR<Message[]>([chatKey, 'messages'], null, {
    fallbackData: initialMessages,
  });

  const [notifications, setNotifications] = useState<NotificationEvent[]>([]);
  const [currentModelInfo, setCurrentModelInfo] = useState<{ model: string; mode: string } | null>(
    null
  );
  const [sessionMetadata, setSessionMetadata] = useState<SessionMetadata | null>(null);

  // Expose a way to update the request body, e.g. to swap in a new session id
  // when a context-length-exceeded (CLE) event occurs
  const updateMessageStreamBody = useCallback((newBody: object) => {
    extraMetadataRef.current.body = {
      ...extraMetadataRef.current.body,
      ...newBody,
    };
  }, []);
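  // Usage sketch (illustrative): after the backend reports a new session,
  // point subsequent requests at it:
  //   updateMessageStreamBody({ session_id: newSessionId });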

  // Keep the latest messages in a ref
  const messagesRef = useRef<Message[]>(messages || []);
  useEffect(() => {
    messagesRef.current = messages || [];
  }, [messages]);

  // We store loading state in another hook to sync loading states across hook invocations
  const { data: isLoading = false, mutate: mutateLoading } = useSWR<boolean>(
    [chatKey, 'loading'],
    null
  );

  // Track waiting vs streaming states
  const { data: isWaiting = false, mutate: mutateWaiting } = useSWR<boolean>(
    [chatKey, 'waiting'],
    null
  );
  const { data: isStreaming = false, mutate: mutateStreaming } = useSWR<boolean>(
    [chatKey, 'streaming'],
    null
  );
  const { data: error = undefined, mutate: setError } = useSWR<undefined | Error>(
    [chatKey, 'error'],
    null
  );

  // Abort controller to cancel the current API call
  const abortControllerRef = useRef<AbortController | null>(null);

  // Extra metadata for requests
  const extraMetadataRef = useRef({
    headers,
    body,
  });
  useEffect(() => {
    extraMetadataRef.current = {
      headers,
      body,
    };
  }, [headers, body]);

  // TODO: not this?
  const [, forceUpdate] = useReducer((x) => x + 1, 0);
  // Process the SSE stream from the server
  const processMessageStream = useCallback(
    async (response: Response, currentMessages: Message[]) => {
      if (!response.body) {
        throw new Error('Response body is empty');
      }

      const reader = response.body.getReader();
      const decoder = new TextDecoder();
      let buffer = '';

      try {
        let running = true;
        while (running) {
          const { done, value } = await reader.read();
          if (done) {
            running = false;
            break;
          }

          // Decode the chunk and add it to our buffer
          buffer += decoder.decode(value, { stream: true });

          // Process complete SSE events
          const events = buffer.split('\n\n');
          buffer = events.pop() || ''; // Keep the last incomplete event in the buffer

          for (const event of events) {
            if (event.startsWith('data: ')) {
              try {
                const data = event.slice(6); // Remove the 'data: ' prefix
                const parsedEvent = JSON.parse(data) as MessageEvent;
                switch (parsedEvent.type) {
                  case 'Message': {
                    // Transition from waiting to streaming on the first message
                    mutateWaiting(false);
                    mutateStreaming(true);

                    // Create a new message object with the properties preserved or defaulted
                    const newMessage = {
                      ...parsedEvent.message,
                      // Ensure the message has an ID - if not provided, generate one
                      id: parsedEvent.message.id || generateMessageId(),
                      // Only set to true if it's undefined (preserve false values)
                      display:
                        parsedEvent.message.display === undefined
                          ? true
                          : parsedEvent.message.display,
                      sendToLLM:
                        parsedEvent.message.sendToLLM === undefined
                          ? true
                          : parsedEvent.message.sendToLLM,
                    };

                    // Update messages with the new message
                    if (
                      newMessage.id &&
                      currentMessages.length > 0 &&
                      currentMessages[currentMessages.length - 1].id === newMessage.id
                    ) {
                      // If the last message has the same ID, update it instead of adding a new one
                      const lastMessage = currentMessages[currentMessages.length - 1];
                      lastMessage.content = [...lastMessage.content, ...newMessage.content];
                      forceUpdate();
                    } else {
                      currentMessages = [...currentMessages, newMessage];
                    }
                    mutate(currentMessages, false);
                    break;
                  }
                  case 'Notification': {
                    const newNotification = {
                      ...parsedEvent,
                    };
                    setNotifications((prev) => [...prev, newNotification]);
                    break;
                  }
                  case 'ModelChange': {
                    // Update the current model in the frontend
                    const modelInfo = {
                      model: parsedEvent.model,
                      mode: parsedEvent.mode,
                    };
                    setCurrentModelInfo(modelInfo);
                    break;
                  }
                  case 'Error': {
                    // Check if this is a token limit error (more specific detection)
                    const errorMessage = parsedEvent.error;
                    const isTokenLimitError =
                      errorMessage &&
                      ((errorMessage.toLowerCase().includes('token') &&
                        errorMessage.toLowerCase().includes('limit')) ||
                        (errorMessage.toLowerCase().includes('context') &&
                          errorMessage.toLowerCase().includes('length') &&
                          errorMessage.toLowerCase().includes('exceeded')));
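                    // Matches strings such as "Token limit exceeded" or
                    // "context length exceeded" (illustrative samples; the checks
                    // lowercase the message first, so casing does not matter).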
                    // If this is a token limit error, create a contextLengthExceeded message instead of throwing
                    if (isTokenLimitError) {
                      const contextMessage: Message = {
                        id: generateMessageId(),
                        role: 'assistant',
                        created: Math.floor(Date.now() / 1000),
                        content: [
                          {
                            type: 'contextLengthExceeded',
                            msg: errorMessage,
                          },
                        ],
                        display: true,
                        sendToLLM: false,
                      };
                      currentMessages = [...currentMessages, contextMessage];
                      mutate(currentMessages, false);
                      // Clear any existing error state since we handled this as a context message
                      setError(undefined);
                      break; // Don't throw an error, just add the message
                    }

                    // For non-token-limit errors, still throw the error
                    throw new Error(parsedEvent.error);
                  }
                  case 'Finish': {
                    // Call onFinish with the last message if available
                    if (onFinish && currentMessages.length > 0) {
                      const lastMessage = currentMessages[currentMessages.length - 1];
                      onFinish(lastMessage, parsedEvent.reason);
                    }

                    // Fetch updated session metadata with token counts
                    const sessionId = (extraMetadataRef.current.body as Record<string, unknown>)
                      ?.session_id as string;
                    if (sessionId) {
                      try {
                        const sessionResponse = await getSessionHistory({
                          path: { session_id: sessionId },
                        });
                        if (sessionResponse.data?.metadata) {
                          setSessionMetadata({
                            workingDir: sessionResponse.data.metadata.working_dir,
                            description: sessionResponse.data.metadata.description,
                            scheduleId: sessionResponse.data.metadata.schedule_id || null,
                            messageCount: sessionResponse.data.metadata.message_count,
                            totalTokens: sessionResponse.data.metadata.total_tokens || null,
                            inputTokens: sessionResponse.data.metadata.input_tokens || null,
                            outputTokens: sessionResponse.data.metadata.output_tokens || null,
                            accumulatedTotalTokens:
                              sessionResponse.data.metadata.accumulated_total_tokens || null,
                            accumulatedInputTokens:
                              sessionResponse.data.metadata.accumulated_input_tokens || null,
                            accumulatedOutputTokens:
                              sessionResponse.data.metadata.accumulated_output_tokens || null,
                          });
                        }
                      } catch (metadataError) {
                        console.error('Failed to fetch session metadata:', metadataError);
                      }
                    }
                    break;
                  }
                }
              } catch (e) {
                console.error('Error parsing SSE event:', e);
                if (onError && e instanceof Error) {
                  onError(e);
                }
                // Don't re-throw here; let the error be handled by the outer catch.
                // Instead, set the error state directly.
                if (e instanceof Error) {
                  setError(e);
                }
              }
            }
          }
        }
      } catch (e) {
        if (e instanceof Error && e.name !== 'AbortError') {
          console.error('Error reading SSE stream:', e);
          if (onError) {
            onError(e);
          }
          // Re-throw the error so it gets caught by sendRequest and sets the error state
          throw e;
        }
      } finally {
        reader.releaseLock();
      }

      return currentMessages;
    },
    [mutate, mutateWaiting, mutateStreaming, onFinish, onError, forceUpdate, setError]
  );
  // Send a request to the server
  const sendRequest = useCallback(
    async (requestMessages: Message[]) => {
      try {
        mutateLoading(true);
        mutateWaiting(true); // Start in the waiting state
        mutateStreaming(false);
        setError(undefined);

        // Create an abort controller
        const abortController = new AbortController();
        abortControllerRef.current = abortController;

        // Filter out messages where sendToLLM is explicitly false
        const filteredMessages = requestMessages.filter((message) => message.sendToLLM !== false);

        // Send the request to the server
        const response = await fetch(api, {
          method: 'POST',
          headers: {
            'Content-Type': 'application/json',
            'X-Secret-Key': getSecretKey(),
            ...extraMetadataRef.current.headers,
          },
          body: JSON.stringify({
            messages: filteredMessages,
            ...extraMetadataRef.current.body,
          }),
          signal: abortController.signal,
        });

        if (onResponse) {
          await onResponse(response);
        }
        if (!response.ok) {
          const text = await response.text();
          throw new Error(text || `Error ${response.status}: ${response.statusText}`);
        }

        // Process the SSE stream
        const updatedMessages = await processMessageStream(response, requestMessages);

        // Auto-submit when all tool calls in the last assistant message have results
        if (maxSteps > 1 && updatedMessages.length > requestMessages.length) {
          const lastMessage = updatedMessages[updatedMessages.length - 1];
          if (lastMessage.role === 'assistant' && hasCompletedToolCalls(lastMessage)) {
            // Count trailing assistant messages to prevent infinite loops
            let assistantCount = 0;
            for (let i = updatedMessages.length - 1; i >= 0; i--) {
              if (updatedMessages[i].role === 'assistant') {
                assistantCount++;
              } else {
                break;
              }
            }
            if (assistantCount < maxSteps) {
              await sendRequest(updatedMessages);
            }
          }
        }

        abortControllerRef.current = null;
      } catch (err) {
        // Ignore abort errors, as they are expected
        if (err instanceof Error && err.name === 'AbortError') {
          abortControllerRef.current = null;
          return;
        }
        if (onError && err instanceof Error) {
          onError(err);
        }
        setError(err as Error);
      } finally {
        mutateLoading(false);
        mutateWaiting(false);
        mutateStreaming(false);
      }
    },
    // eslint-disable-next-line react-hooks/exhaustive-deps
    [
      api,
      processMessageStream,
      mutateLoading,
      mutateWaiting,
      mutateStreaming,
      setError,
      onResponse,
      onError,
      maxSteps,
    ]
  );
  // Append a new message and send the request
  const append = useCallback(
    async (message: Message | string) => {
      // If a string is passed, convert it to a Message object
      const messageToAppend = typeof message === 'string' ? createUserMessage(message) : message;
      const currentMessages = [...messagesRef.current, messageToAppend];
      mutate(currentMessages, false);
      await sendRequest(currentMessages);
    },
    [mutate, sendRequest]
  );

  // Reload the last message
  const reload = useCallback(async () => {
    const currentMessages = messagesRef.current;
    if (currentMessages.length === 0) {
      return;
    }
    // Remove the last assistant message, if present
    const lastMessage = currentMessages[currentMessages.length - 1];
    const messagesToSend =
      lastMessage.role === 'assistant' ? currentMessages.slice(0, -1) : currentMessages;
    await sendRequest(messagesToSend);
  }, [sendRequest]);

  // Stop the current request
  const stop = useCallback(() => {
    if (abortControllerRef.current) {
      abortControllerRef.current.abort();
      abortControllerRef.current = null;
    }
  }, []);

  // Set messages directly
  const setMessages = useCallback(
    (messagesOrFn: Message[] | ((messages: Message[]) => Message[])) => {
      if (typeof messagesOrFn === 'function') {
        const newMessages = messagesOrFn(messagesRef.current);
        mutate(newMessages, false);
        messagesRef.current = newMessages;
      } else {
        mutate(messagesOrFn, false);
        messagesRef.current = messagesOrFn;
      }
    },
    [mutate]
  );
  // Input state and handlers
  const [input, setInput] = useState(initialInput);

  const handleInputChange = useCallback(
    (e: React.ChangeEvent<HTMLInputElement> | React.ChangeEvent<HTMLTextAreaElement>) => {
      setInput(e.target.value);
    },
    []
  );

  const handleSubmit = useCallback(
    async (event?: { preventDefault?: () => void }) => {
      event?.preventDefault?.();
      if (!input.trim()) return;
      await append(input);
      setInput('');
    },
    [input, append]
  );
  // Add a tool result to a message
  const addToolResult = useCallback(
    ({ toolCallId, result }: { toolCallId: string; result: unknown }) => {
      const currentMessages = messagesRef.current;

      // Find the last assistant message with the tool call
      let lastAssistantIndex = -1;
      for (let i = currentMessages.length - 1; i >= 0; i--) {
        if (currentMessages[i].role === 'assistant') {
          const toolRequests = currentMessages[i].content.filter(
            (content) => content.type === 'toolRequest' && content.id === toolCallId
          );
          if (toolRequests.length > 0) {
            lastAssistantIndex = i;
            break;
          }
        }
      }
      if (lastAssistantIndex === -1) return;

      // Create a tool response message
      const toolResponseMessage: Message = {
        id: generateMessageId(),
        role: 'user' as const,
        created: Math.floor(Date.now() / 1000),
        content: [
          {
            type: 'toolResponse' as const,
            id: toolCallId,
            toolResult: {
              status: 'success' as const,
              value: Array.isArray(result)
                ? result
                : [{ type: 'text' as const, text: String(result), priority: 0 }],
            },
          },
        ],
      };

      // Insert the tool response after the assistant message
      const updatedMessages = [
        ...currentMessages.slice(0, lastAssistantIndex + 1),
        toolResponseMessage,
        ...currentMessages.slice(lastAssistantIndex + 1),
      ];
      mutate(updatedMessages, false);
      messagesRef.current = updatedMessages;

      // Auto-submit if we have tool results
      if (maxSteps > 1) {
        sendRequest(updatedMessages);
      }
    },
    [mutate, maxSteps, sendRequest]
  );
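  // Usage sketch (values illustrative): attach a result to a pending tool call.
  // A non-array result is wrapped as a single text content item:
  //   addToolResult({ toolCallId: 'call_1', result: 'done' });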

  return {
    messages: messages || [],
    error,
    append,
    reload,
    stop,
    setMessages,
    input,
    setInput,
    handleInputChange,
    handleSubmit,
    isLoading: isLoading || false,
    isWaiting: isWaiting || false,
    isStreaming: isStreaming || false,
    addToolResult,
    updateMessageStreamBody,
    notifications,
    currentModelInfo,
    sessionMetadata,
    setError,
  };
}
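
// Example wiring in a component (a sketch; the component, session id, and JSX
// live outside this module and are illustrative only):
//
//   function ChatPane() {
//     const { messages, input, handleInputChange, handleSubmit, isLoading } =
//       useMessageStream({ body: { session_id: 'demo-session' } });
//     return (
//       <form onSubmit={handleSubmit}>
//         <div>{messages.length} messages</div>
//         <textarea value={input} onChange={handleInputChange} />
//         <button type="submit" disabled={isLoading}>Send</button>
//       </form>
//     );
//   }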