From a50cadc67e4e887dba075cacfeb65d2fc1bcb38f Mon Sep 17 00:00:00 2001
From: Ancss <61501274+Ancss@users.noreply.github.com>
Date: Fri, 9 Aug 2024 15:19:31 +0800
Subject: [PATCH] Call the Claude API and execute the returned code

---
 src-tauri/src/ai/claude.rs                |  12 +-
 src-tauri/src/commands/execute_code.rs    |  28 ++
 src-tauri/src/commands/mod.rs             |   5 +-
 src-tauri/src/main.rs                     |   4 +-
 src-tauri/src/prompts.rs                  |  72 ++--
 src/components/BottomInputContainer.tsx   | 114 ++++++
 src/components/ExecutionStepComponent.tsx |  38 ++
 src/components/OsaiApp.tsx                | 448 ++++++++++------------
 src/components/SettingsModal.tsx          |   2 +-
 src/components/SideDrawer .tsx            |   2 +-
 src/config/aiProviders.ts                 |  63 ++-
 src/hooks/useAI.ts                        |  38 +-
 src/type.ts                               |  31 ++
 13 files changed, 525 insertions(+), 332 deletions(-)
 create mode 100644 src-tauri/src/commands/execute_code.rs
 create mode 100644 src/components/BottomInputContainer.tsx
 create mode 100644 src/components/ExecutionStepComponent.tsx
 create mode 100644 src/type.ts
diff --git a/src-tauri/src/ai/claude.rs b/src-tauri/src/ai/claude.rs
index 989b5d5..c564c85 100644
--- a/src-tauri/src/ai/claude.rs
+++ b/src-tauri/src/ai/claude.rs
@@ -9,10 +9,16 @@ use tauri::command;
 use tokio::sync::Mutex;
 use uuid::Uuid;
 
+#[derive(Debug, Serialize, Deserialize, Clone)]
+pub struct MessageContent { // One typed content block inside a `Message`.
+    #[serde(rename = "type")] // `type` is a Rust keyword, so the JSON key is mapped here.
+    pub content_type: String, // Block kind; the frontend in this patch sends "text".
+    pub text: String, // Text payload of the block.
+}
 #[derive(Debug, Serialize, Deserialize, Clone)]
 pub struct Message {
     pub role: String,
-    pub content: String,
+    pub content: Vec<MessageContent>,
 }
 
 #[derive(Debug, Serialize, Deserialize, Clone)]
@@ -82,9 +88,10 @@ pub async fn send_message_to_anthropic(
         "model": model,
         "system": system_prompt,
         "tools": tools,
-        "tool_choice": { "type": "tool", "name": "format_response" },
+        "tool_choice": { "type": "auto" },
         "max_tokens": max_tokens.unwrap_or(8192),
         "messages": messages,
+        "temperature":0,
         "stream": false
     });
     println!("Request body: {}", body.to_string());
@@ -99,6 +106,7 @@ pub async fn send_message_to_anthropic(
         .header("Content-Type", "application/json")
         .header("x-api-key", api_key)
         .header("anthropic-version", "2023-06-01")
+        .header("anthropic-beta", "max-tokens-3-5-sonnet-2024-07-15")
         .json(&body)
         .send();
 
diff --git a/src-tauri/src/commands/execute_code.rs b/src-tauri/src/commands/execute_code.rs
new file mode 100644
index 0000000..527ce87
--- /dev/null
+++ b/src-tauri/src/commands/execute_code.rs
@@ -0,0 +1,28 @@
+use std::process::Command;
+use tauri::command;
+
+/// Runs `code` in the platform shell: stdout on success, stderr (or exit status) on failure.
+/// NOTE(review): `code` is handed to the shell unsanitized; callers must gate what reaches here.
+#[command]
+pub fn execute_code(code: String) -> Result<String, String> {
+    let (shell, flag) = if cfg!(target_os = "windows") {
+        ("powershell", "-Command")
+    } else if cfg!(target_os = "macos") {
+        ("sh", "-c")
+    } else {
+        ("bash", "-c") // Assuming Linux or other Unix-like systems
+    };
+    let output = Command::new(shell)
+        .args([flag, code.as_str()])
+        .output()
+        .map_err(|e| format!("Failed to execute command: {}", e))?;
+    if output.status.success() {
+        return Ok(String::from_utf8_lossy(&output.stdout).into_owned());
+    }
+    let stderr = String::from_utf8_lossy(&output.stderr);
+    if stderr.trim().is_empty() {
+        // Some commands fail silently; report the exit status instead of an empty error.
+        return Err(format!("Command failed with {}", output.status));
+    }
+    Err(stderr.into_owned())
+}
diff --git a/src-tauri/src/commands/mod.rs b/src-tauri/src/commands/mod.rs
index bcae2af..d27f398 100644
--- a/src-tauri/src/commands/mod.rs
+++ b/src-tauri/src/commands/mod.rs
@@ -1,2 +1,3 @@
-pub mod file_operations;
-pub mod ai_operations;
\ No newline at end of file
+// pub mod file_operations;
+// pub mod ai_operations;
+pub mod execute_code;
diff --git a/src-tauri/src/main.rs b/src-tauri/src/main.rs
index 18eb3a0..5d07a79 100644
--- a/src-tauri/src/main.rs
+++ b/src-tauri/src/main.rs
@@ -1,4 +1,5 @@
 mod ai;
+mod commands;
 mod prompts;
 use tauri::Manager;
 
@@ -15,7 +16,8 @@ fn main() {
         .invoke_handler(tauri::generate_handler![
             ai::claude::send_message_to_anthropic,
             ai::claude::cancel_request,
-            ai::claude::create_cancel_flag
+            ai::claude::create_cancel_flag,
+            commands::execute_code::execute_code,
         ])
         .run(tauri::generate_context!())
         .expect("error while running tauri application");
diff --git a/src-tauri/src/prompts.rs b/src-tauri/src/prompts.rs
index e8d4bcc..058f272 100644
--- a/src-tauri/src/prompts.rs
+++ b/src-tauri/src/prompts.rs
@@ -1,61 +1,37 @@
 use sysinfo::{System, SystemExt};
 
 pub const SYSTEM_PROMPT_TEMPLATE: &str = r#"
- You are OsaiAI, the central AI assistant integrated into the Osai desktop application. As the sole intermediary between the user and their operating system, you have the capability to perform any operation on the OS that the user requests, subject to user confirmation for sensitive actions.
+You are an intelligent operating system assistant (OS AI) capable of performing tasks on the user's behalf. Your primary function is to understand user requests and execute them using available system resources.
+
+Guidelines:
+1. Provide concise and accurate responses for general queries.
+2. For actionable requests, take initiative to perform tasks without asking for permission, unless it involves system changes or sensitive operations.
+3. Utilize system resources efficiently to fulfill user requests.
+4. Break down tasks into the simplest, most atomic steps possible.
+5. Generate actual, executable system commands for each step.
+6. Only set user_confirmation_required to true for operations that modify system settings or access sensitive data.
+7. If a task cannot be completed, explain why and suggest alternatives.
+8. Do not invent or assume any information not explicitly provided or directly obtainable through the executed commands.
+9. For web searches, use general search engines like Google or Bing unless a specific, verified website is needed.
+10. When dealing with applications:
+    a. Do not assume default installation paths.
+    b. Use system commands to search for the application in multiple potential locations.
+    c. Verify the existence of the application before attempting to launch it.
+    d. Provide clear feedback on whether the application was found and launched successfully.
+11. Combine interdependent steps into a single executable step when necessary.
+12. The 'code' field in the execution array must contain only executable commands. Do not include comments or pseudocode.
+13. Be aware of and utilize appropriate system commands for different operating systems (Windows, macOS, Linux).
+14. Always provide a clear and informative response to the user about the actions taken and their results.
+
+Always structure your response using the specified AIResponse format.
 
-Key Capabilities:
-1. Universal Language Processing: Understand and respond in the language of the user's input.
-2. Comprehensive OS Control: Execute any operation on the user's operating system through appropriate commands and APIs.
-3. Task Decomposition and Execution: Break down complex requests into actionable steps and execute them sequentially.
-4. Dynamic Code Generation: Create and execute OS-specific code (PowerShell, Bash, AppleScript, etc.) as needed.
-5. Intelligent Application and File Management: Handle application launching, file operations, and system settings adjustments.
-6. Web Integration: Perform web searches and interact with online services when necessary.
-7. Adaptive Conversation: Engage in both task-oriented and casual conversations, answering questions and providing information.
-
-Operational Guidelines:
-1. User Confirmation:
-   - Always ask for explicit user confirmation before executing any system operation, except for opening applications or web browsers.
-   - Clearly explain the potential impact of sensitive operations.
-
-2. Task Execution:
-   - Generate a detailed, step-by-step plan for complex tasks before execution.
-   - Use the appropriate system commands based on the user's OS (Windows, macOS, or Linux).
-   - Provide real-time feedback on task progress and results.
-
-3. Application and File Handling:
-   - Verify the existence of applications and files before attempting operations.
-   - For partial or ambiguous names, suggest the most likely matches and confirm with the user.
-
-4. Web Integration:
-   - Seamlessly integrate web searches and online services when local resources are insufficient.
-
-5. Safety and Privacy:
-   - Prioritize system security and user privacy in all operations.
-   - Warn users about potential risks associated with their requests.
-
-6. Language Adaptation:
-   - Detect the language of the user's input and respond in the same language.
-   - Maintain consistency in language use throughout the conversation.
-
-Response Structure:
-Always structure your responses in the following JSON format:
-
-When responding to a user request:
-1. Analyze the input to determine the nature of the request (task, question, or conversation).
-2. For tasks, create a detailed plan and populate the JSON structure accordingly.
-3. For questions or conversation, focus on the 'thought_process' and 'response' fields.
-4. Always use the language of the user's input in the 'response' field.
-5. Ensure all sensitive operations are flagged for user confirmation.
-
-====
-    
 Operating System Information
 - Type: {OS_TYPE}
 - Version: {OS_VERSION}
 - Architecture: {ARCH}
 
 Remember, as OsaiAI, you are the user's primary interface with their operating system. Strive to be helpful, efficient, and security-conscious in all interactions.`;
-
+
 "#;
 
 pub fn format_system_prompt() -> String {
diff --git a/src/components/BottomInputContainer.tsx b/src/components/BottomInputContainer.tsx
new file mode 100644
index 0000000..4709561
--- /dev/null
+++ b/src/components/BottomInputContainer.tsx
@@ -0,0 +1,114 @@
+import React, { useState, useEffect, useRef } from "react";
+import { useTranslation } from "react-i18next";
+import { Button } from "@/components/ui/button";
+import { useSpeechRecognition } from "@/hooks/useSpeechRecognition";
+import {
+  MAX_CHARS,
+  MIN_TEXTAREA_HEIGHT,
+  MAX_TEXTAREA_HEIGHT,
+} from "@/utils/constants";
+import { Textarea } from "@chakra-ui/react";
+import { cn } from "@/lib/utils";
+import { Send, StopCircle } from "lucide-react";
+
+// Message composer: an auto-growing textarea plus a single button that
+// sends the draft or, while `isLoading` is true, aborts the in-flight
+// request instead. The draft text itself is owned by the parent and flows
+// through `input` / `setInput`; this component only validates its length
+// and sizes the textarea to fit it.
+const BottomInputContainer = ({
+  isLoading,
+  input,
+  handleSend,
+  setInput,
+  abortRequest,
+}: {
+  input: string;
+  isLoading: boolean;
+  handleSend: () => void;
+  setInput: (s: string) => void;
+  abortRequest: () => void;
+}) => {
+  const { t } = useTranslation();
+  // NOTE(review): the voice-input toggle is not wired up in this component,
+  // so `transcript` is read from the hook but never used below.
+  const { transcript } = useSpeechRecognition();
+  const textareaRef = useRef<HTMLTextAreaElement>(null);
+
+  // Accept an edit only while the draft stays within MAX_CHARS; a longer
+  // value is ignored, so the controlled textarea keeps its previous text.
+  const handleInputChange = (e: React.ChangeEvent<HTMLTextAreaElement>) => {
+    const value = e.target.value;
+    if (value.length <= MAX_CHARS) {
+      setInput(value);
+    }
+  };
+
+  // Resize the textarea to a whole number of 45px rows (1 to 10). Height is
+  // reset to "auto" before scrollHeight is read, presumably so the box can
+  // shrink again; an empty draft is treated as exactly one row.
+  const adjustHeight = () => {
+    const textarea = textareaRef.current;
+    if (!textarea) return;
+
+    textarea.style.height = "auto";
+    const scrollHeight = input === "" ? 45 : textarea.scrollHeight;
+    const lines = scrollHeight / 45;
+    const newRows = Math.max(1, Math.min(10, Math.floor(lines)));
+
+    textarea.style.height = `${newRows * 45}px`;
+  };
+
+  // Re-measure whenever the draft text changes.
+  useEffect(adjustHeight, [input]);
+
+  return (
+    <div className="bg-gray-50 dark:bg-gray-800">
+      <div className="flex p-2 items-end space-x-2 bg-white dark:bg-gray-700 rounded-2 overflow-hidden shadow-inner">
+        {/* The microphone (voice input) button that used to sit before the
+            textarea is not rendered in this version. */}
+        <Textarea
+          ref={textareaRef}
+          value={input}
+          onChange={handleInputChange}
+          placeholder={t("typeMessage")!}
+          className={cn(
+            "flex-grow border-none bg-transparent focus:ring-0 focus:outline-none resize-none",
+            "min-h-[2.5rem] py-2 px-3 text-base leading-relaxed",
+            "scrollbar scrollbar-thumb-gray-300 dark:scrollbar-thumb-gray-600",
+            "scrollbar-track-transparent scrollbar-thin hover:scrollbar-thumb-gray-400 dark:hover:scrollbar-thumb-gray-500",
+            "!border-none focus-visible:ring-0 focus-visible:outline-none"
+          )}
+          style={{
+            minHeight: `${MIN_TEXTAREA_HEIGHT}px`,
+            maxHeight: `${MAX_TEXTAREA_HEIGHT}px`,
+            overflowY: "auto",
+            boxSizing: "border-box",
+          }}
+          onKeyPress={(e) => {
+            // Enter sends; Shift+Enter falls through and inserts a newline.
+            // Nothing is sent while a request is still loading.
+            if (e.key === "Enter" && !e.shiftKey && !isLoading) {
+              e.preventDefault();
+              handleSend();
+            }
+          }}
+        />
+        {/* One button, two roles: stop the running request while loading,
+            otherwise send the current draft. */}
+        <Button
+          className="rounded-full min-w-10 p-2"
+          onClick={isLoading ? abortRequest : handleSend}
+        >
+          {isLoading ? (
+            <StopCircle size={16} className="text-red-500" />
+          ) : (
+            <Send size={16} />
+          )}
+        </Button>
+      </div>
+    </div>
+  );
+};
+
+export default BottomInputContainer;
diff --git a/src/components/ExecutionStepComponent.tsx b/src/components/ExecutionStepComponent.tsx
new file mode 100644
index 0000000..58a15bd
--- /dev/null
+++ b/src/components/ExecutionStepComponent.tsx
@@ -0,0 +1,38 @@
+import React from "react";
+import { CheckCircle, XCircle, Clock } from "lucide-react";
+import { ExecutionStep } from "@/type";
+
+// Renders one execution step as a bordered card: a status icon next to
+// the step title, the step's code in a scrollable <pre>, and the result
+// text when the step has one.
+const ExecutionStepComponent: React.FC<{ step: ExecutionStep }> = ({
+  step: { status, step: title, code, result },
+}) => {
+  // Any status other than "success" or "failure" shows the clock icon.
+  let statusIcon = <Clock className="text-gray-500" />;
+  if (status === "success") {
+    statusIcon = <CheckCircle className="text-green-500" />;
+  } else if (status === "failure") {
+    statusIcon = <XCircle className="text-red-500" />;
+  }
+
+  return (
+    <div className="border rounded p-2 mb-2">
+      <div className="flex items-center">
+        {statusIcon}
+        <span className="ml-2 font-bold">{title}</span>
+      </div>
+      <pre className="bg-gray-100 p-2 mt-2 rounded text-sm overflow-x-auto">
+        <code>{code}</code>
+      </pre>
+      {result && (
+        <div className="mt-2">
+          <strong>Result:</strong>
+          <p>{result}</p>
+        </div>
+      )}
+    </div>
+  );
+};
+
+export default ExecutionStepComponent;
diff --git a/src/components/OsaiApp.tsx b/src/components/OsaiApp.tsx
index 81dba54..74a05b8 100644
--- a/src/components/OsaiApp.tsx
+++ b/src/components/OsaiApp.tsx
@@ -1,113 +1,154 @@
 import React, { useState, useEffect, useRef } from "react";
+import { useAI } from "../hooks/useAI";
+import { useTranslation } from "react-i18next";
+import { Button } from "@/components/ui/button";
+import { Card, CardContent } from "@/components/ui/card";
+import { Avatar, AvatarFallback } from "@/components/ui/avatar";
+import { Alert, AlertDescription } from "@/components/ui/alert";
 import {
-  MessageCircle,
-  Mic,
-  Send,
-  ChevronDown,
   Settings,
   AlertTriangle,
   ChevronRightIcon,
   StopCircle,
+  Send,
 } from "lucide-react";
-import { Button } from "@/components/ui/button";
-import { Card, CardContent } from "@/components/ui/card";
-import { Avatar, AvatarFallback, AvatarImage } from "@/components/ui/avatar";
-import { Alert, AlertDescription } from "@/components/ui/alert";
-import { useAI } from "../hooks/useAI";
-import { useSpeechRecognition } from "../hooks/useSpeechRecognition";
-import { useTranslation } from "react-i18next";
 import SettingsModal from "./SettingsModal";
-import i18n from "i18next";
-import { Textarea } from "./ui/textarea";
-import {
-  MAX_CHARS,
-  MAX_TEXTAREA_HEIGHT,
-  MIN_TEXTAREA_HEIGHT,
-} from "@/utils/constants";
-import { cn } from "@/lib/utils";
-
-interface AIResponse {
-  thought_process: string;
-  plan: string[];
-  user_confirmation_required: boolean;
-  // confirmation_message: string;
-  execution: Array<{
-    step: string;
-    code: string;
-    result: string;
-  }>;
-  response: string;
-}
+import BottomInputContainer from "./BottomInputContainer";
+import { AIResponse, ChatMessage, Message } from "@/type";
+import i18n from "@/utils/i18n";
 
 const OsaiApp = ({
   setIsExpanded,
 }: {
   setIsExpanded: (b: boolean) => void;
 }) => {
-  const [messages, setMessages] = useState<
-    { role: string; content: string; status?: string }[]
-  >([]);
+  const [messages, setMessages] = useState<ChatMessage[]>([]);
+  const latestMessagesRef = useRef<ChatMessage[]>([]);
   const [input, setInput] = useState("");
   const [isSettingsOpen, setIsSettingsOpen] = useState(false);
   const [error, setError] = useState<string | null>(null);
   const { t } = useTranslation();
-  const { sendMessage, isLoading, abortRequest } = useAI();
-  const { startListening, stopListening, transcript } = useSpeechRecognition();
+  const { sendMessage, isLoading, abortRequest, executeCode } = useAI();
   const messageEndRef = useRef<HTMLDivElement>(null);
-  const [pendingConfirmation, setPendingConfirmation] =
-    useState<AIResponse | null>(null);
 
   useEffect(() => {
     messageEndRef.current?.scrollIntoView({ behavior: "smooth" });
   }, [messages]);
-
+  useEffect(() => {
+    latestMessagesRef.current = messages;
+    messageEndRef.current?.scrollIntoView({ behavior: "smooth" });
+  }, [messages]);
   const toggleExpansion = () => setIsExpanded(false);
 
   const handleSend = async () => {
     if (input.trim()) {
-      const userMessage = { role: "user", content: input };
+      const newMessage: ChatMessage = {
+        role: "user",
+        content: [{ type: "text", text: input }],
+      };
       setMessages((prev) => [
         ...prev,
-        userMessage,
-        { role: "assistant", content: "...", status: "loading" },
+        newMessage,
+        {
+          role: "assistant",
+          content: [{ type: "text", text: "..." }],
+          status: "loading",
+        },
       ]);
       setInput("");
       setError("");
       try {
-        const aiResponse: AIResponse = await sendMessage(input);
-        setMessages((prev) => prev.slice(0, -1)); // Remove loading message
-        if (aiResponse.user_confirmation_required) {
-          setPendingConfirmation(aiResponse);
-        } else {
-          setMessages((prev) => [
-            ...prev,
-            { role: "assistant", content: aiResponse.response },
-          ]);
-        }
+        const aiResponse: AIResponse = await sendMessage([
+          ...messages,
+          newMessage,
+        ]);
+        const newAssistantMessage: ChatMessage = {
+          role: "assistant",
+          content: [{ type: "text", text: aiResponse.response }],
+          aiResponse,
+          status: "complete",
+          executionStatus: aiResponse.user_confirmation_required
+            ? "pending"
+            : "executing",
+        };
+        setMessages((prev) => {
+          const updatedMessages = [...prev.slice(0, -1), newAssistantMessage];
+          latestMessagesRef.current = updatedMessages;
+          if (!aiResponse.user_confirmation_required) {
+            executeAIResponse(updatedMessages.length - 1);
+          }
+          return updatedMessages;
+        });
       } catch (error: any) {
-        setMessages((prev) => prev.slice(0, -2)); // Remove both loading and user message
-        setInput(userMessage.content); // Restore input
-        if (error.message.includes("Open settings and set the API key")) {
-          setError(t("lackApiKey")!);
-        } else if (error.message === "requestAborted") {
-          setError(t("requestAborted")!);
-        } else {
-          setError(t("aiResponseError")!);
-        }
+        setMessages((prev) => prev.slice(0, -2));
+        setInput(newMessage.content[0].text);
+        setError(
+          error.message.includes("Open settings and set the API key")
+            ? t("lackApiKey")!
+            : t("aiResponseError")!
+        );
         console.error("Error getting AI response:", error);
       }
     }
   };
 
-  const handleConfirmation = (confirmed: boolean) => {
-    if (pendingConfirmation) {
-      if (confirmed) {
-        setMessages((prev) => [
-          ...prev,
-          { role: "assistant", content: pendingConfirmation.response },
-        ]);
+  // Runs each code step of the assistant message at `messageIndex`, recording
+  // per-step results and moving executionStatus from executing to complete.
+  const executeAIResponse = async (messageIndex: number) => {
+    // Read via the ref: the `messages` closure is stale when called from handleSend.
+    const message = latestMessagesRef.current[messageIndex];
+    if (message?.aiResponse && message.aiResponse.should_execute_code) {
+      setMessages((prev) => {
+        const newMessages = [...prev];
+        newMessages[messageIndex] = {
+          ...newMessages[messageIndex],
+          executionStatus: "executing",
+        };
+        return newMessages;
+      });
+
+      for (const step of message.aiResponse.execution) {
+        if (!step.code) continue;
+        const result = await executeCode(step.code);
+        setMessages((prev) => {
+          const newMessages = [...prev];
+          const steps = newMessages[messageIndex].aiResponse!.execution;
+          const at = steps.findIndex((s) => s.step === step.step);
+          steps[at] = {
+            ...step,
+            status: result.success ? "success" : "failure",
+            result: result.output,
+          };
+          return newMessages;
+        });
       }
-      setPendingConfirmation(null);
+
+      setMessages((prev) => {
+        const newMessages = [...prev];
+        newMessages[messageIndex] = {
+          ...newMessages[messageIndex],
+          executionStatus: "complete",
+        };
+        return newMessages;
+      });
+    }
+  };
+
+  const handleConfirmation = async (
+    messageIndex: number,
+    confirmed: boolean
+  ) => {
+    setMessages((prev) => {
+      const newMessages = [...prev];
+      newMessages[messageIndex] = {
+        ...newMessages[messageIndex],
+        executionStatus: confirmed ? "executing" : "rejected",
+      };
+      return newMessages;
+    });
+
+    if (confirmed) {
+      await executeAIResponse(messageIndex);
     }
   };
 
@@ -116,95 +157,102 @@ const OsaiApp = ({
       <div className="fixed bottom-4 right-4 transition-all duration-300 ease-in-out w-96 h-[32rem]">
         <Card className="w-full h-full overflow-hidden shadow-lg">
           <CardContent className="flex flex-col h-full p-0">
-            <>
-              <div className="flex justify-between items-center p-2 border-b bg-gray-50 dark:bg-gray-800">
-                <h2 className="text-lg font-bold">Osai</h2>
-                <div className="flex space-x-2">
-                  <Button
-                    variant="ghost"
-                    size="sm"
-                    onClick={() =>
-                      i18n.changeLanguage(i18n.language === "en" ? "zh" : "en")
-                    }
-                  >
-                    {i18n.language === "en" ? "EN" : "中文"}
-                  </Button>
-                  <Button
-                    variant="ghost"
-                    size="sm"
-                    onClick={() => setIsSettingsOpen(true)}
-                  >
-                    <Settings size={16} />
-                  </Button>
-                  <Button variant="ghost" size="sm" onClick={toggleExpansion}>
-                    <ChevronRightIcon size={16} />
-                  </Button>
-                </div>
+            <div className="flex justify-between items-center p-2 border-b bg-gray-50 dark:bg-gray-800">
+              <h2 className="text-lg font-bold">Osai</h2>
+              <div className="flex space-x-2">
+                <Button
+                  variant="ghost"
+                  size="sm"
+                  onClick={() =>
+                    i18n.changeLanguage(i18n.language === "en" ? "zh" : "en")
+                  }
+                >
+                  {i18n.language === "en" ? "EN" : "中文"}
+                </Button>
+                <Button
+                  variant="ghost"
+                  size="sm"
+                  onClick={() => setIsSettingsOpen(true)}
+                >
+                  <Settings size={16} />
+                </Button>
+                <Button variant="ghost" size="sm" onClick={toggleExpansion}>
+                  <ChevronRightIcon size={16} />
+                </Button>
               </div>
-
-              <div className="flex-grow overflow-y-auto p-4 space-y-4">
-                {error && (
-                  <Alert variant="destructive">
-                    <AlertTriangle className="h-4 w-4" />
-                    <AlertDescription>{error}</AlertDescription>
-                  </Alert>
-                )}
-                {messages.map((msg, index) => (
+            </div>
+            <div className="flex-grow overflow-y-auto p-4 space-y-4">
+              {error && (
+                <Alert variant="destructive">
+                  <AlertTriangle className="h-4 w-4" />
+                  <AlertDescription>{error}</AlertDescription>
+                </Alert>
+              )}
+              {messages.map((msg, index) => (
+                <div
+                  key={index}
+                  className={`flex ${
+                    msg.role === "user" ? "justify-end" : "justify-start"
+                  }`}
+                >
                   <div
-                    key={index}
                     className={`flex ${
-                      msg.role === "user" ? "justify-end" : "justify-start"
-                    }`}
+                      msg.role === "user" ? "flex-row-reverse" : "flex-row"
+                    } items-end space-x-2 w-full`}
                   >
+                    <Avatar
+                      className={`w-8 h-8 ${
+                        msg.role === "user" ? "ml-2" : "mr-2"
+                      }`}
+                    >
+                      <AvatarFallback>
+                        {msg.role === "user" ? "U" : "AI"}
+                      </AvatarFallback>
+                    </Avatar>
                     <div
-                      className={`flex ${
-                        msg.role === "user" ? "flex-row-reverse" : "flex-row"
-                      } items-end space-x-2 w-full`}
+                      className={`max-w-[70%] p-3 rounded-lg ${
+                        msg.role === "user"
+                          ? "bg-blue-500 text-white"
+                          : "bg-gray-200 dark:bg-gray-700 text-black dark:text-white"
+                      }`}
                     >
-                      <Avatar
-                        className={`w-8 h-8 ${
-                          msg.role === "user" ? "ml-2" : "mr-2"
-                        }`}
-                      >
-                        <AvatarFallback>
-                          {msg.role === "user" ? "U" : "AI"}
-                        </AvatarFallback>
-                      </Avatar>
-                      <div
-                        className={`max-w-[70%] p-3 rounded-lg ${
-                          msg.role === "user"
-                            ? "bg-blue-500 text-white"
-                            : "bg-gray-200 dark:bg-gray-700 text-black dark:text-white"
-                        }`}
-                      >
-                        {msg.status === "loading" ? "..." : msg.content}
-                      </div>
+                      {msg.status === "loading" ? "..." : msg.content[0].text}
                     </div>
                   </div>
-                ))}
-                {pendingConfirmation && (
-                  <div className="flex justify-center space-x-2">
-                    <Button onClick={() => handleConfirmation(true)}>
-                      {t("approve")}
-                    </Button>
-                    <Button onClick={() => handleConfirmation(false)}>
-                      {t("reject")}
-                    </Button>
-                  </div>
-                )}
-                <div ref={messageEndRef} />
-              </div>
+                  {msg.aiResponse?.user_confirmation_required &&
+                    msg.executionStatus === "pending" && (
+                      <div className="flex justify-center space-x-2 mt-2">
+                        <Button onClick={() => handleConfirmation(index, true)}>
+                          {t("approve")}
+                        </Button>
+                        <Button
+                          onClick={() => handleConfirmation(index, false)}
+                        >
+                          {t("reject")}
+                        </Button>
+                      </div>
+                    )}
+                  {/* {msg.aiResponse?.execution && (
+                    <div className="mt-2">
+                      {msg.aiResponse.execution
+                        .filter((step) => !!step.code)
+                        .map((step, stepIndex) => (
+                          <ExecutionStepComponent key={stepIndex} step={step} />
+                        ))}
+                    </div>
+                  )} */}
+                </div>
+              ))}
+              <div ref={messageEndRef} />
+            </div>
 
-              <BottomInputContainer
-                input={input}
-                isLoading={isLoading}
-                startListening={startListening}
-                stopListening={stopListening}
-                handleSend={handleSend}
-                setInput={setInput}
-                abortRequest={abortRequest}
-              />
-            </>
+            <BottomInputContainer
+              input={input}
+              isLoading={isLoading}
+              handleSend={handleSend}
+              setInput={setInput}
+              abortRequest={abortRequest}
+            />
           </CardContent>
         </Card>
       </div>
@@ -216,104 +264,4 @@ const OsaiApp = ({
   );
 };
 
-const BottomInputContainer = ({
-  isLoading,
-  input,
-  stopListening,
-  startListening,
-  handleSend,
-  setInput,
-  abortRequest,
-}: {
-  input: string;
-  isLoading: boolean;
-  stopListening: () => void;
-  startListening: () => void;
-  handleSend: () => void;
-  setInput: (s: string) => void;
-  abortRequest: () => void;
-}) => {
-  const { t } = useTranslation();
-  const { transcript } = useSpeechRecognition();
-  const textareaRef = useRef<HTMLTextAreaElement>(null);
-
-  const handleVoiceInput = () => {
-    if (transcript) {
-      stopListening();
-    } else {
-      startListening();
-    }
-  };
-
-  const handleInputChange = (e: React.ChangeEvent<HTMLTextAreaElement>) => {
-    const value = e.target.value;
-    if (value.length <= MAX_CHARS) {
-      setInput(value);
-    }
-  };
-
-  const adjustHeight = () => {
-    const textarea = textareaRef.current;
-    if (!textarea) return;
-
-    textarea.style.height = "auto";
-    const scrollHeight = input === "" ? 45 : textarea.scrollHeight;
-    const lines = scrollHeight / 45;
-    const newRows = Math.max(1, Math.min(10, Math.floor(lines)));
-
-    textarea.style.height = `${newRows * 45}px`;
-  };
-
-  useEffect(adjustHeight, [input]);
-
-  return (
-    <div className="bg-gray-50 dark:bg-gray-800">
-      <div className="flex p-2 items-end space-x-2 bg-white dark:bg-gray-700 rounded-2 overflow-hidden shadow-inner">
-        <Button
-          variant="ghost"
-          className="rounded-full min-w-10 p-2"
-          onClick={handleVoiceInput}
-        >
-          <Mic size={16} className={transcript ? "text-red-500" : ""} />
-        </Button>
-        <Textarea
-          ref={textareaRef}
-          value={input}
-          onChange={handleInputChange}
-          placeholder={t("typeMessage")!}
-          className={cn(
-            "flex-grow border-none bg-transparent focus:ring-0 focus:outline-none resize-none",
-            "min-h-[2.5rem] py-2 px-3 text-base leading-relaxed",
-            "scrollbar scrollbar-thumb-gray-300 dark:scrollbar-thumb-gray-600",
-            "scrollbar-track-transparent scrollbar-thin hover:scrollbar-thumb-gray-400 dark:hover:scrollbar-thumb-gray-500",
-            "!border-none focus-visible:ring-0 focus-visible:outline-none"
-          )}
-          style={{
-            minHeight: `${MIN_TEXTAREA_HEIGHT}px`,
-            maxHeight: `${MAX_TEXTAREA_HEIGHT}px`,
-            overflowY: "auto",
-            boxSizing: "border-box",
-          }}
-          onKeyPress={(e) => {
-            if (e.key === "Enter" && !e.shiftKey) {
-              e.preventDefault();
-              handleSend();
-            }
-          }}
-        />
-        <Button
-          className="rounded-full min-w-10 p-2"
-          onClick={isLoading ? abortRequest : handleSend}
-        >
-          {isLoading ? (
-            <StopCircle size={16} className="text-red-500" />
-          ) : (
-            <Send size={16} />
-          )}
-        </Button>
-      </div>
-    </div>
-  );
-};
-
 export default OsaiApp;
diff --git a/src/components/SettingsModal.tsx b/src/components/SettingsModal.tsx
index fbaf85e..5556f3f 100644
--- a/src/components/SettingsModal.tsx
+++ b/src/components/SettingsModal.tsx
@@ -143,7 +143,7 @@ const SettingsModal = ({
                       e.target.value
                     )
                   }
-                  placeholder={t("enterApiKey")}
+                  placeholder={t("enterApiKey")!}
                   className="flex-grow"
                 />
                 <button
diff --git a/src/components/SideDrawer .tsx b/src/components/SideDrawer .tsx
index c46bb59..7c2dd0f 100644
--- a/src/components/SideDrawer .tsx	
+++ b/src/components/SideDrawer .tsx	
@@ -14,7 +14,7 @@ const SideDrawer = () => {
       if (isExpanded) {
         await appWindow.setSize(new PhysicalSize(400, 528));
         await appWindow.setPosition(
-          new PhysicalPosition(screenWidth - 400, screenHeight * 0.4)
+          new PhysicalPosition(screenWidth - 380, screenHeight * 0.4)
         );
       } else {
         await appWindow.setSize(new PhysicalSize(40, 24));
diff --git a/src/config/aiProviders.ts b/src/config/aiProviders.ts
index 49212af..f073ba5 100644
--- a/src/config/aiProviders.ts
+++ b/src/config/aiProviders.ts
@@ -24,6 +24,7 @@ export interface AIResponse {
   thought_process: string;
   plan: string[];
   user_confirmation_required: boolean;
+  should_execute_code: boolean;
   // confirmation_message: string;
   execution: Array<{
     step: string;
@@ -35,33 +36,70 @@ export interface AIResponse {
 
 const tools: Anthropic.Messages.Tool[] = [
   {
-    name: "format_response",
+    name: "os_ai_assistant",
     description:
-      "Format the AI's response into a specific JSON structure. This structure includes the AI's thought process, action plan, execution details, and final response. It also indicates whether user confirmation is required and provides a confirmation message if needed. This formatted response ensures consistent and structured communication between the AI system and the user interface.",
+      "An AI assistant for executing operating system tasks and answering queries",
     input_schema: {
       type: "object",
       properties: {
-        thought_process: { type: "string" },
-        plan: { type: "array", items: { type: "string" } },
-        user_confirmation_required: { type: "boolean" },
-        // confirmation_message: { type: "string" },
+        thought_process: {
+          type: "string",
+          description: "The AI's reasoning process for the given input",
+        },
+        plan: {
+          type: "array",
+          items: {
+            type: "string",
+          },
+          description:
+            "A list of minimal, atomic steps planned to complete the task",
+        },
+        user_confirmation_required: {
+          type: "boolean",
+          description:
+            "True only if the task involves system modifications or accessing sensitive data",
+        },
+        should_execute_code: {
+          type: "boolean",
+          description:
+            "True if the task requires executing system commands or browser actions",
+        },
         execution: {
           type: "array",
           items: {
             type: "object",
             properties: {
-              step: { type: "string" },
-              code: { type: "string" },
-              result: { type: "string" },
+              step: {
+                type: "string",
+                description: "Description of the execution step",
+              },
+              code: {
+                type: "string",
+                description:
+                  "The actual system command to be executed, or an empty string if not applicable",
+              },
+              result: {
+                type: "string",
+                description:
+                  "The expected or actual result of the execution step",
+              },
             },
+            required: ["step", "code", "result"],
           },
+          description:
+            "Detailed execution steps including only steps that require code execution",
+        },
+        response: {
+          type: "string",
+          description:
+            "The final response to the user, including results or next steps, without inventing information",
         },
-        response: { type: "string" },
       },
       required: [
         "thought_process",
         "plan",
         "user_confirmation_required",
+        "should_execute_code",
         "execution",
         "response",
       ],
@@ -100,8 +138,18 @@ const sendMessageToAnthropic = async ({
   };
   console.log(`Sending message to Claude:`, invokeParams);
   const response = await invoke("send_message_to_anthropic", invokeParams);
-  console.log(`Response from Claude:`, response);
-  return response.data as AIResponse;
+  const res = JSON.parse(response);
+  console.log(`Response from Claude:`, res);
+  // The structured answer is the `input` of the tool_use content block. A reply
+  // can also carry text blocks (or only text), so look the block up by type
+  // instead of assuming it is the last element, and fail loudly if it is absent.
+  const toolUse = Array.isArray(res?.content)
+    ? res.content.find((block: any) => block?.type === "tool_use")
+    : undefined;
+  if (!toolUse?.input) {
+    throw new Error("Claude response did not contain a tool_use block");
+  }
+  return toolUse.input as AIResponse;
 
   // return JSON.parse(response.content[0].text) as AIResponse;
 };
diff --git a/src/hooks/useAI.ts b/src/hooks/useAI.ts
index b0f722a..e5270f0 100644
--- a/src/hooks/useAI.ts
+++ b/src/hooks/useAI.ts
@@ -4,6 +4,7 @@ import axios from "axios";
 import { AIResponse, OsaiError, aiProviders } from "../config/aiProviders";
 import { useSettings } from "./useSettings";
 import { invoke } from "@tauri-apps/api";
+import { Message } from "@/type";
 
 export const useAI = () => {
   const [isLoading, setIsLoading] = useState(false);
@@ -12,10 +13,7 @@ export const useAI = () => {
   const cancelFlagRef = useRef<any>(null);
 
   const sendMessage = useCallback(
-    async (
-      input: string,
-      providerName: string = "Claude"
-    ): Promise<AIResponse> => {
+    async (messages: Message[]): Promise<AIResponse> => {
       setIsLoading(true);
 
       try {
@@ -23,12 +21,12 @@ export const useAI = () => {
           (p) => p.name === settings.AI_PROVIDER
         );
         if (!provider) {
-          throw new Error(`AI provider ${providerName} not found`);
+          throw new Error(`AI provider ${settings.AI_PROVIDER} not found`);
         }
         const apiKey = settings[`${settings.AI_PROVIDER}_API_KEY`];
         if (!apiKey) {
           throw new Error(
-            `API key for ${providerName} not set, Open settings and set the API key`
+            `API key for ${settings.AI_PROVIDER} not set, Open settings and set the API key`
           );
         }
         cancelFlagRef.current = await invoke("create_cancel_flag");
@@ -37,16 +35,14 @@ export const useAI = () => {
           model: settings.AI_MODEL,
           apiKey,
           flagId: cancelFlagRef.current,
-          messages: [
-            {
-              role: "user",
-              content: input,
-            },
-          ],
+          messages: messages,
         });
         return response;
       } catch (error) {
-        console.error(`Error sending message to ${providerName}:`, error);
+        console.error(
+          `Error sending message to ${settings.AI_PROVIDER}:`,
+          error
+        );
         const osaiError = error as OsaiError;
         if (
           osaiError.message?.includes("API key for") ||
@@ -71,12 +67,32 @@ export const useAI = () => {
     },
     [settings, t]
   );
+  /**
+   * Runs `code` through the Tauri `execute_code` command.
+   *
+   * Never rejects: a failed invocation is logged and reported as
+   * `{ success: false, output: <stringified error> }`.
+   */
+  const executeCode = useCallback(
+    async (code: string): Promise<{ success: boolean; output: string }> => {
+      try {
+        const result: string = await invoke("execute_code", { code });
+        return { success: true, output: result };
+      } catch (error: unknown) {
+        console.error("Error executing code:", error);
+        // String() instead of error.toString(): a null/undefined rejection
+        // would otherwise throw here and break the never-rejects contract.
+        return { success: false, output: String(error) };
+      }
+    },
+    []
+  );
   const abortRequest = useCallback(async () => {
     if (cancelFlagRef.current) {
-      await invoke("cancel_request", { cancelFlag: cancelFlagRef.current });
+      await invoke("cancel_request", { flagId: cancelFlagRef.current }); // same `flagId` key the send path passes; presumably matches the Rust command's `flag_id` parameter — confirm
       cancelFlagRef.current = null;
       setIsLoading(false);
     }
   }, []);
-  return { sendMessage, isLoading, abortRequest };
+  return { sendMessage, isLoading, abortRequest, executeCode };
 };
diff --git a/src/type.ts b/src/type.ts
new file mode 100644
index 0000000..26feb89
--- /dev/null
+++ b/src/type.ts
@@ -0,0 +1,31 @@
+export interface MessageContent { // One content part of a message; mirrors the Rust `MessageContent` struct in src-tauri/src/ai/claude.rs.
+  type: "text"; // Discriminator; only plain-text parts are modeled here.
+  text: string; // The text carried by this part.
+}
+
+export interface Message { // A single conversation turn; useAI's sendMessage takes an array of these.
+  role: "user" | "assistant"; // Author of the turn.
+  content: MessageContent[]; // Content parts of the turn (the Rust side declares this as Vec<MessageContent>).
+}
+
+export interface AIResponse { // Structured reply; fields follow the `os_ai_assistant` tool input schema in src/config/aiProviders.ts.
+  thought_process: string; // The AI's reasoning process for the given input.
+  plan: string[]; // Minimal, atomic steps planned to complete the task.
+  user_confirmation_required: boolean; // True only if the task involves system modifications or accessing sensitive data.
+  should_execute_code: boolean; // True if the task requires executing system commands or browser actions.
+  execution: ExecutionStep[]; // Execution steps; per the schema, only steps that require code execution.
+  response: string; // The final response to the user.
+} // NOTE(review): src/config/aiProviders.ts exports its own AIResponse (the one useAI.ts imports) — keep both in sync or consolidate.
+
+export interface ExecutionStep { // Element type of AIResponse.execution.
+  step: string; // Description of the execution step.
+  code: string; // The system command to execute, or an empty string if not applicable.
+  result: string; // The expected or actual result of the step.
+  status?: "pending" | "success" | "failure"; // Not part of the tool schema; presumably set client-side as steps run — confirm.
+}
+
+export interface ChatMessage extends Message { // A Message plus optional extra fields; presumably chat-UI state — confirm against the consuming component.
+  status?: "loading" | "complete"; // presumably whether the reply is still being fetched — confirm
+  aiResponse?: AIResponse; // Structured reply attached to this message, when present.
+  executionStatus?: "pending" | "executing" | "complete" | "rejected"; // presumably the confirm/run lifecycle of aiResponse.execution — confirm
+}