Skip to content

Commit 4119bed

Browse files
matthewchan-g authored and copybara-github committed
Change Message from variant to a class that derives from nlohmann::ordered_json.
LiteRT-LM — PiperOrigin-RevId: 893152404
1 parent ffdb0fc commit 4119bed

24 files changed

+340
-498
lines changed

c/engine.cc

Lines changed: 7 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -75,17 +75,12 @@ CreateConversationCallback(LiteRtLmStreamCallback callback, void* user_data) {
7575
callback(user_data, nullptr, true, const_cast<char*>(error_str.c_str()));
7676
return;
7777
}
78-
if (auto* json_msg = std::get_if<litert::lm::JsonMessage>(&*message)) {
79-
if (json_msg->is_null()) { // End of stream marker
80-
callback(user_data, nullptr, true, nullptr);
81-
} else {
82-
std::string json_str = json_msg->dump();
83-
callback(user_data, const_cast<char*>(json_str.c_str()), false,
84-
nullptr);
85-
}
78+
if (message->empty()) { // End of stream marker
79+
callback(user_data, nullptr, true, nullptr);
8680
} else {
87-
std::string error_str = "Unsupported message type";
88-
callback(user_data, nullptr, true, const_cast<char*>(error_str.c_str()));
81+
std::string json_str = message->dump();
82+
callback(user_data, const_cast<char*>(json_str.c_str()), false,
83+
nullptr);
8984
}
9085
};
9186
}
@@ -110,7 +105,7 @@ using ::litert::lm::Engine;
110105
using ::litert::lm::EngineFactory;
111106
using ::litert::lm::EngineSettings;
112107
using ::litert::lm::InputText;
113-
using ::litert::lm::JsonMessage;
108+
114109
using ::litert::lm::Message;
115110
using ::litert::lm::ModelAssets;
116111
using ::litert::lm::Responses;
@@ -712,13 +707,8 @@ LiteRtLmJsonResponse* litert_lm_conversation_send_message(
712707
ABSL_LOG(ERROR) << "Failed to send message: " << response.status();
713708
return nullptr;
714709
}
715-
auto* json_response = std::get_if<JsonMessage>(&*response);
716-
if (!json_response) {
717-
ABSL_LOG(ERROR) << "Response is not a JSON message.";
718-
return nullptr;
719-
}
720710
auto* c_response = new LiteRtLmJsonResponse;
721-
c_response->json_string = json_response->dump();
711+
c_response->json_string = response->dump();
722712
return c_response;
723713
}
724714

docs/api/cpp/conversation.md

Lines changed: 14 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -58,7 +58,7 @@ CHECK_OK(conversation);
5858

5959
// 4. Send message to the LLM with blocking call.
6060
absl::StatusOr<Message> model_message = (*conversation)->SendMessage(
61-
JsonMessage{
61+
Message{
6262
{"role", "user"},
6363
{"content", "What is the tallest building in the world?"}
6464
});
@@ -72,7 +72,7 @@ std::cout << *model_message << std::endl;
7272
// process the message once a chunk of message output is received.
7373
std::stringstream captured_output;
7474
(*conversation)->SendMessageAsync(
75-
JsonMessage{
75+
Message{
7676
{"role", "user"},
7777
{"content", "What is the tallest building in the world?"}
7878
},
@@ -97,18 +97,16 @@ absl::AnyInvocable<void(absl::StatusOr<Message>)> CreatePrintMessageCallback(
9797
std::cout << message.status().message() << std::endl;
9898
return;
9999
}
100-
if (auto json_message = std::get_if<JsonMessage>(&(*message))) {
101-
if (json_message->is_null()) {
102-
std::cout << std::endl << std::flush;
103-
return;
104-
}
105-
ABSL_CHECK_OK(PrintJsonMessage(*json_message, captured_output,
106-
/*streaming=*/true));
100+
if (message->empty()) {
101+
std::cout << std::endl << std::flush;
102+
return;
107103
}
104+
ABSL_CHECK_OK(PrintMessage(*message, captured_output,
105+
/*streaming=*/true));
108106
};
109107
}
110108
111-
absl::Status PrintJsonMessage(const JsonMessage& message,
109+
absl::Status PrintMessage(const Message& message,
112110
std::stringstream& captured_output,
113111
bool streaming = false) {
114112
if (message["content"].is_array()) {
@@ -162,7 +160,7 @@ auto engine_settings = EngineSettings::CreateDefault(
162160

163161
// Send message to the LLM with image data.
164162
absl::StatusOr<Message> model_message = (*conversation)->SendMessage(
165-
JsonMessage{
163+
Message{
166164
{"role", "user"},
167165
{"content", { // Now content must be an array.
168166
{{"type", "text"}, {"text", "Describe the following image: "}},
@@ -176,7 +174,7 @@ std::cout << *model_message << std::endl;
176174

177175
// Send message to the LLM with audio data.
178176
model_message = (*conversation)->SendMessage(
179-
JsonMessage{
177+
Message{
180178
{"role", "user"},
181179
{"content", { // Now content must be an array.
182180
{{"type", "text"}, {"text", "Transcribe the audio: "}},
@@ -190,7 +188,7 @@ std::cout << *model_message << std::endl;
190188

191189
// The content can include multiple image or audio data.
192190
model_message = (*conversation)->SendMessage(
193-
JsonMessage{
191+
Message{
194192
{"role", "user"},
195193
{"content", { // Now content must be an array.
196194
{{"type", "text"}, {"text", "First briefly describe the two images "}},
@@ -223,7 +221,7 @@ data to Session.
223221
224222
The core input and output format for the Conversation API is
225223
[`Message`][Message]. Currently, this is implemented as
226-
[`JsonMessage`][JsonMessage], which is a type alias for
224+
a class that derives from
227225
[`ordered_json`][ordered_json], a flexible nested key-value data structure.
228226
229227
The [`Conversation`][Conversation] API operates on a message-in-message-out
@@ -492,7 +490,7 @@ This function is triggered under the following conditions:
492490
* When a new chunk of the [`Message`][Message] is received from the Model.
493491
* If an error occurs during LiteRT-LM's message processing.
494492
* Upon completion of the LLM's inference, the callback is triggered with an
495-
empty [`Message`][Message] (e.g., `JsonMessage()`) to signal the end of the
493+
empty [`Message`][Message] (e.g., `Message()`) to signal the end of the
496494
response.
497495

498496
Refer to the [Step 6 asynchronous call](#text-only-content) for an example
@@ -584,7 +582,7 @@ the asynchronous call is complete.
584582
[Jinja]: https://jinja.palletsprojects.com/en/stable/ "jinja prompt template"
585583
[PromptTemplate]: https://github.com/google-ai-edge/LiteRT-LM/blob/main/runtime/components/prompt_template.h "litert::lm::PromptTemplate"
586584
[message]: https://github.com/google-ai-edge/LiteRT-LM/blob/63f7dec93ac85560e64194a00b5d7c407de40846/runtime/conversation/io_types.h#L28 "litert::lm::Message"
587-
[jsonmessage]: https://github.com/google-ai-edge/LiteRT-LM/blob/63f7dec93ac85560e64194a00b5d7c407de40846/runtime/conversation/io_types.h#L25 "litert::lm::JsonMessage"
585+
588586
[ordered_json]: https://json.nlohmann.me/api/ordered_json/ "ordered_json"
589587
[preface]: https://github.com/google-ai-edge/LiteRT-LM/blob/63f7dec93ac85560e64194a00b5d7c407de40846/runtime/conversation/io_types.h#L48 "litert::lm::Preface"
590588
[ConversationConfig]: https://github.com/google-ai-edge/LiteRT-LM/blob/63f7dec93ac85560e64194a00b5d7c407de40846/runtime/conversation/conversation.h#L44 "litert::lm::ConversationConfig"

docs/api/cpp/tool-use.md

Lines changed: 37 additions & 50 deletions
Original file line numberDiff line numberDiff line change
@@ -143,7 +143,7 @@ Example:
143143
144144
```c++
145145
// Construct the user message as a JSON object.
146-
JsonMessage user_message = JsonMessage::parse(R"({
146+
Message user_message = Message::parse(R"({
147147
"role": "user",
148148
"content": {
149149
"type": "text",
@@ -234,7 +234,7 @@ know the result. Pass the tool result as a message with the `role` set to
234234

235235
```c++
236236
// Construct the tool message containing the result.
237-
JsonMessage tool_message = {{"role", "tool"}, {"content", weather_report}};
237+
Message tool_message = {{"role", "tool"}, {"content", weather_report}};
238238

239239
// Send the tool message to the model.
240240
ASSIGN_OR_RETURN(model_message, conversation->SendMessage(tool_message));
@@ -362,7 +362,7 @@ while (true) {
362362
}
363363
364364
// Construct the user message.
365-
JsonMessage input_message = {
365+
Message input_message = {
366366
{"role", "user"},
367367
{"content", {{{"type", "text"}, {"text", input_prompt}}}}};
368368
@@ -372,41 +372,35 @@ while (true) {
372372
ASSIGN_OR_RETURN(Message message,
373373
conversation->SendMessage(input_message));
374374
375-
// Get the JSON message from the model's response.
376-
if (std::holds_alternative<json>(message)) {
377-
JsonMessage message_json =
378-
std::get<nlohmann::ordered_json>(message);
379-
380-
// Check for tool calls.
381-
if (message_json.contains("tool_calls") &&
382-
message_json["tool_calls"].is_array() &&
383-
!message_json["tool_calls"].empty()) {
384-
// This JSON array will hold the tool response messages.
385-
nlohmann::ordered_json tool_messages = nlohmann::ordered_json::array();
386-
387-
// For each tool call, call the tool and add the response.
388-
for (const auto& tool_call : message_json["tool_calls"]) {
389-
JsonMessage tool_message = {{"role", "tool"},
390-
{"content", {}}};
391-
const nlohmann::ordered_json& function = tool_call["function"];
392-
tool_message["content"] =
393-
tools.CallTool(function["name"], function["arguments"]);
394-
tool_messages.push_back(tool_message);
395-
}
375+
// Check for tool calls.
376+
if (message.contains("tool_calls") &&
377+
message["tool_calls"].is_array() &&
378+
!message["tool_calls"].empty()) {
379+
// This JSON array will hold the tool response messages.
380+
nlohmann::ordered_json tool_messages = nlohmann::ordered_json::array();
381+
382+
// For each tool call, call the tool and add the response.
383+
for (const auto& tool_call : message["tool_calls"]) {
384+
Message tool_message = {{"role", "tool"},
385+
{"content", {}}};
386+
const nlohmann::ordered_json& function = tool_call["function"];
387+
tool_message["content"] =
388+
tools.CallTool(function["name"], function["arguments"]);
389+
tool_messages.push_back(tool_message);
390+
}
396391
397-
// The next input message is the tool response.
398-
input_message = tool_messages;
399-
} else {
400-
// If there are no tool calls, print the model's response and exit the
401-
// tool calling loop.
402-
for (const auto& item : message_json["content"]) {
403-
if (item.contains("type") && item["type"] == "text") {
404-
std::cout << item["text"].get<std::string>() << std::endl;
405-
}
392+
// The next input message is the tool response.
393+
input_message = tool_messages;
394+
} else {
395+
// If there are no tool calls, print the model's response and exit the
396+
// tool calling loop.
397+
for (const auto& item : message["content"]) {
398+
if (item.contains("type") && item["type"] == "text") {
399+
std::cout << item["text"].get<std::string>() << std::endl;
406400
}
407-
408-
break;
409401
}
402+
403+
break;
410404
}
411405
}
412406
}
@@ -449,35 +443,28 @@ while (true) {
449443
return;
450444
}
451445

452-
if (!std::holds_alternative<nlohmann::json>(*message)) {
453-
return;
454-
}
455-
456-
// Get JSON from the message.
457-
JsonMessage message_json = std::get<JsonMessage>(*message);
458-
459446
// An empty message indicates the model is done generating.
460-
if (message_json.is_null()) {
447+
if (message->empty()) {
461448
std::cout << std::endl << std::flush;
462449
done.Notify();
463450
return;
464451
}
465452

466453
// Print any text content.
467-
if (message_json.contains("content") &&
468-
message_json["content"].is_array()) {
469-
for (const auto& item : message_json["content"]) {
454+
if (message->contains("content") &&
455+
(*message)["content"].is_array()) {
456+
for (const auto& item : (*message)["content"]) {
470457
if (item.contains("text")) {
471458
std::cout << item["text"] << std::endl << std::flush;
472459
}
473460
}
474461
}
475462

476463
// Collect any tool calls, if present.
477-
if (message_json.contains("tool_calls") &&
478-
message_json["tool_calls"].is_array() &&
479-
!message_json["tool_calls"].empty()) {
480-
for (const auto& tool_call : message_json["tool_calls"]) {
464+
if (message->contains("tool_calls") &&
465+
(*message)["tool_calls"].is_array() &&
466+
!(*message)["tool_calls"].empty()) {
467+
for (const auto& tool_call : (*message)["tool_calls"]) {
481468
tool_calls.push_back(tool_call);
482469
}
483470
}

kotlin/java/com/google/ai/edge/litertlm/jni/litertlm.cc

Lines changed: 17 additions & 36 deletions
Original file line numberDiff line numberDiff line change
@@ -69,7 +69,7 @@ using litert::lm::InputAudio;
6969
using litert::lm::InputData;
7070
using litert::lm::InputImage;
7171
using litert::lm::InputText;
72-
using litert::lm::JsonMessage;
72+
7373
using litert::lm::JsonPreface;
7474
using litert::lm::Message;
7575
using litert::lm::ModelAssets;
@@ -939,8 +939,8 @@ LITERTLM_JNIEXPORT void JNICALL JNI_METHOD(nativeSendMessageAsync)(
939939
reinterpret_cast<Conversation*>(conversation_pointer);
940940

941941
const char* json_chars = env->GetStringUTFChars(messageJSONString, nullptr);
942-
litert::lm::JsonMessage json_message =
943-
nlohmann::ordered_json::parse(json_chars);
942+
litert::lm::Message message =
943+
Message(nlohmann::ordered_json::parse(json_chars));
944944
env->ReleaseStringUTFChars(messageJSONString, json_chars);
945945

946946
litert::lm::OptionalArgs optional_args;
@@ -996,27 +996,16 @@ LITERTLM_JNIEXPORT void JNICALL JNI_METHOD(nativeSendMessageAsync)(
996996
};
997997

998998
if (message.ok()) {
999-
if (!std::holds_alternative<litert::lm::JsonMessage>(*message)) {
1000-
ABSL_LOG(WARNING) << "Receive callback OnError: Not a JsonMessage";
1001-
jstring err_message =
1002-
env->NewStringUTF("Response is not a JsonMessage");
1003-
env->CallVoidMethod(callback_global, on_error_mid,
1004-
(jint)absl::StatusCode::kInternal, err_message);
1005-
env->DeleteLocalRef(err_message);
999+
if (message->empty()) {
1000+
// Null/empty message indicates completion.
1001+
env->CallVoidMethod(callback_global, on_complete_mid);
10061002
on_done_fn();
10071003
} else {
1008-
auto json_message = std::get<litert::lm::JsonMessage>(*message);
1009-
if (json_message.is_null()) {
1010-
// Null message indicates completion.
1011-
env->CallVoidMethod(callback_global, on_complete_mid);
1012-
on_done_fn();
1013-
} else {
1014-
std::string message_str = json_message.dump();
1015-
jstring message_jstr = NewStringStandardUTF(env, message_str);
1016-
env->CallVoidMethod(callback_global, on_message_mid,
1017-
message_jstr);
1018-
env->DeleteLocalRef(message_jstr);
1019-
}
1004+
std::string message_str = message->dump();
1005+
jstring message_jstr = NewStringStandardUTF(env, message_str);
1006+
env->CallVoidMethod(callback_global, on_message_mid,
1007+
message_jstr);
1008+
env->DeleteLocalRef(message_jstr);
10201009
}
10211010
} else {
10221011
ABSL_LOG(WARNING) << "Receive callback OnError: " << message.status();
@@ -1033,8 +1022,8 @@ LITERTLM_JNIEXPORT void JNICALL JNI_METHOD(nativeSendMessageAsync)(
10331022
}
10341023
};
10351024

1036-
auto status = conversation->SendMessageAsync(
1037-
json_message, std::move(callback_fn), std::move(optional_args));
1025+
auto status = conversation->SendMessageAsync(message, std::move(callback_fn),
1026+
std::move(optional_args));
10381027

10391028
if (!status.ok()) {
10401029
ThrowLiteRtLmJniException(
@@ -1049,8 +1038,8 @@ LITERTLM_JNIEXPORT jstring JNICALL JNI_METHOD(nativeSendMessage)(
10491038
reinterpret_cast<Conversation*>(conversation_pointer);
10501039

10511040
const char* json_chars = env->GetStringUTFChars(messageJSONString, nullptr);
1052-
litert::lm::JsonMessage json_message =
1053-
nlohmann::ordered_json::parse(json_chars);
1041+
litert::lm::Message message =
1042+
Message(nlohmann::ordered_json::parse(json_chars));
10541043
env->ReleaseStringUTFChars(messageJSONString, json_chars);
10551044

10561045
litert::lm::OptionalArgs optional_args;
@@ -1060,22 +1049,14 @@ LITERTLM_JNIEXPORT jstring JNICALL JNI_METHOD(nativeSendMessage)(
10601049
optional_args.extra_context = extra_context;
10611050
}
10621051

1063-
auto response =
1064-
conversation->SendMessage(json_message, std::move(optional_args));
1052+
auto response = conversation->SendMessage(message, std::move(optional_args));
10651053
if (!response.ok()) {
10661054
ThrowLiteRtLmJniException(env, "Failed to call nativeSendMessage: " +
10671055
response.status().ToString());
10681056
return nullptr;
10691057
}
10701058

1071-
if (!std::holds_alternative<litert::lm::JsonMessage>(*response)) {
1072-
ThrowLiteRtLmJniException(
1073-
env, "Failed to call nativeSendMessage: Response is not a JsonMessage");
1074-
return nullptr;
1075-
}
1076-
1077-
auto json_response = std::get<litert::lm::JsonMessage>(*response);
1078-
return NewStringStandardUTF(env, json_response.dump());
1059+
return NewStringStandardUTF(env, response->dump());
10791060
}
10801061

10811062
LITERTLM_JNIEXPORT void JNICALL JNI_METHOD(nativeConversationCancelProcess)(

0 commit comments

Comments
 (0)