mirror of
https://github.com/google-ai-edge/gallery.git
synced 2025-07-17 11:46:39 -04:00
I've integrated web search into the LLM Chat. Here's what I did:
- I added a WebSearchService to call the Tavily API.
- I modified the LlmChatViewModel to use the WebSearchService to augment your queries with web search results (using a placeholder API key).
- I added UI feedback for web search status (loading, errors, no results).
- I updated the ViewModelProvider to correctly inject the WebSearchService into the LlmChatViewModel and LlmAskImageViewModel.
This commit is contained in:
parent
ebb605131d
commit
2ed268e5ce
3 changed files with 183 additions and 8 deletions
|
@ -0,0 +1,100 @@
|
||||||
|
package com.google.ai.edge.gallery.data
|
||||||
|
|
||||||
|
import android.util.Log
|
||||||
|
import kotlinx.coroutines.Dispatchers
|
||||||
|
import kotlinx.coroutines.withContext
|
||||||
|
import okhttp3.MediaType.Companion.toMediaTypeOrNull
|
||||||
|
import okhttp3.OkHttpClient
|
||||||
|
import okhttp3.Request
|
||||||
|
import okhttp3.RequestBody.Companion.toRequestBody
|
||||||
|
import org.json.JSONObject
|
||||||
|
import java.io.IOException
|
||||||
|
|
||||||
|
/**
 * One search hit returned by the Tavily search API.
 *
 * @property title   Title of the matched web page.
 * @property url     URL of the matched web page.
 * @property content Text snippet extracted from the page by Tavily.
 * @property score   Relevance score assigned by Tavily (higher is more relevant).
 */
data class TavilySearchResult(
  val title: String,
  val url: String,
  val content: String,
  val score: Double,
)
|
||||||
|
|
||||||
|
/**
 * Parsed top-level response from the Tavily search API.
 *
 * All fields are nullable: Tavily may omit the synthesized [answer], the
 * echoed [query], or return no [results] at all.
 */
data class TavilySearchResponse(
  val answer: String?,
  val query: String?,
  val results: List<TavilySearchResult>?,
)
|
||||||
|
|
||||||
|
/**
 * Minimal client for the Tavily web search API (POST https://api.tavily.com/search).
 *
 * Ordinary failures (HTTP errors, network errors, malformed JSON) are logged
 * and reported to callers as a null return value — this service never throws
 * on such failures. Coroutine cancellation, however, is always propagated.
 */
class WebSearchService {

  private val client = OkHttpClient()

  /**
   * Searches the web for [query] via Tavily, on [Dispatchers.IO].
   *
   * The API key is sent both in the JSON body ("api_key") and as a Bearer
   * token, matching Tavily's accepted auth styles.
   *
   * @param apiKey Tavily API key.
   * @param query free-text search query.
   * @return the parsed response, or null on HTTP error, empty body, network
   *   failure, or unparseable JSON.
   */
  suspend fun search(apiKey: String, query: String): TavilySearchResponse? {
    return withContext(Dispatchers.IO) {
      try {
        val jsonRequestBody = JSONObject().apply {
          put("api_key", apiKey)
          put("query", query)
          put("search_depth", "basic")
          put("include_answer", true)
          put("max_results", 3)
          // include_domains and exclude_domains are empty by default
        }.toString()

        val request = Request.Builder()
          .url("https://api.tavily.com/search")
          .header("Authorization", "Bearer $apiKey")
          .header("Content-Type", "application/json")
          .post(jsonRequestBody.toRequestBody("application/json; charset=utf-8".toMediaTypeOrNull()))
          .build()

        client.newCall(request).execute().use { response ->
          if (!response.isSuccessful) {
            Log.e("WebSearchService", "API Error: ${response.code} ${response.message}")
            return@withContext null
          }

          val responseBody = response.body?.string()
          if (responseBody == null) {
            Log.e("WebSearchService", "Empty response body")
            return@withContext null
          }

          parseTavilyResponse(responseBody)
        }
      } catch (e: kotlinx.coroutines.CancellationException) {
        // Never swallow cancellation: rethrow so structured concurrency and
        // caller-side cancellation keep working (the generic Exception catch
        // below would otherwise trap it).
        throw e
      } catch (e: IOException) {
        Log.e("WebSearchService", "Network Error: ${e.message}", e)
        null
      } catch (e: Exception) {
        Log.e("WebSearchService", "Error during search: ${e.message}", e)
        null
      }
    }
  }

  /**
   * Parses a Tavily JSON response body into a [TavilySearchResponse].
   *
   * "answer" and "query" are read via explicit [JSONObject.isNull] checks:
   * optString(name, null) can coerce an explicit JSON null to the literal
   * string "null" on some org.json implementations, which would leak into
   * the prompt-augmentation text downstream.
   *
   * @return the parsed response, or null if the body is not valid JSON or a
   *   result entry is missing a required field.
   */
  private fun parseTavilyResponse(responseBody: String): TavilySearchResponse? {
    return try {
      val jsonObject = JSONObject(responseBody)
      // isNull is true for both a missing key and an explicit JSON null.
      val answer = if (jsonObject.isNull("answer")) null else jsonObject.optString("answer")
      val query = if (jsonObject.isNull("query")) null else jsonObject.optString("query")

      val resultsArray = jsonObject.optJSONArray("results")
      val searchResults = mutableListOf<TavilySearchResult>()
      if (resultsArray != null) {
        for (i in 0 until resultsArray.length()) {
          val resultObj = resultsArray.getJSONObject(i)
          searchResults.add(
            TavilySearchResult(
              title = resultObj.getString("title"),
              url = resultObj.getString("url"),
              content = resultObj.getString("content"),
              score = resultObj.getDouble("score")
            )
          )
        }
      }
      // Callers treat "no results" as null rather than an empty list.
      TavilySearchResponse(answer, query, if (searchResults.isEmpty()) null else searchResults)
    } catch (e: Exception) {
      Log.e("WebSearchService", "Error parsing JSON response: ${e.message}", e)
      null
    }
  }
}
|
|
@ -22,6 +22,7 @@ import androidx.lifecycle.viewmodel.CreationExtras
|
||||||
import androidx.lifecycle.viewmodel.initializer
|
import androidx.lifecycle.viewmodel.initializer
|
||||||
import androidx.lifecycle.viewmodel.viewModelFactory
|
import androidx.lifecycle.viewmodel.viewModelFactory
|
||||||
import com.google.ai.edge.gallery.GalleryApplication
|
import com.google.ai.edge.gallery.GalleryApplication
|
||||||
|
import com.google.ai.edge.gallery.data.WebSearchService
|
||||||
import com.google.ai.edge.gallery.ui.imageclassification.ImageClassificationViewModel
|
import com.google.ai.edge.gallery.ui.imageclassification.ImageClassificationViewModel
|
||||||
import com.google.ai.edge.gallery.ui.imagegeneration.ImageGenerationViewModel
|
import com.google.ai.edge.gallery.ui.imagegeneration.ImageGenerationViewModel
|
||||||
import com.google.ai.edge.gallery.ui.llmchat.LlmChatViewModel
|
import com.google.ai.edge.gallery.ui.llmchat.LlmChatViewModel
|
||||||
|
@ -32,6 +33,10 @@ import com.google.ai.edge.gallery.ui.textclassification.TextClassificationViewMo
|
||||||
|
|
||||||
object ViewModelProvider {
|
object ViewModelProvider {
|
||||||
val Factory = viewModelFactory {
|
val Factory = viewModelFactory {
|
||||||
|
// Create an instance of WebSearchService
|
||||||
|
// This instance will be shared by ViewModels that need it.
|
||||||
|
val webSearchService = WebSearchService()
|
||||||
|
|
||||||
// Initializer for ModelManagerViewModel.
|
// Initializer for ModelManagerViewModel.
|
||||||
initializer {
|
initializer {
|
||||||
val downloadRepository = galleryApplication().container.downloadRepository
|
val downloadRepository = galleryApplication().container.downloadRepository
|
||||||
|
@ -55,17 +60,21 @@ object ViewModelProvider {
|
||||||
|
|
||||||
// Initializer for LlmChatViewModel.
|
// Initializer for LlmChatViewModel.
|
||||||
initializer {
|
initializer {
|
||||||
LlmChatViewModel()
|
// Pass the WebSearchService instance
|
||||||
|
LlmChatViewModel(webSearchService = webSearchService)
|
||||||
}
|
}
|
||||||
|
|
||||||
// Initializer for LlmSingleTurnViewModel..
|
// Initializer for LlmSingleTurnViewModel.
|
||||||
|
// Note: LlmSingleTurnViewModel's constructor was not modified in previous steps.
|
||||||
|
// If it also needs WebSearchService in the future, its initializer and constructor would need similar changes.
|
||||||
initializer {
|
initializer {
|
||||||
LlmSingleTurnViewModel()
|
LlmSingleTurnViewModel()
|
||||||
}
|
}
|
||||||
|
|
||||||
// Initializer for LlmAskImageViewModel.
|
// Initializer for LlmAskImageViewModel.
|
||||||
initializer {
|
initializer {
|
||||||
LlmAskImageViewModel()
|
// Pass the WebSearchService instance
|
||||||
|
LlmAskImageViewModel(webSearchService = webSearchService)
|
||||||
}
|
}
|
||||||
|
|
||||||
// Initializer for ImageGenerationViewModel.
|
// Initializer for ImageGenerationViewModel.
|
||||||
|
|
|
@ -25,6 +25,7 @@ import com.google.ai.edge.gallery.data.Model
|
||||||
import com.google.ai.edge.gallery.data.TASK_LLM_CHAT
|
import com.google.ai.edge.gallery.data.TASK_LLM_CHAT
|
||||||
import com.google.ai.edge.gallery.data.TASK_LLM_ASK_IMAGE
|
import com.google.ai.edge.gallery.data.TASK_LLM_ASK_IMAGE
|
||||||
import com.google.ai.edge.gallery.data.Task
|
import com.google.ai.edge.gallery.data.Task
|
||||||
|
import com.google.ai.edge.gallery.data.WebSearchService
|
||||||
import com.google.ai.edge.gallery.ui.common.chat.ChatMessageBenchmarkLlmResult
|
import com.google.ai.edge.gallery.ui.common.chat.ChatMessageBenchmarkLlmResult
|
||||||
import com.google.ai.edge.gallery.ui.common.chat.ChatMessageLoading
|
import com.google.ai.edge.gallery.ui.common.chat.ChatMessageLoading
|
||||||
import com.google.ai.edge.gallery.ui.common.chat.ChatMessageText
|
import com.google.ai.edge.gallery.ui.common.chat.ChatMessageText
|
||||||
|
@ -46,10 +47,71 @@ private val STATS = listOf(
|
||||||
Stat(id = "latency", label = "Latency", unit = "sec")
|
Stat(id = "latency", label = "Latency", unit = "sec")
|
||||||
)
|
)
|
||||||
|
|
||||||
open class LlmChatViewModel(curTask: Task = TASK_LLM_CHAT) : ChatViewModel(task = curTask) {
|
open class LlmChatViewModel(
|
||||||
|
curTask: Task = TASK_LLM_CHAT,
|
||||||
|
private val webSearchService: WebSearchService
|
||||||
|
) : ChatViewModel(task = curTask) {
|
||||||
fun generateResponse(model: Model, input: String, image: Bitmap? = null, onError: () -> Unit) {
|
fun generateResponse(model: Model, input: String, image: Bitmap? = null, onError: () -> Unit) {
|
||||||
val accelerator = model.getStringConfigValue(key = ConfigKey.ACCELERATOR, defaultValue = "")
|
val accelerator = model.getStringConfigValue(key = ConfigKey.ACCELERATOR, defaultValue = "")
|
||||||
viewModelScope.launch(Dispatchers.Default) {
|
viewModelScope.launch(Dispatchers.Default) {
|
||||||
|
// Web Search Logic
|
||||||
|
var augmentedInput = input
|
||||||
|
var searchPerformed = false
|
||||||
|
var searchSuccessful = false
|
||||||
|
var searchErrorOccurred = false
|
||||||
|
|
||||||
|
// Add search in-progress indicator
|
||||||
|
val searchIndicatorMessage = ChatMessageLoading(
|
||||||
|
text = "正在為您搜索網路獲取最新資訊...",
|
||||||
|
accelerator = accelerator,
|
||||||
|
side = ChatSide.AGENT
|
||||||
|
)
|
||||||
|
addMessage(model = model, message = searchIndicatorMessage)
|
||||||
|
|
||||||
|
try {
|
||||||
|
val tavilyResponse = webSearchService.search(apiKey = "YOUR_TAVILY_API_KEY_PLACEHOLDER", query = input)
|
||||||
|
searchPerformed = true
|
||||||
|
|
||||||
|
if (tavilyResponse != null) {
|
||||||
|
searchSuccessful = true
|
||||||
|
val searchAnswer = tavilyResponse.answer
|
||||||
|
val searchResults = tavilyResponse.results
|
||||||
|
|
||||||
|
if (!searchAnswer.isNullOrBlank()) {
|
||||||
|
augmentedInput = "Based on web search results, answer the following: \"${searchAnswer}\". The original question was: \"${input}\""
|
||||||
|
} else if (!searchResults.isNullOrEmpty()) {
|
||||||
|
val snippets = searchResults.take(2).joinToString(separator = "; ") { it.content }
|
||||||
|
if (snippets.isNotBlank()) {
|
||||||
|
augmentedInput = "Based on web search results, here are some relevant snippets: \"${snippets}\". The original question was: \"${input}\""
|
||||||
|
}
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
searchErrorOccurred = true
|
||||||
|
}
|
||||||
|
} catch (e: Exception) {
|
||||||
|
Log.e(TAG, "Web search call failed", e)
|
||||||
|
searchErrorOccurred = true
|
||||||
|
}
|
||||||
|
|
||||||
|
// Remove search in-progress indicator
|
||||||
|
val lastMessage = getLastMessage(model = model)
|
||||||
|
if (lastMessage == searchIndicatorMessage) {
|
||||||
|
removeLastMessage(model = model)
|
||||||
|
}
|
||||||
|
|
||||||
|
// Add search result status messages
|
||||||
|
if (searchErrorOccurred) {
|
||||||
|
addMessage(
|
||||||
|
model = model,
|
||||||
|
message = ChatMessageWarning(content = "網路搜索失敗,將嘗試使用模型知識回答。")
|
||||||
|
)
|
||||||
|
} else if (searchPerformed && !searchSuccessful) {
|
||||||
|
addMessage(
|
||||||
|
model = model,
|
||||||
|
message = ChatMessageWarning(content = "網路搜索未能找到相關資訊,將嘗試使用模型知識回答。")
|
||||||
|
)
|
||||||
|
}
|
||||||
|
|
||||||
setInProgress(true)
|
setInProgress(true)
|
||||||
setPreparing(true)
|
setPreparing(true)
|
||||||
|
|
||||||
|
@ -67,9 +129,11 @@ open class LlmChatViewModel(curTask: Task = TASK_LLM_CHAT) : ChatViewModel(task
|
||||||
|
|
||||||
// Run inference.
|
// Run inference.
|
||||||
val instance = model.instance as LlmModelInstance
|
val instance = model.instance as LlmModelInstance
|
||||||
var prefillTokens = instance.session.sizeInTokens(input)
|
var prefillTokens = instance.session.sizeInTokens(augmentedInput)
|
||||||
if (image != null) {
|
if (image != null) {
|
||||||
prefillTokens += 257
|
// Assuming image context is added separately and not part of the text prompt for token calculation here.
|
||||||
|
// If image contributes to text prompt for LLM, this might need adjustment or be handled by the model instance.
|
||||||
|
prefillTokens += 257 // This is a magic number, ensure it's correct for multimodal inputs.
|
||||||
}
|
}
|
||||||
|
|
||||||
var firstRun = true
|
var firstRun = true
|
||||||
|
@ -82,7 +146,7 @@ open class LlmChatViewModel(curTask: Task = TASK_LLM_CHAT) : ChatViewModel(task
|
||||||
|
|
||||||
try {
|
try {
|
||||||
LlmChatModelHelper.runInference(model = model,
|
LlmChatModelHelper.runInference(model = model,
|
||||||
input = input,
|
input = augmentedInput, // Use augmentedInput here
|
||||||
image = image,
|
image = image,
|
||||||
resultListener = { partialResult, done ->
|
resultListener = { partialResult, done ->
|
||||||
val curTs = System.currentTimeMillis()
|
val curTs = System.currentTimeMillis()
|
||||||
|
@ -241,8 +305,10 @@ open class LlmChatViewModel(curTask: Task = TASK_LLM_CHAT) : ChatViewModel(task
|
||||||
)
|
)
|
||||||
|
|
||||||
// Re-generate the response automatically.
|
// Re-generate the response automatically.
|
||||||
|
// The original triggeredMessage.content will go through the search logic again.
|
||||||
generateResponse(model = model, input = triggeredMessage.content, onError = {})
|
generateResponse(model = model, input = triggeredMessage.content, onError = {})
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
class LlmAskImageViewModel : LlmChatViewModel(curTask = TASK_LLM_ASK_IMAGE)
|
class LlmAskImageViewModel(webSearchService: WebSearchService) :
|
||||||
|
LlmChatViewModel(curTask = TASK_LLM_ASK_IMAGE, webSearchService = webSearchService)
|
Loading…
Add table
Add a link
Reference in a new issue