yaze 0.3.2
Link to the Past ROM Editor
 
ollama_ai_service.cc
Go to the documentation of this file.
#include <cstdlib>
#include <iostream>

#include "absl/strings/str_cat.h"
#include "absl/strings/str_format.h"

#ifdef YAZE_WITH_JSON
#include "httplib.h"
#include "nlohmann/json.hpp"
#endif

namespace yaze {
namespace cli {

OllamaAIService::OllamaAIService(const OllamaConfig& config) : config_(config) {
  // Load command documentation into prompt builder
  if (auto status = prompt_builder_.LoadResourceCatalogue(""); !status.ok()) {
    std::cerr << "⚠️ Failed to load agent prompt catalogue: "
              << status.message() << std::endl;
  }

  if (config_.system_prompt.empty()) {
    // Use enhanced prompting by default
    // (branch bodies reconstructed; the flag and helper names are assumptions)
    if (config_.use_enhanced_prompting) {
      config_.system_prompt =
          prompt_builder_.BuildSystemInstructionWithExamples();
    } else {
      config_.system_prompt = BuildFallbackSystemPrompt();
    }
  }
}

// Fallback prompt if enhanced prompting is disabled:
// use PromptBuilder's basic system instruction.
// (Helper name and return statement reconstructed; the original lines are
// missing from this listing.)
std::string OllamaAIService::BuildFallbackSystemPrompt() {
  return prompt_builder_.BuildSystemInstruction();
}

// Health check against the Ollama server. (The signature on this line is
// missing from the listing; the method name used here is an assumption.)
absl::Status OllamaAIService::CheckHealth() {
#ifndef YAZE_WITH_JSON
  return absl::UnimplementedError(
      "Ollama service requires JSON support. "
      "Build with -DZ3ED_AI=ON or -DYAZE_WITH_JSON=ON");
#else
  try {
    httplib::Client cli(config_.base_url);
    cli.set_connection_timeout(5);  // 5 second timeout

    auto res = cli.Get("/api/tags");
    if (!res) {
      return absl::UnavailableError(absl::StrFormat(
          "Cannot connect to Ollama server at %s.\n"
          "Make sure Ollama is installed and running:\n"
          " 1. Install: brew install ollama (macOS) or https://ollama.com/download\n"
          " 2. Start: ollama serve\n"
          " 3. Verify: curl http://localhost:11434/api/tags",
          config_.base_url));
    }

    if (res->status != 200) {
      return absl::InternalError(absl::StrFormat(
          "Ollama server error: HTTP %d\nResponse: %s",
          res->status, res->body));
    }

    // Check if requested model is available
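    // Example /api/tags payload (illustrative shape only):
    //   {"models": [{"name": "llama3:latest", ...}, ...]}
    // Only each entry's "name" field is inspected below.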
    nlohmann::json models_json = nlohmann::json::parse(res->body);
    bool model_found = false;

    if (models_json.contains("models") && models_json["models"].is_array()) {
      for (const auto& model : models_json["models"]) {
        if (model.contains("name")) {
          std::string model_name = model["name"].get<std::string>();
          if (model_name.find(config_.model) != std::string::npos) {
            model_found = true;
            break;
          }
        }
      }
    }
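
    // Note: the match above is a substring check, so a configured model such
    // as "llama3" also matches tagged names like "llama3:latest".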

    if (!model_found) {
      return absl::NotFoundError(absl::StrFormat(
          "Model '%s' not found on Ollama server.\n"
          "Pull it with: ollama pull %s\n"
          "Available models: ollama list",
          config_.model, config_.model));
    }

    return absl::OkStatus();
  } catch (const std::exception& e) {
    return absl::InternalError(absl::StrCat(
        "Ollama health check failed: ", e.what()));
  }
#endif
}

absl::StatusOr<std::vector<std::string>> OllamaAIService::ListAvailableModels() {
#ifndef YAZE_WITH_JSON
  return absl::UnimplementedError("Requires httplib and JSON support");
#else
  try {
    httplib::Client cli(config_.base_url);
    cli.set_connection_timeout(5);

    auto res = cli.Get("/api/tags");

    if (!res || res->status != 200) {
      return absl::UnavailableError(
          "Cannot list Ollama models. Is the server running?");
    }

    nlohmann::json models_json = nlohmann::json::parse(res->body);
    std::vector<std::string> models;

    if (models_json.contains("models") && models_json["models"].is_array()) {
      for (const auto& model : models_json["models"]) {
        if (model.contains("name")) {
          models.push_back(model["name"].get<std::string>());
        }
      }
    }

    return models;
  } catch (const std::exception& e) {
    return absl::InternalError(absl::StrCat(
        "Failed to list models: ", e.what()));
  }
#endif
}

absl::StatusOr<std::string> OllamaAIService::ParseOllamaResponse(
    const std::string& json_response) {
#ifndef YAZE_WITH_JSON
  return absl::UnimplementedError("Requires JSON support");
#else
  try {
    nlohmann::json response_json = nlohmann::json::parse(json_response);

    if (!response_json.contains("response")) {
      return absl::InvalidArgumentError(
          "Ollama response missing 'response' field");
    }

    return response_json["response"].get<std::string>();
  } catch (const nlohmann::json::exception& e) {
    return absl::InternalError(absl::StrCat(
        "Failed to parse Ollama response: ", e.what()));
  }
#endif
}

absl::StatusOr<AgentResponse> OllamaAIService::GenerateResponse(
    const std::string& prompt) {
  return GenerateResponse(
      {{agent::ChatMessage::Sender::kUser, prompt, absl::Now()}});
}
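
// The single-prompt overload above wraps the prompt in a one-element chat
// history (sender kUser, timestamped now) and defers to the history-based
// overload below.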

absl::StatusOr<AgentResponse> OllamaAIService::GenerateResponse(
    const std::vector<agent::ChatMessage>& history) {
#ifndef YAZE_WITH_JSON
  return absl::UnimplementedError(
      "Ollama service requires httplib and JSON support. "
      "Install vcpkg dependencies or use bundled libraries.");
#else
  // TODO: Implement history-aware prompting.
  if (history.empty()) {
    return absl::InvalidArgumentError("History cannot be empty.");
  }
  std::string prompt = prompt_builder_.BuildPromptFromHistory(history);

  // Build request payload
  nlohmann::json request_body = {
      {"model", config_.model},
      {"system", config_.system_prompt},
      {"prompt", prompt},
      {"stream", false},
      {"options",
       {{"temperature", config_.temperature},
        {"num_predict", config_.max_tokens}}},
      {"format", "json"}  // Force JSON output
  };
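
  // Request notes: "stream": false asks Ollama for a single JSON reply rather
  // than chunked output, "format": "json" constrains the model to emit JSON,
  // and "options" carries the sampling temperature and num_predict (the
  // maximum number of tokens to generate).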

  try {
    httplib::Client cli(config_.base_url);
    cli.set_read_timeout(60);  // Longer timeout for inference

    auto res = cli.Post("/api/generate", request_body.dump(), "application/json");

    if (!res) {
      return absl::UnavailableError(
          "Failed to connect to Ollama. Is 'ollama serve' running?\n"
          "Start with: ollama serve");
    }

    if (res->status != 200) {
      return absl::InternalError(absl::StrFormat(
          "Ollama API error: HTTP %d\nResponse: %s",
          res->status, res->body));
    }

    // Parse Ollama's wrapper JSON
    nlohmann::json ollama_wrapper;
    try {
      ollama_wrapper = nlohmann::json::parse(res->body);
    } catch (const nlohmann::json::exception& e) {
      return absl::InternalError(absl::StrFormat(
          "Failed to parse Ollama response: %s\nBody: %s",
          e.what(), res->body));
    }

    // Extract the LLM's response from Ollama's "response" field
    if (!ollama_wrapper.contains("response") || !ollama_wrapper["response"].is_string()) {
      return absl::InvalidArgumentError(
          "Ollama response missing 'response' field");
    }

    std::string llm_output = ollama_wrapper["response"].get<std::string>();

    // Debug: Print raw LLM output when verbose mode is enabled
    const char* verbose_env = std::getenv("Z3ED_VERBOSE");
    if (verbose_env && std::string(verbose_env) == "1") {
      std::cout << "\n" << "\033[35m" << "🔍 Raw LLM Response:" << "\033[0m" << "\n"
                << "\033[2m" << llm_output << "\033[0m" << "\n\n";
    }
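
    // The model is expected to reply with an agent-shaped JSON object, e.g.
    // (illustrative only):
    //   {"text_response": "...", "reasoning": "...",
    //    "tool_calls": [{"tool_name": "...", "args": {"key": "value"}}],
    //    "commands": ["..."]}
    // Every field is optional; the extraction below skips anything missing.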

    // Parse the LLM's JSON response (the agent structure)
    nlohmann::json response_json;
    try {
      response_json = nlohmann::json::parse(llm_output);
    } catch (const nlohmann::json::exception& e) {
      // Sometimes the LLM includes extra text - try to extract JSON object
      size_t start = llm_output.find('{');
      size_t end = llm_output.rfind('}');

      if (start != std::string::npos && end != std::string::npos && end > start) {
        std::string json_only = llm_output.substr(start, end - start + 1);
        try {
          response_json = nlohmann::json::parse(json_only);
        } catch (const nlohmann::json::exception&) {
          return absl::InvalidArgumentError(
              "LLM did not return valid JSON. Response:\n" + llm_output);
        }
      } else {
        return absl::InvalidArgumentError(
            "LLM did not return a JSON object. Response:\n" + llm_output);
      }
    }

    AgentResponse agent_response;
    if (response_json.contains("text_response") &&
        response_json["text_response"].is_string()) {
      agent_response.text_response =
          response_json["text_response"].get<std::string>();
    }
    if (response_json.contains("reasoning") &&
        response_json["reasoning"].is_string()) {
      agent_response.reasoning = response_json["reasoning"].get<std::string>();
    }
    if (response_json.contains("tool_calls") &&
        response_json["tool_calls"].is_array()) {
      for (const auto& call : response_json["tool_calls"]) {
        if (call.contains("tool_name") && call["tool_name"].is_string()) {
          ToolCall tool_call;
          tool_call.tool_name = call["tool_name"].get<std::string>();
          if (call.contains("args") && call["args"].is_object()) {
            for (auto& [key, value] : call["args"].items()) {
              if (value.is_string()) {
                tool_call.args[key] = value.get<std::string>();
              }
            }
          }
          agent_response.tool_calls.push_back(tool_call);
        }
      }
    }
    if (response_json.contains("commands") &&
        response_json["commands"].is_array()) {
      for (const auto& cmd : response_json["commands"]) {
        if (cmd.is_string()) {
          agent_response.commands.push_back(cmd.get<std::string>());
        }
      }
    }

    return agent_response;

  } catch (const std::exception& e) {
    return absl::InternalError(
        absl::StrCat("Ollama request failed: ", e.what()));
  }
#endif
}

}  // namespace cli
}  // namespace yaze