Agents 0.0.2
Edge AI Agents SDK
llm_interface.h
#pragma once

#include <agents-cpp/types.h>           // String (= std::string), LLMResponse, and other core types
#include <agents-cpp/tool.h>            // Tool
#include <agents-cpp/coroutine_utils.h> // Task, AsyncGenerator
#include <functional>
#include <memory>
#include <optional>
#include <vector>

/// Framework namespace.
namespace agents {

/// Options for LLM API calls.
struct LLMOptions {
    /// Sampling temperature.
    double temperature = 0.7;
    /// Maximum number of tokens to generate.
    int max_tokens = 1024;
    /// Nucleus (top-p) sampling parameter.
    double top_p = 1.0;
    /// Presence penalty.
    double presence_penalty = 0.0;
    /// Frequency penalty.
    double frequency_penalty = 0.0;
    /// Request timeout in milliseconds.
    int timeout_ms = 30000; // 30 seconds
    /// Stop sequences that end generation.
    std::vector<String> stop_sequences;
    /// Response schema for structured output (JSON schema).
    std::optional<JsonObject> response_schema;
    /// Response MIME type for structured output.
    std::optional<String> response_mime_type;
};

/// Interface for language model providers (OpenAI, Anthropic, Google, Ollama).
class LLMInterface {
public:
    /// Destructor.
    virtual ~LLMInterface() = default;

    /// Get available models from this provider.
    virtual std::vector<String> getAvailableModels() = 0;

    /// Set the model to use.
    virtual void setModel(const String& model) = 0;

    /// Get current model.
    virtual String getModel() const = 0;

    /// Set API key.
    virtual void setApiKey(const String& api_key) = 0;

    /// Set API base URL (for self-hosted or proxied endpoints).
    virtual void setApiBase(const String& api_base) = 0;

    /// Set options for API calls.
    virtual void setOptions(const LLMOptions& options) = 0;

    /// Get current options.
    virtual LLMOptions getOptions() const = 0;

    /// Generate completion from a prompt.
    virtual LLMResponse complete(const String& prompt);

    /// Generate completion from a list of messages.
    virtual LLMResponse complete(const std::vector<Message>& messages);

    /// Generate completion with available tools.
    virtual LLMResponse completeWithTools(
        const std::vector<Message>& messages,
        const std::vector<JsonObject>& tools_schema
    );

    /// Generate completion from a list of messages.
    virtual LLMResponse chat(const std::vector<Message>& messages) = 0;

    /// Generate completion with available tools.
    virtual LLMResponse chatWithTools(
        const std::vector<Message>& messages,
        const std::vector<std::shared_ptr<Tool>>& tools
    ) = 0;

    /// Stream results with callback.
    virtual void streamChat(
        const std::vector<Message>& messages,
        std::function<void(const String&, bool)> callback
    ) = 0;

    /// Async complete from a prompt. Task provides a future-based fallback
    /// when coroutines are unavailable (see coroutine_utils.h).
    virtual Task<LLMResponse> completeAsync(const String& prompt);

    /// Async complete from a list of messages.
    virtual Task<LLMResponse> completeAsync(const std::vector<Message>& messages);

    /// Async chat from a list of messages.
    virtual Task<LLMResponse> chatAsync(const std::vector<Message>& messages);

    /// Async chat with tools.
    virtual Task<LLMResponse> chatWithToolsAsync(
        const std::vector<Message>& messages,
        const std::vector<std::shared_ptr<Tool>>& tools
    );

    /// Stream chat with AsyncGenerator, a minimal generator implementation
    /// that doesn't rely on coroutines (see coroutine_utils.h).
    virtual AsyncGenerator<String> streamChatAsync(
        const std::vector<Message>& messages
    );
};

/// Factory function to create a specific LLM provider.
std::shared_ptr<LLMInterface> createLLM(
    const String& provider,
    const String& api_key,
    const String& model = ""
);

} // namespace agents
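
For orientation, here is a minimal usage sketch of the factory and the blocking API. The provider string and model name are illustrative placeholders; the set of values createLLM accepts is defined by the SDK, so check getAvailableModels() on the returned interface.

#include <agents-cpp/llm_interface.h>

int main() {
    using namespace agents;

    // "anthropic" and the model name are placeholder values; the accepted
    // provider strings are determined by the SDK's factory implementation.
    std::shared_ptr<LLMInterface> llm =
        createLLM("anthropic", "YOUR_API_KEY", "claude-sonnet-4");

    // Blocking single-prompt completion; honors options set via setOptions().
    LLMResponse response = llm->complete("Say hello in five words.");

    // LLMResponse is declared in agents-cpp/types.h; see that header for the
    // fields available on the response.
    return 0;
}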
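
LLMOptions is a plain struct, so configuring a provider is a read-modify-write of its options. The sketch below assumes JsonObject can be built from nested initializer lists in the style of nlohmann::json, and the schema itself is a hypothetical example; adjust both to your build.

#include <agents-cpp/llm_interface.h>

void configure(agents::LLMInterface& llm) {
    agents::LLMOptions options = llm.getOptions();
    options.temperature = 0.2;      // lower variance for extraction tasks
    options.max_tokens = 256;
    options.timeout_ms = 10000;     // fail fast on constrained edge devices
    options.stop_sequences = {"\n\n"};

    // Hypothetical schema constraining the reply to {"city": <string>}.
    // Assumes JsonObject supports nlohmann::json-style construction.
    options.response_schema = agents::JsonObject{
        {"type", "object"},
        {"properties", agents::JsonObject{
            {"city", agents::JsonObject{{"type", "string"}}}
        }}
    };
    options.response_mime_type = "application/json";

    llm.setOptions(options);
}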
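
chatWithTools and completeWithTools differ in how tools are supplied: constructed Tool objects versus raw JSON schemas. Tool construction lives in agents-cpp/tool.h and isn't shown in this header, so this sketch takes the tools as a parameter.

#include <agents-cpp/llm_interface.h>

agents::LLMResponse askWithTools(
    agents::LLMInterface& llm,
    const std::vector<agents::Message>& messages,
    const std::vector<std::shared_ptr<agents::Tool>>& tools) {
    // The provider may answer directly or request a tool invocation; either
    // outcome is carried back in the returned LLMResponse.
    return llm.chatWithTools(messages, tools);
}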
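
streamChat delivers output incrementally through the callback. The header doesn't name the callback's parameters; in the sketch below the String is taken to be the next chunk of text and the bool a completion flag, which should be verified against the concrete provider implementations.

#include <agents-cpp/llm_interface.h>
#include <iostream>

void streamToStdout(agents::LLMInterface& llm,
                    const std::vector<agents::Message>& messages) {
    llm.streamChat(messages, [](const agents::String& chunk, bool done) {
        std::cout << chunk << std::flush;  // print each chunk as it arrives
        if (done) {
            std::cout << '\n';             // assumed end-of-stream signal
        }
    });
}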
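
The *Async variants return Task<LLMResponse>, which coroutine_utils.h documents as a future-based fallback when coroutines are unavailable; streamChatAsync likewise returns AsyncGenerator<String>, described as a minimal generator that doesn't rely on coroutines. The sketch below assumes a std::future-like get() on Task; on a coroutine-enabled toolchain, co_await may apply instead.

#include <agents-cpp/llm_interface.h>

void completeInBackground(agents::LLMInterface& llm) {
    // Kick off the request without blocking the caller.
    agents::Task<agents::LLMResponse> task =
        llm.completeAsync("Name three C++20 features.");

    // ... do other work while the request is in flight ...

    // Assumed std::future-style retrieval; blocks until the response lands.
    agents::LLMResponse response = task.get();
    (void)response;  // inspect fields per agents-cpp/types.h
}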