liblloyal 1.0.0
Branched Inference for llama.cpp
Loading...
Searching...
No Matches
chat_out.hpp
Go to the documentation of this file.
1#pragma once
2
3// SPDX-License-Identifier: Apache-2.0
4// Copyright 2026 Lloyal Labs
5
27#include "common.hpp"
28#include <llama/llama.h>
29#include <chat.h>
30#include <peg-parser.h>
31#include <exception>
32#include <string>
33#include <vector>
34
43
/**
 * A single tool call extracted from model output.
 */
struct ToolCall {
    std::string name;       ///< Tool/function name.
    std::string arguments;  ///< JSON string of arguments.
    std::string id;         ///< Tool call ID (may be empty if the model doesn't generate IDs).
};
52
78 std::string content;
79 std::string reasoning_content;
80 std::vector<ToolCall> tool_calls;
81};
82
143 const std::string& output,
144 common_chat_format format,
145 common_reasoning_format reasoning_format = COMMON_REASONING_FORMAT_NONE,
146 bool is_partial = false,
147 bool thinking_forced_open = false,
148 const std::string& parser_data = ""
149) {
150 ParseResult result;
151
152 try {
153 // Build parser params
154 common_chat_parser_params syntax;
155 syntax.format = format;
156 syntax.reasoning_format = reasoning_format;
157 syntax.thinking_forced_open = thinking_forced_open;
158
159 // Load serialized PEG parser if provided (required for PEG format models)
160 if (!parser_data.empty()) {
161 syntax.parser.load(parser_data);
162 }
163
164 // Call llama.cpp's output parser
165 common_chat_msg msg = common_chat_parse(output, is_partial, syntax);
166
167 // Convert to ParseResult
168 result.content = msg.content;
169 result.reasoning_content = msg.reasoning_content;
170
171 for (const auto& tc : msg.tool_calls) {
172 result.tool_calls.push_back({tc.name, tc.arguments, tc.id});
173 }
174
175 } catch (const std::exception& e) {
176 LLOYAL_LOG_DEBUG("[chat_out::parse] Parse failed: %s, returning raw output", e.what());
177 result.content = output;
178 }
179
180 return result;
181}
182
201 const llama_model* model,
202 const std::string& output,
203 bool is_partial = false
204) {
205 ParseResult result;
206
207 try {
208 // Init templates to detect format
209 common_chat_templates_ptr tmpls = common_chat_templates_init(model, "");
210 if (!tmpls) {
211 result.content = output;
212 return result;
213 }
214
215 // Apply with empty messages to get format detection
216 common_chat_templates_inputs inputs;
217 inputs.messages = {{.role = "user", .content = ""}};
218 inputs.add_generation_prompt = true;
219 inputs.use_jinja = true;
220
221 common_chat_params params = common_chat_templates_apply(tmpls.get(), inputs);
222
223 // Delegate to explicit-format overload
224 return parse(output, params.format, COMMON_REASONING_FORMAT_NONE, is_partial,
225 params.thinking_forced_open);
226
227 } catch (const std::exception& e) {
228 LLOYAL_LOG_DEBUG("[chat_out::parse] Auto-detect failed: %s", e.what());
229 result.content = output;
230 return result;
231 }
232}
233
234} // namespace lloyal::chat_out
#define LLOYAL_LOG_DEBUG(...)
liblloyal - Common definitions and logging
Definition common.hpp:47
Chat output parsing (tool calls, reasoning, content)
Definition chat_out.hpp:42
ParseResult parse(const std::string &output, common_chat_format format, common_reasoning_format reasoning_format=COMMON_REASONING_FORMAT_NONE, bool is_partial=false, bool thinking_forced_open=false, const std::string &parser_data="")
Parse model output with explicit format.
Definition chat_out.hpp:142
common_reasoning_format reasoning_format
Reasoning format for output parsing.
Definition chat_in.hpp:98
Result from parsing model output.
Definition chat_out.hpp:77
std::vector< ToolCall > tool_calls
Extracted tool calls (empty array if none)
Definition chat_out.hpp:80
std::string content
Main response text (visible to user)
Definition chat_out.hpp:78
std::string reasoning_content
Extracted thinking/reasoning blocks (empty if none)
Definition chat_out.hpp:79
A single tool call extracted from model output.
Definition chat_out.hpp:47
std::string name
Tool/function name.
Definition chat_out.hpp:48
std::string id
Tool call ID (may be empty if model doesn't generate IDs)
Definition chat_out.hpp:50
std::string arguments
JSON string of arguments.
Definition chat_out.hpp:49