diff --git a/.github/workflows/CI.yml b/.github/workflows/CI.yml index bcfac0a27..c5dcb02e2 100644 --- a/.github/workflows/CI.yml +++ b/.github/workflows/CI.yml @@ -37,6 +37,13 @@ jobs: arch: ${{ matrix.arch }} - uses: julia-actions/cache@v1 - uses: julia-actions/julia-buildpkg@v1 + - name: Install test dependencies + run: | + julia --project=test -e ' + using Pkg; + Pkg.develop(PackageSpec(path=pwd())); + Pkg.instantiate(); + Pkg.precompile()' - uses: julia-actions/julia-runtest@v1 - uses: julia-actions/julia-processcoverage@v1 - uses: codecov/codecov-action@v4 @@ -67,4 +74,4 @@ jobs: env: GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} # For authentication with GitHub Actions token GKSwstype: "100" # for Plots.jl plots (if you have them) - JULIA_DEBUG: "Documenter" \ No newline at end of file + JULIA_DEBUG: "Documenter" diff --git a/Project.toml b/Project.toml index 0e450fa1b..770bc6b1e 100644 --- a/Project.toml +++ b/Project.toml @@ -53,6 +53,7 @@ PrecompileTools = "1" Preferences = "1" REPL = "<0.0.1, 1" Random = "<0.0.1, 1" +Snowball = "0.1" SparseArrays = "<0.0.1, 1" Statistics = "<0.0.1, 1" StreamCallbacks = "0.4, 0.5" @@ -61,10 +62,13 @@ julia = "1.9, 1.10" [extras] Aqua = "4c88cf16-eb10-579e-8560-4a9242c79595" +HTTP = "cd3eb016-35fb-5094-929b-558a96fad6f3" +JSON3 = "0f8b85d8-7281-11e9-16c2-39a750bddbf1" LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e" +OpenAI = "e9f21f70-7185-4079-aca2-91159181367c" SparseArrays = "2f01184e-e22b-5df5-ae63-d93ebab69eaf" Statistics = "10745b16-79ce-11e8-11f9-7d13ad32a3b2" Unicode = "4ec0a83e-493e-50e2-b9ac-8f72acf5a8f5" [targets] -test = ["Aqua", "FlashRank", "SparseArrays", "Statistics", "LinearAlgebra", "Markdown", "Snowball", "Unicode"] +test = ["Aqua", "FlashRank", "SparseArrays", "Statistics", "LinearAlgebra", "Markdown", "Snowball", "Unicode", "HTTP", "JSON3", "OpenAI"] diff --git a/src/constants.jl b/src/constants.jl new file mode 100644 index 000000000..54b0a61b2 --- /dev/null +++ b/src/constants.jl @@ -0,0 +1,23 @@ +# Constants used throughout the package + +# Model Registry +const MODEL_REGISTRY = Dict{String,Any}() + +# Default Models +const MODEL_CHAT = "gpt-3.5-turbo" +const MODEL_COMPLETION = "gpt-3.5-turbo-instruct" + +# Reserved keywords that cannot be used as placeholders in templates +const RESERVED_KWARGS = Symbol[ + :model, :api_key, :verbose, :return_all, :dry_run, :conversation, + :streamcallback, :no_system_message, :name_user, :name_assistant, + :http_kwargs, :api_kwargs +] + +# Default system message +const DEFAULT_SYSTEM_MESSAGE = "You are a helpful AI assistant." + +# Default API Keys +const OPENAI_API_KEY = get(ENV, "OPENAI_API_KEY", "") +const ANTHROPIC_API_KEY = get(ENV, "ANTHROPIC_API_KEY", "") +const GOOGLE_API_KEY = get(ENV, "GOOGLE_API_KEY", "") diff --git a/src/llm_shared.jl b/src/llm_shared.jl index fcb6e5702..203bf3566 100644 --- a/src/llm_shared.jl +++ b/src/llm_shared.jl @@ -73,6 +73,9 @@ function render(schema::NoSchema, count_system_msg += 1 # move to the front pushfirst!(conversation, msg) + elseif isabstractannotationmessage(msg) + # Silently skip annotation messages - they are not meant for LLM consumption + continue else # Note: Ignores any DataMessage or other types for the prompt/conversation history @warn "Unexpected message type: $(typeof(msg)). Skipping." diff --git a/src/messages.jl b/src/messages.jl index acc6e2a39..edc248d55 100644 --- a/src/messages.jl +++ b/src/messages.jl @@ -5,9 +5,26 @@ abstract type AbstractMessage end abstract type AbstractChatMessage <: AbstractMessage end # with text-based content abstract type AbstractDataMessage <: AbstractMessage end # with data-based content, eg, embeddings abstract type AbstractTracerMessage{T <: AbstractMessage} <: AbstractMessage end # message with annotation that exposes the underlying message +abstract type AbstractAnnotationMessage <: AbstractMessage end # message with metadata that is never sent to LLMs + +""" + isabstractannotationmessage(msg::AbstractMessage) + +Check if a message is an AbstractAnnotationMessage. +These messages are never sent to LLMs and are used for metadata and documentation. +""" +isabstractannotationmessage(msg::AbstractMessage) = msg isa AbstractAnnotationMessage + # Complementary type for tracing, follows the same API as TracerMessage abstract type AbstractTracer{T <: Any} end +""" + get_run_id() + +Generate a random run ID for message tracking. +""" +get_run_id() = Int(rand(Int16)) + ## Allowed inputs for ai* functions, AITemplate is resolved one level higher const ALLOWED_PROMPT_TYPE = Union{ AbstractString, @@ -24,26 +41,49 @@ Base.@kwdef struct MetadataMessage{T <: AbstractString} <: AbstractChatMessage source::String = "" _type::Symbol = :metadatamessage end + +""" + SystemMessage + +A message type for system-level instructions and context. +Used to set the behavior and context for AI models. + +# Fields +- `content::T`: The content of the message +- `variables::Vector{Symbol}`: Variables extracted from content +- `run_id::Union{Nothing,Int}`: Unique identifier for the message +- `_type::Symbol`: Message type identifier +""" Base.@kwdef struct SystemMessage{T <: AbstractString} <: AbstractChatMessage content::T - variables::Vector{Symbol} = _extract_handlebar_variables(content) + variables::Vector{Symbol} = begin + vars = _extract_handlebar_variables(content) + not_allowed = intersect(vars, RESERVED_KWARGS) + @assert length(not_allowed)==0 "Error: Some placeholders are invalid, as they are reserved for `ai*` functions. Change: $(join(not_allowed,","))" + vars + end + run_id::Union{Nothing,Int} = get_run_id() _type::Symbol = :systemmessage - SystemMessage{T}(c, v, t) where {T <: AbstractString} = new(c, v, t) end -function SystemMessage(content::T, - variables::Vector{Symbol}, - type::Symbol) where {T <: AbstractString} + +# Single constructor for string-only input +function SystemMessage(content::T) where {T <: AbstractString} + SystemMessage{T}(; content=content) +end + +function SystemMessage(content::T; kwargs...) where {T <: AbstractString} + variables = get(kwargs, :variables, _extract_handlebar_variables(content)) not_allowed_kwargs = intersect(variables, RESERVED_KWARGS) @assert length(not_allowed_kwargs)==0 "Error: Some placeholders are invalid, as they are reserved for `ai*` functions. Change: $(join(not_allowed_kwargs,","))" - return SystemMessage{T}(content, variables, type) + SystemMessage{T}(; content=content, kwargs...) end """ UserMessage -A message type for user-generated text-based responses. +A message type for user-generated text-based responses. Consumed by `ai*` functions to generate responses. - + # Fields - `content::T`: The content of the message. - `variables::Vector{Symbol}`: The variables in the message. @@ -68,9 +108,9 @@ end """ UserMessageWithImages -A message type for user-generated text-based responses with images. +A message type for user-generated text-based responses with images. Consumed by `ai*` functions to generate responses. - + # Fields - `content::T`: The content of the message. - `image_url::Vector{String}`: The URLs of the images. @@ -97,9 +137,9 @@ end """ AIMessage -A message type for AI-generated text-based responses. +A message type for AI-generated text-based responses. Returned by `aigenerate`, `aiclassify`, and `aiscan` functions. - + # Fields - `content::Union{AbstractString, Nothing}`: The content of the message. - `status::Union{Int, Nothing}`: The status of the message from the API. @@ -131,9 +171,9 @@ end """ DataMessage -A message type for AI-generated data-based responses, ie, different `content` than text. +A message type for AI-generated data-based responses, ie, different `content` than text. Returned by `aiextract`, and `aiextract` functions. - + # Fields - `content::Union{AbstractString, Nothing}`: The content of the message. - `status::Union{Int, Nothing}`: The status of the message from the API. @@ -163,8 +203,24 @@ end """ ToolMessage -A message type for tool calls. - +A message type for tool calls. + +It represents both the request (fields `args`, `name`) and the response (field `content`). + +# Fields +- `content::Any`: The content of the message. +- `req_id::Union{Nothing, Int}`: The unique ID of the request. +- `tool_call_id::String`: The unique ID of the tool call. +- `raw::AbstractString`: The raw JSON string of the tool call request. +- `args::Union{Nothing, Dict{Symbol, Any}}`: The arguments of the tool call request. +- `name::Union{Nothing, String}`: The name of the tool call request. +""" + +""" + ToolMessage + +A message type for tool calls. + It represents both the request (fields `args`, `name`) and the response (field `content`). # Fields @@ -188,9 +244,9 @@ end """ AIToolRequest -A message type for AI-generated tool requests. +A message type for AI-generated tool requests. Returned by `aitools` functions. - + # Fields - `content::Union{AbstractString, Nothing}`: The content of the message. - `tool_calls::Vector{ToolMessage}`: The vector of tool call requests. @@ -224,11 +280,122 @@ Base.@kwdef struct AIToolRequest{T <: Union{AbstractString, Nothing}} <: Abstrac sample_id::Union{Nothing, Int} = nothing _type::Symbol = :aitoolrequest end -"Get the vector of tool call requests from an AIToolRequest/message." -tool_calls(msg::AIToolRequest) = msg.tool_calls -tool_calls(msg::AbstractMessage) = ToolMessage[] -tool_calls(msg::ToolMessage) = [msg] -tool_calls(msg::AbstractTracerMessage) = tool_calls(msg.object) + +""" + AbstractAnnotationMessage + +Abstract type for messages that provide documentation and metadata without being sent to LLMs. +""" +abstract type AbstractAnnotationMessage <: AbstractChatMessage end + +""" + AnnotationMessage{T} <: AbstractAnnotationMessage + +A message type for adding metadata and documentation to conversation histories without affecting LLM context. + +Fields: +- `content::T`: The main content of the annotation +- `extras::Dict{Symbol,Any}`: Additional metadata as key-value pairs +- `tags::Vector{Symbol}`: Tags for categorizing the annotation +- `comment::String`: Human-readable comment (not used for automatic operations) +- `run_id::Union{Nothing,Int}`: Optional run ID for tracking message provenance +- `_type::Symbol`: Internal type identifier + +The AnnotationMessage is designed to bundle key information and documentation together with conversation data +without sending any of it to large language models. +""" +Base.@kwdef mutable struct AnnotationMessage{T} <: AbstractAnnotationMessage + content::T + extras::Dict{Symbol,Any} = Dict{Symbol,Any}() + tags::Vector{Symbol} = Symbol[] + comment::String = "" + run_id::Union{Nothing,Int} = get_run_id() + _type::Symbol = :annotationmessage +end + +# Constructors for AnnotationMessage +function AnnotationMessage(content; kwargs...) + AnnotationMessage{typeof(content)}(; content=content, kwargs...) +end + +# Specific methods to resolve ambiguities +function AnnotationMessage(content::AbstractString) + AnnotationMessage{typeof(content)}(; content=content) +end + +function AnnotationMessage(msg::AbstractChatMessage) + AnnotationMessage{typeof(msg.content)}(; content=msg.content) +end + +function AnnotationMessage(msg::AbstractTracerMessage{<:AbstractChatMessage}) + AnnotationMessage{typeof(msg.message.content)}(; content=msg.message.content) +end + +""" + annotate!(messages::Vector{<:AbstractMessage}, content; kwargs...) + annotate!(message::AbstractMessage, content; kwargs...) + +Add an annotation message to a vector of messages or wrap a single message in a vector with an annotation. + +The annotation is inserted after any existing annotation messages to maintain logical grouping. +All kwargs are passed to the AnnotationMessage constructor. + +Returns the modified vector of messages. +""" +function annotate!(messages::Vector{<:AbstractMessage}, content; kwargs...) + msg = AnnotationMessage(content; kwargs...) + # Find the last annotation message + last_annotation_idx = findlast(isabstractannotationmessage, messages) + if isnothing(last_annotation_idx) + # No existing annotations, insert at start + insert!(messages, 1, msg) + else + # Insert after last annotation + insert!(messages, last_annotation_idx + 1, msg) + end + return messages +end + +""" + annotate!(msgs::Vector{<:AbstractMessage}, content::String; kwargs...) + +Add an AnnotationMessage to a vector of messages, placing it after any existing annotations. +Returns the modified vector. + +# Arguments +- `msgs`: Vector of messages to annotate +- `content`: Content of the annotation +- `kwargs...`: Additional fields for AnnotationMessage (extras, tags, comment) + +# Example +```julia +msgs = [UserMessage("Hello"), AIMessage("Hi")] +annotate!(msgs, "Conversation start"; tags=[:greeting]) +``` +""" +function annotate!(msgs::Vector{<:AbstractMessage}, content::String; kwargs...) + annotation = AnnotationMessage(content; kwargs...) + # Find the last annotation message index + last_annotation_idx = findlast(isabstractannotationmessage, msgs) + + if isnothing(last_annotation_idx) + # No existing annotations, insert at start + insert!(msgs, 1, annotation) + else + # Insert after the last annotation + insert!(msgs, last_annotation_idx + 1, annotation) + end + return msgs +end + +""" + annotate!(message::AbstractMessage, content; kwargs...) + +Convenience method to annotate a single message by wrapping it in a vector. +""" +function annotate!(message::AbstractMessage, content; kwargs...) + annotate!([message], content; kwargs...) +end ### Other Message methods # content-only constructor @@ -251,6 +418,7 @@ isaimessage(m::Any) = m isa AIMessage istoolmessage(m::Any) = m isa ToolMessage isaitoolrequest(m::Any) = m isa AIToolRequest istracermessage(m::Any) = m isa AbstractTracerMessage +isabstractannotationmessage(m::Any) = m isa AbstractAnnotationMessage isusermessage(m::AbstractTracerMessage) = isusermessage(m.object) isusermessagewithimages(m::AbstractTracerMessage) = isusermessagewithimages(m.object) issystemmessage(m::AbstractTracerMessage) = issystemmessage(m.object) @@ -259,6 +427,29 @@ isaimessage(m::AbstractTracerMessage) = isaimessage(m.object) istoolmessage(m::AbstractTracerMessage) = istoolmessage(m.object) isaitoolrequest(m::AbstractTracerMessage) = isaitoolrequest(m.object) +# Dict conversion for AnnotationMessage +function Base.Dict(msg::AnnotationMessage) + return Dict{String,Any}( + "content" => msg.content, + "extras" => msg.extras, + "tags" => msg.tags, + "comment" => msg.comment, + "run_id" => msg.run_id, + "_type" => msg._type + ) +end + +function Base.convert(::Type{AnnotationMessage}, dict::Dict) + return AnnotationMessage(; + content = dict["content"], + extras = convert(Dict{Symbol,Any}, dict["extras"]), + tags = Symbol.(dict["tags"]), + comment = dict["comment"], + run_id = dict["run_id"], + _type = Symbol(dict["_type"]) + ) +end + # equality check for testing, only equal if all fields are equal and type is the same Base.var"=="(m1::AbstractMessage, m2::AbstractMessage) = false function Base.var"=="(m1::T, m2::T) where {T <: AbstractMessage} @@ -486,6 +677,11 @@ end last_message(msg::AbstractMessage) = msg last_output(msg::AbstractMessage) = msg.content +"Returns a vector of ToolMessage objects associated with the message. For AIToolRequest, returns its tool_calls field; for ToolMessage returns a single-element vector with itself; otherwise returns an empty vector." +tool_calls(msg::AbstractMessage) = ToolMessage[] +tool_calls(msg::ToolMessage) = [msg] +tool_calls(msg::AIToolRequest) = msg.tool_calls + ## Display methods function Base.show(io::IO, ::MIME"text/plain", m::AbstractChatMessage) type_ = string(typeof(m)) |> x -> split(x, "{")[begin] @@ -502,6 +698,34 @@ function Base.show(io::IO, ::MIME"text/plain", m::AbstractChatMessage) end print(io, "(\"", m.content, "\")") end + +function Base.show(io::IO, ::MIME"text/plain", m::AnnotationMessage) + printstyled(io, "AnnotationMessage"; color = :cyan) + print(io, "(\"", m.content[1:min(30, length(m.content))]) + if length(m.content) > 30 + print(io, "...") + end + if !isempty(m.tags) + print(io, "\" [", join(m.tags, ", "), "])") + else + print(io, "\")") + end +end + +function pprint(io::IO, msg::AnnotationMessage) + println(io, "Annotation Message:") + println(io, "Content: ", msg.content) + if !isempty(msg.tags) + println(io, "Tags: ", msg.tags) + end + if !isempty(msg.comment) + println(io, "Comment: ", msg.comment) + end + if !isempty(msg.extras) + println(io, "Extras: ", msg.extras) + end +end + function Base.show(io::IO, ::MIME"text/plain", m::AbstractDataMessage) type_ = string(typeof(m)) |> x -> split(x, "{")[begin] printstyled(io, type_; color = :light_yellow) @@ -537,6 +761,17 @@ end function role4render(schema::AbstractPromptSchema, msg::AbstractTracerMessage) role4render(schema, msg.object) end + +""" + render(schema::NoSchema, messages::Vector{<:AbstractMessage}; kwargs...) + +Base rendering implementation that filters out annotation messages and applies any replacements. +Annotation messages are never sent to LLMs. +""" +function render(schema::NoSchema, messages::Vector{<:AbstractMessage}; kwargs...) + [render(schema, msg; kwargs...) for msg in messages if !isabstractannotationmessage(msg)] +end + function render(schema::AbstractPromptSchema, msg::AbstractMessage; kwargs...) render(schema, [msg]; kwargs...) end @@ -557,7 +792,8 @@ function StructTypes.subtypes(::Type{AbstractMessage}) systemmessage = SystemMessage, metadatamessage = MetadataMessage, datamessage = DataMessage, - tracermessage = TracerMessage) + tracermessage = TracerMessage, + annotationmessage = AnnotationMessage) end StructTypes.StructType(::Type{AbstractChatMessage}) = StructTypes.AbstractType() @@ -592,6 +828,7 @@ StructTypes.StructType(::Type{AIMessage}) = StructTypes.Struct() StructTypes.StructType(::Type{DataMessage}) = StructTypes.Struct() StructTypes.StructType(::Type{TracerMessage}) = StructTypes.Struct() # Ignore mutability once we serialize StructTypes.StructType(::Type{TracerMessageLike}) = StructTypes.Struct() # Ignore mutability once we serialize +StructTypes.StructType(::Type{AnnotationMessage}) = StructTypes.Struct() ### Utilities for Pretty Printing """ @@ -615,6 +852,8 @@ function pprint(io::IO, msg::AbstractMessage; text_width::Int = displaysize(io)[ "AI Tool Request" elseif msg isa ToolMessage "Tool Message" + elseif msg isa AnnotationMessage + "Annotation Message" else "Unknown Message" end @@ -633,6 +872,11 @@ function pprint(io::IO, msg::AbstractMessage; text_width::Int = displaysize(io)[ elseif istoolmessage(msg) isnothing(msg.content) ? string("Name: ", msg.name, ", Args: ", msg.raw) : string(msg.content) + elseif msg isa AnnotationMessage + content_str = wrap_string(msg.content, text_width) + tags_str = isempty(msg.tags) ? "" : "\nTags: " * join(msg.tags, ", ") + comment_str = isempty(msg.comment) ? "" : "\nComment: " * msg.comment + string(content_str, tags_str, comment_str) else wrap_string(msg.content, text_width) end diff --git a/test/Manifest.toml b/test/Manifest.toml new file mode 100644 index 000000000..ca520f947 --- /dev/null +++ b/test/Manifest.toml @@ -0,0 +1,293 @@ +# This file is machine-generated - editing it directly is not advised + +julia_version = "1.10.6" +manifest_format = "2.0" +project_hash = "093ffb813d46516add22ebae3efac690cc486f7d" + +[[deps.AbstractTrees]] +git-tree-sha1 = "2d9c9a55f9c93e8887ad391fbae72f8ef55e1177" +uuid = "1520ce14-60c1-5f80-bbc7-55ef81b5835c" +version = "0.4.5" + +[[deps.ArgTools]] +uuid = "0dad84c5-d112-42e6-8d28-ef12dabb789f" +version = "1.1.1" + +[[deps.Artifacts]] +uuid = "56f22d72-fd6d-98f1-02f0-08ddc0907c33" + +[[deps.Base64]] +uuid = "2a0f44e3-6c83-55bd-87e4-b1978d98bd5f" + +[[deps.BitFlags]] +git-tree-sha1 = "0691e34b3bb8be9307330f88d1a3c3f25466c24d" +uuid = "d1d4a3ce-64b1-5f1a-9ba4-7e7e69966f35" +version = "0.1.9" + +[[deps.CodecZlib]] +deps = ["TranscodingStreams", "Zlib_jll"] +git-tree-sha1 = "bce6804e5e6044c6daab27bb533d1295e4a2e759" +uuid = "944b1d66-785c-5afd-91f1-9de20f533193" +version = "0.7.6" + +[[deps.ConcurrentUtilities]] +deps = ["Serialization", "Sockets"] +git-tree-sha1 = "ea32b83ca4fefa1768dc84e504cc0a94fb1ab8d1" +uuid = "f0e56b4a-5159-44fe-b623-3e5288b988bb" +version = "2.4.2" + +[[deps.Dates]] +deps = ["Printf"] +uuid = "ade2ca70-3891-5945-98fb-dc099432e06a" + +[[deps.Downloads]] +deps = ["ArgTools", "FileWatching", "LibCURL", "NetworkOptions"] +uuid = "f43a241f-c20a-4ad4-852c-f6b1247861c6" +version = "1.6.0" + +[[deps.ExceptionUnwrapping]] +deps = ["Test"] +git-tree-sha1 = "d36f682e590a83d63d1c7dbd287573764682d12a" +uuid = "460bff9d-24e4-43bc-9d9f-a8973cb893f4" +version = "0.1.11" + +[[deps.FileWatching]] +uuid = "7b1f6079-737a-58dc-b8bc-7a2ca5c1b5ee" + +[[deps.HTTP]] +deps = ["Base64", "CodecZlib", "ConcurrentUtilities", "Dates", "ExceptionUnwrapping", "Logging", "LoggingExtras", "MbedTLS", "NetworkOptions", "OpenSSL", "PrecompileTools", "Random", "SimpleBufferStream", "Sockets", "URIs", "UUIDs"] +git-tree-sha1 = "ae350b8225575cc3ea385d4131c81594f86dfe4f" +uuid = "cd3eb016-35fb-5094-929b-558a96fad6f3" +version = "1.10.12" + +[[deps.InteractiveUtils]] +deps = ["Markdown"] +uuid = "b77e0a4c-d291-57a0-90e8-8db25a27a240" + +[[deps.JLLWrappers]] +deps = ["Artifacts", "Preferences"] +git-tree-sha1 = "be3dc50a92e5a386872a493a10050136d4703f9b" +uuid = "692b3bcd-3c85-4b1f-b108-f13ce0eb3210" +version = "1.6.1" + +[[deps.JSON3]] +deps = ["Dates", "Mmap", "Parsers", "PrecompileTools", "StructTypes", "UUIDs"] +git-tree-sha1 = "1d322381ef7b087548321d3f878cb4c9bd8f8f9b" +uuid = "0f8b85d8-7281-11e9-16c2-39a750bddbf1" +version = "1.14.1" + + [deps.JSON3.extensions] + JSON3ArrowExt = ["ArrowTypes"] + + [deps.JSON3.weakdeps] + ArrowTypes = "31f734f8-188a-4ce0-8406-c8a06bd891cd" + +[[deps.LibCURL]] +deps = ["LibCURL_jll", "MozillaCACerts_jll"] +uuid = "b27032c2-a3e7-50c8-80cd-2d36dbcbfd21" +version = "0.6.4" + +[[deps.LibCURL_jll]] +deps = ["Artifacts", "LibSSH2_jll", "Libdl", "MbedTLS_jll", "Zlib_jll", "nghttp2_jll"] +uuid = "deac9b47-8bc7-5906-a0fe-35ac56dc84c0" +version = "8.4.0+0" + +[[deps.LibGit2]] +deps = ["Base64", "LibGit2_jll", "NetworkOptions", "Printf", "SHA"] +uuid = "76f85450-5226-5b5a-8eaa-529ad045b433" + +[[deps.LibGit2_jll]] +deps = ["Artifacts", "LibSSH2_jll", "Libdl", "MbedTLS_jll"] +uuid = "e37daf67-58a4-590a-8e99-b0245dd2ffc5" +version = "1.6.4+0" + +[[deps.LibSSH2_jll]] +deps = ["Artifacts", "Libdl", "MbedTLS_jll"] +uuid = "29816b5a-b9ab-546f-933c-edad1886dfa8" +version = "1.11.0+1" + +[[deps.Libdl]] +uuid = "8f399da3-3557-5675-b5ff-fb832c97cbdb" + +[[deps.Logging]] +uuid = "56ddb016-857b-54e1-b83d-db4d58db5568" + +[[deps.LoggingExtras]] +deps = ["Dates", "Logging"] +git-tree-sha1 = "f02b56007b064fbfddb4c9cd60161b6dd0f40df3" +uuid = "e6f89c97-d47a-5376-807f-9c37f3926c36" +version = "1.1.0" + +[[deps.Markdown]] +deps = ["Base64"] +uuid = "d6f4376e-aef5-505a-96c1-9c027394607a" + +[[deps.MbedTLS]] +deps = ["Dates", "MbedTLS_jll", "MozillaCACerts_jll", "NetworkOptions", "Random", "Sockets"] +git-tree-sha1 = "c067a280ddc25f196b5e7df3877c6b226d390aaf" +uuid = "739be429-bea8-5141-9913-cc70e7f3736d" +version = "1.1.9" + +[[deps.MbedTLS_jll]] +deps = ["Artifacts", "Libdl"] +uuid = "c8ffd9c3-330d-5841-b78e-0817d7145fa1" +version = "2.28.2+1" + +[[deps.Mmap]] +uuid = "a63ad114-7e13-5084-954f-fe012c677804" + +[[deps.MozillaCACerts_jll]] +uuid = "14a3606d-f60d-562e-9121-12d972cd8159" +version = "2023.1.10" + +[[deps.NetworkOptions]] +uuid = "ca575930-c2e3-43a9-ace4-1e988b2c1908" +version = "1.2.0" + +[[deps.OpenAI]] +deps = ["Dates", "HTTP", "JSON3"] +git-tree-sha1 = "fb6a407f3707daf513c4b88f25536dd3dbf94220" +uuid = "e9f21f70-7185-4079-aca2-91159181367c" +version = "0.9.1" + +[[deps.OpenSSL]] +deps = ["BitFlags", "Dates", "MozillaCACerts_jll", "OpenSSL_jll", "Sockets"] +git-tree-sha1 = "38cb508d080d21dc1128f7fb04f20387ed4c0af4" +uuid = "4d8831e6-92b7-49fb-bdf8-b643e874388c" +version = "1.4.3" + +[[deps.OpenSSL_jll]] +deps = ["Artifacts", "JLLWrappers", "Libdl"] +git-tree-sha1 = "7493f61f55a6cce7325f197443aa80d32554ba10" +uuid = "458c3c95-2e84-50aa-8efc-19380b2a3a95" +version = "3.0.15+1" + +[[deps.Parsers]] +deps = ["Dates", "PrecompileTools", "UUIDs"] +git-tree-sha1 = "8489905bcdbcfac64d1daa51ca07c0d8f0283821" +uuid = "69de0a69-1ddd-5017-9359-2bf0b02dc9f0" +version = "2.8.1" + +[[deps.Pkg]] +deps = ["Artifacts", "Dates", "Downloads", "FileWatching", "LibGit2", "Libdl", "Logging", "Markdown", "Printf", "REPL", "Random", "SHA", "Serialization", "TOML", "Tar", "UUIDs", "p7zip_jll"] +uuid = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f" +version = "1.10.0" + +[[deps.PrecompileTools]] +deps = ["Preferences"] +git-tree-sha1 = "5aa36f7049a63a1528fe8f7c3f2113413ffd4e1f" +uuid = "aea7be01-6a6a-4083-8856-8a6e6704d82a" +version = "1.2.1" + +[[deps.Preferences]] +deps = ["TOML"] +git-tree-sha1 = "9306f6085165d270f7e3db02af26a400d580f5c6" +uuid = "21216c6a-2e73-6563-6e65-726566657250" +version = "1.4.3" + +[[deps.Printf]] +deps = ["Unicode"] +uuid = "de0858da-6303-5e67-8744-51eddeeeb8d7" + +[[deps.PromptingTools]] +deps = ["AbstractTrees", "Base64", "Dates", "HTTP", "JSON3", "Logging", "OpenAI", "Pkg", "PrecompileTools", "Preferences", "REPL", "Random", "StreamCallbacks", "Test"] +git-tree-sha1 = "ce00a38af58f71e0b280c2f090fbd4d8a516ce29" +uuid = "670122d1-24a8-4d70-bfce-740807c42192" +version = "0.64.0" + + [deps.PromptingTools.extensions] + FlashRankPromptingToolsExt = ["FlashRank"] + GoogleGenAIPromptingToolsExt = ["GoogleGenAI"] + MarkdownPromptingToolsExt = ["Markdown"] + RAGToolsExperimentalExt = ["SparseArrays", "LinearAlgebra", "Unicode"] + SnowballPromptingToolsExt = ["Snowball"] + + [deps.PromptingTools.weakdeps] + FlashRank = "22cc3f58-1757-4700-bb45-2032706e5a8d" + GoogleGenAI = "903d41d1-eaca-47dd-943b-fee3930375ab" + LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e" + Markdown = "d6f4376e-aef5-505a-96c1-9c027394607a" + Snowball = "fb8f903a-0164-4e73-9ffe-431110250c3b" + SparseArrays = "2f01184e-e22b-5df5-ae63-d93ebab69eaf" + Unicode = "4ec0a83e-493e-50e2-b9ac-8f72acf5a8f5" + +[[deps.REPL]] +deps = ["InteractiveUtils", "Markdown", "Sockets", "Unicode"] +uuid = "3fa0cd96-eef1-5676-8a61-b3b8758bbffb" + +[[deps.Random]] +deps = ["SHA"] +uuid = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c" + +[[deps.SHA]] +uuid = "ea8e919c-243c-51af-8825-aaa63cd721ce" +version = "0.7.0" + +[[deps.Serialization]] +uuid = "9e88b42a-f829-5b0c-bbe9-9e923198166b" + +[[deps.SimpleBufferStream]] +git-tree-sha1 = "f305871d2f381d21527c770d4788c06c097c9bc1" +uuid = "777ac1f9-54b0-4bf8-805c-2214025038e7" +version = "1.2.0" + +[[deps.Sockets]] +uuid = "6462fe0b-24de-5631-8697-dd941f90decc" + +[[deps.StreamCallbacks]] +deps = ["HTTP", "JSON3", "PrecompileTools"] +git-tree-sha1 = "827180547dd10f4c018ccdbede9375c76dbdcafe" +uuid = "c1b9e933-98a0-46fc-8ea7-3b58b195fb0a" +version = "0.5.0" + +[[deps.StructTypes]] +deps = ["Dates", "UUIDs"] +git-tree-sha1 = "159331b30e94d7b11379037feeb9b690950cace8" +uuid = "856f2bd8-1eba-4b0a-8007-ebc267875bd4" +version = "1.11.0" + +[[deps.TOML]] +deps = ["Dates"] +uuid = "fa267f1f-6049-4f14-aa54-33bafae1ed76" +version = "1.0.3" + +[[deps.Tar]] +deps = ["ArgTools", "SHA"] +uuid = "a4e569a6-e804-4fa4-b0f3-eef7a1d5b13e" +version = "1.10.0" + +[[deps.Test]] +deps = ["InteractiveUtils", "Logging", "Random", "Serialization"] +uuid = "8dfed614-e22c-5e08-85e1-65c5234f0b40" + +[[deps.TranscodingStreams]] +git-tree-sha1 = "0c45878dcfdcfa8480052b6ab162cdd138781742" +uuid = "3bb67fe8-82b1-5028-8e26-92a6c54297fa" +version = "0.11.3" + +[[deps.URIs]] +git-tree-sha1 = "67db6cc7b3821e19ebe75791a9dd19c9b1188f2b" +uuid = "5c2747f8-b7ea-4ff2-ba2e-563bfd36b1d4" +version = "1.5.1" + +[[deps.UUIDs]] +deps = ["Random", "SHA"] +uuid = "cf7118a7-6976-5b1a-9a39-7adc72f591a4" + +[[deps.Unicode]] +uuid = "4ec0a83e-493e-50e2-b9ac-8f72acf5a8f5" + +[[deps.Zlib_jll]] +deps = ["Libdl"] +uuid = "83775a58-1f1d-513f-b197-d71354ab007a" +version = "1.2.13+1" + +[[deps.nghttp2_jll]] +deps = ["Artifacts", "Libdl"] +uuid = "8e850ede-7688-5339-a07c-302acd2aaf8d" +version = "1.52.0+1" + +[[deps.p7zip_jll]] +deps = ["Artifacts", "Libdl"] +uuid = "3f19e933-33d8-53b3-aaab-bd5110c3b7a0" +version = "17.4.0+2" diff --git a/test/Project.toml b/test/Project.toml new file mode 100644 index 000000000..79fc3bdde --- /dev/null +++ b/test/Project.toml @@ -0,0 +1,52 @@ +[deps] +AbstractTrees = "1520ce14-60c1-5f80-bbc7-55ef81b5835c" +Aqua = "4c88cf16-eb10-579e-8560-4a9242c79595" +Base64 = "2a0f44e3-6c83-55bd-87e4-b1978d98bd5f" +Dates = "ade2ca70-3891-5945-98fb-dc099432e06a" +FlashRank = "22cc3f58-1757-4700-bb45-2032706e5a8d" +GoogleGenAI = "903d41d1-eaca-47dd-943b-fee3930375ab" +HTTP = "cd3eb016-35fb-5094-929b-558a96fad6f3" +JSON3 = "0f8b85d8-7281-11e9-16c2-39a750bddbf1" +LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e" +Logging = "56ddb016-857b-54e1-b83d-db4d58db5568" +Markdown = "d6f4376e-aef5-505a-96c1-9c027394607a" +OpenAI = "e9f21f70-7185-4079-aca2-91159181367c" +Pkg = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f" +PrecompileTools = "aea7be01-6a6a-4083-8856-8a6e6704d82a" +Preferences = "21216c6a-2e73-6563-6e65-726566657250" +PromptingTools = "670122d1-24a8-4d70-bfce-740807c42192" +REPL = "3fa0cd96-eef1-5676-8a61-b3b8758bbffb" +Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c" +Snowball = "fb8f903a-0164-4e73-9ffe-431110250c3b" +SparseArrays = "2f01184e-e22b-5df5-ae63-d93ebab69eaf" +Statistics = "10745b16-79ce-11e8-11f9-7d13ad32a3b2" +StreamCallbacks = "c1b9e933-98a0-46fc-8ea7-3b58b195fb0a" +Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40" +Unicode = "4ec0a83e-493e-50e2-b9ac-8f72acf5a8f5" + +[compat] +AbstractTrees = "0.4" +Aqua = "0.7" +Base64 = "<0.0.1, 1" +Dates = "<0.0.1, 1" +FlashRank = "0.4" +GoogleGenAI = "0.3" +HTTP = "1.10.8" +JSON3 = "1" +LinearAlgebra = "<0.0.1, 1" +Logging = "<0.0.1, 1" +Markdown = "<0.0.1, 1" +OpenAI = "0.9" +Pkg = "<0.0.1, 1" +PrecompileTools = "1" +Preferences = "1" +PromptingTools = "0.65.0" +REPL = "<0.0.1, 1" +Random = "<0.0.1, 1" +Snowball = "0.1" +SparseArrays = "<0.0.1, 1" +Statistics = "<0.0.1, 1" +StreamCallbacks = "0.4, 0.5" +Test = "<0.0.1, 1" +Unicode = "<0.0.1, 1" +julia = "1.9, 1.10" diff --git a/test/annotation_messages_render.jl b/test/annotation_messages_render.jl new file mode 100644 index 000000000..1f56c2a31 --- /dev/null +++ b/test/annotation_messages_render.jl @@ -0,0 +1,94 @@ +using Test +using PromptingTools +using PromptingTools: OpenAISchema, AnthropicSchema, OllamaSchema, GoogleSchema, TestEchoOpenAISchema, render + +@testset "Annotation Message Rendering" begin + # Create a mix of messages including annotation messages + messages = [ + SystemMessage("Be helpful"), + AnnotationMessage("This is metadata", extras=Dict{Symbol,Any}(:key => "value")), + UserMessage("Hello"), + AnnotationMessage("More metadata"), + AIMessage("Hi there!") + ] + + # Additional edge cases + messages_complex = [ + AnnotationMessage("Metadata 1", extras=Dict{Symbol,Any}(:key => "value")), + AnnotationMessage("Metadata 2", extras=Dict{Symbol,Any}(:key2 => "value2")), + SystemMessage("Be helpful"), + AnnotationMessage("Metadata 3", tags=[:important]), + UserMessage("Hello"), + AnnotationMessage("Metadata 4", comment="For debugging"), + AIMessage("Hi there!"), + AnnotationMessage("Metadata 5", extras=Dict{Symbol,Any}(:key3 => "value3")) + ] + + @testset "Basic Message Filtering" begin + # Test OpenAI Schema with TestEcho + schema = TestEchoOpenAISchema( + response=Dict( + "choices" => [Dict("message" => Dict("content" => "Test response", "role" => "assistant"), "index" => 0, "finish_reason" => "stop")], + "usage" => Dict("prompt_tokens" => 10, "completion_tokens" => 20, "total_tokens" => 30), + "model" => "gpt-3.5-turbo", + "id" => "test-id", + "object" => "chat.completion", + "created" => 1234567890 + ), + status=200 + ) + rendered = render(schema, messages) + @test length(rendered) == 3 # Should only have system, user, and AI messages + @test all(msg["role"] in ["system", "user", "assistant"] for msg in rendered) + @test !any(msg -> contains(msg["content"], "metadata"), rendered) + + # Test Anthropic Schema + rendered = render(AnthropicSchema(), messages) + @test length(rendered.conversation) == 2 # Should have user and AI messages + @test !isnothing(rendered.system) # System message should be preserved separately + @test all(msg["role"] in ["user", "assistant"] for msg in rendered.conversation) + @test !contains(rendered.system, "metadata") # Check system message + @test !any(msg -> any(content -> contains(content["text"], "metadata"), msg["content"]), rendered.conversation) + + # Test Ollama Schema + rendered = render(OllamaSchema(), messages) + @test length(rendered) == 3 # Should only have system, user, and AI messages + @test all(msg["role"] in ["system", "user", "assistant"] for msg in rendered) + @test !any(msg -> contains(msg["content"], "metadata"), rendered) + + # Test Google Schema + rendered = render(GoogleSchema(), messages) + @test length(rendered) == 2 # Google schema combines system message with first user message + @test all(msg[:role] in ["user", "model"] for msg in rendered) # Google uses "model" instead of "assistant" + @test !any(msg -> any(part -> contains(part["text"], "metadata"), msg[:parts]), rendered) + end + + @testset "Complex Edge Cases" begin + # Test with multiple consecutive annotation messages + for schema in [TestEchoOpenAISchema(), AnthropicSchema(), OllamaSchema(), GoogleSchema()] + rendered = render(schema, messages_complex) + + if schema isa AnthropicSchema + @test length(rendered.conversation) == 2 # user and AI only + @test !isnothing(rendered.system) # system preserved + else + @test length(rendered) == (schema isa GoogleSchema ? 2 : 3) # Google schema combines system with user message + end + + # Test no metadata leaks through + for i in 1:5 + if schema isa GoogleSchema + # Google schema uses a different structure + @test !any(msg -> any(part -> contains(part["text"], "Metadata $i"), msg[:parts]), rendered) + elseif schema isa AnthropicSchema + # Check each message's content array for metadata + @test !any(msg -> any(content -> contains(content["text"], "Metadata $i"), msg["content"]), rendered.conversation) + @test !contains(rendered.system, "Metadata $i") + else + # OpenAI and Ollama schemas + @test !any(msg -> contains(msg["content"], "Metadata $i"), rendered) + end + end + end + end +end diff --git a/test/messages.jl b/test/messages.jl index 2ece68c37..6b26d053f 100644 --- a/test/messages.jl +++ b/test/messages.jl @@ -1,10 +1,10 @@ -using PromptingTools: AIMessage, SystemMessage, MetadataMessage, AbstractMessage +using PromptingTools: AIMessage, SystemMessage, MetadataMessage, AbstractMessage, AbstractAnnotationMessage using PromptingTools: UserMessage, UserMessageWithImages, DataMessage, AIToolRequest, ToolMessage using PromptingTools: _encode_local_image, attach_images_to_user_message, last_message, last_output, tool_calls using PromptingTools: isusermessage, issystemmessage, isdatamessage, isaimessage, - istracermessage, isaitoolrequest, istoolmessage + istracermessage, isaitoolrequest, istoolmessage, isabstractannotationmessage using PromptingTools: TracerMessageLike, TracerMessage, align_tracer!, unwrap, AbstractTracerMessage, AbstractTracer, pprint using PromptingTools: TracerSchema, SaverSchema @@ -261,6 +261,50 @@ end @test occursin("Int64", output) end +@testset "AnnotationMessage" begin + # Basic construction + content = "Test annotation" + comment = "For testing purposes" + tags = [:test, :example] + extras = Dict(:key1 => "value1", :key2 => 42) + + msg = AnnotationMessage(content; comment, tags, extras) + @test msg.content == content + @test msg.comment == comment + @test msg.tags == tags + @test msg.extras == extras + @test isabstractannotationmessage(msg) + + # Test show method + io = IOBuffer() + show(io, MIME("text/plain"), msg) + output = String(take!(io)) + @test occursin("AnnotationMessage", output) + @test occursin("Test annotation", output) + @test occursin("test, example", output) + + # Test pprint + pprint(io, msg) + output = String(take!(io)) + @test occursin("Annotation Message", output) + @test occursin("Content: Test annotation", output) + @test occursin("Tags: [:test, :example]", output) + + # Test annotate! utility + msgs = [UserMessage("Hello"), AIMessage("Hi")] + annotated = annotate!(msgs, "Annotation"; tags=[:conversation]) + @test length(annotated) == 3 + @test isabstractannotationmessage(annotated[1]) + @test annotated[1].tags == [:conversation] + + # Test multiple annotations + another_annotation = AnnotationMessage("Another note") + push!(msgs, another_annotation) + annotated = annotate!(msgs, "New annotation") + @test count(isabstractannotationmessage, annotated) == 2 + @test findall(isabstractannotationmessage, annotated) == [1, 2] +end + @testset "TracerMessage,TracerMessageLike" begin # Tracer functionality msg1 = UserMessage("Hi") diff --git a/test/runtests.jl b/test/runtests.jl index 930a83861..84c00db91 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -1,12 +1,13 @@ using PromptingTools +using Test, Pkg +# Ensure test dependencies are loaded +Pkg.activate("test") +Pkg.instantiate() +using Aqua using OpenAI, HTTP, JSON3 using SparseArrays, LinearAlgebra, Markdown using Statistics using Dates: now -using Test, Pkg, Random -const PT = PromptingTools -using Snowball, FlashRank -using Aqua @testset "Code quality (Aqua.jl)" begin # Skipping unbound_args check because we need our `MaybeExtract` type to be unboard diff --git a/test/test_annotation_messages.jl b/test/test_annotation_messages.jl new file mode 100644 index 000000000..4db9c5c2c --- /dev/null +++ b/test/test_annotation_messages.jl @@ -0,0 +1,162 @@ +using Test +using PromptingTools +using PromptingTools: TestEchoOpenAISchema, render, SystemMessage, UserMessage, AIMessage, AnnotationMessage +using PromptingTools: OpenAISchema, AnthropicSchema, OllamaSchema, GoogleSchema + +@testset "AnnotationMessage" begin + # Test creation and basic properties + @testset "Basic Construction" begin + msg = AnnotationMessage(content="Test content") + @test msg.content == "Test content" + @test isempty(msg.extras) + @test !isnothing(msg.run_id) + end + + # Test with all fields + @testset "Full Construction" begin + msg = AnnotationMessage( + content="Full test", + extras=Dict{Symbol,Any}(:key => "value"), + tags=[:test, :example], + comment="Test comment" + ) + @test msg.content == "Full test" + @test msg.extras[:key] == "value" + @test msg.tags == [:test, :example] + @test msg.comment == "Test comment" + end + + # Test annotate! utility + @testset "annotate! utility" begin + # Test with vector of messages + messages = [SystemMessage("System"), UserMessage("User")] + annotated = annotate!(messages, "Annotation") + @test length(annotated) == 3 + @test annotated[1] isa AnnotationMessage + @test annotated[1].content == "Annotation" + + # Test with single message + message = UserMessage("Single") + annotated = annotate!(message, "Single annotation") + @test length(annotated) == 2 + @test annotated[1] isa AnnotationMessage + @test annotated[1].content == "Single annotation" + + # Test annotation placement with existing annotations + messages = [ + AnnotationMessage("First"), + SystemMessage("System"), + UserMessage("User") + ] + annotated = annotate!(messages, "Second") + @test length(annotated) == 4 + @test annotated[2] isa AnnotationMessage + @test annotated[2].content == "Second" + end + + # Test serialization + @testset "Serialization" begin + original = AnnotationMessage( + content="Test", + extras=Dict{Symbol,Any}(:key => "value"), + tags=[:test], + comment="Comment" + ) + + # Convert to Dict and back + dict = Dict(original) + reconstructed = convert(AnnotationMessage, dict) + + @test reconstructed.content == original.content + @test reconstructed.extras == original.extras + @test reconstructed.tags == original.tags + @test reconstructed.comment == original.comment + end + + # Test rendering skipping across all providers + @testset "Render Skipping" begin + # Create a mix of messages including annotation messages + messages = [ + SystemMessage("Be helpful"), + AnnotationMessage("This is metadata", extras=Dict{Symbol,Any}(:key => "value")), + UserMessage("Hello"), + AnnotationMessage("More metadata"), + AIMessage("Hi there!") + ] + + # Additional edge cases + messages_complex = [ + AnnotationMessage("Metadata 1", extras=Dict{Symbol,Any}(:key => "value")), + AnnotationMessage("Metadata 2", extras=Dict{Symbol,Any}(:key2 => "value2")), + SystemMessage("Be helpful"), + AnnotationMessage("Metadata 3", tags=[:important]), + UserMessage("Hello"), + AnnotationMessage("Metadata 4", comment="For debugging"), + AIMessage("Hi there!"), + AnnotationMessage("Metadata 5", extras=Dict{Symbol,Any}(:key3 => "value3")) + ] + + # Test OpenAI Schema with TestEcho + schema = TestEchoOpenAISchema( + response=Dict( + "choices" => [Dict("message" => Dict("content" => "Test response", "role" => "assistant"), "index" => 0, "finish_reason" => "stop")], + "usage" => Dict("prompt_tokens" => 10, "completion_tokens" => 20, "total_tokens" => 30), + "model" => "gpt-3.5-turbo", + "id" => "test-id", + "object" => "chat.completion", + "created" => 1234567890 + ), + status=200 + ) + rendered = render(schema, messages) + @test length(rendered) == 3 # Should only have system, user, and AI messages + @test all(msg["role"] in ["system", "user", "assistant"] for msg in rendered) + @test !any(msg -> contains(msg["content"], "metadata"), rendered) + + # Test Anthropic Schema + rendered = render(AnthropicSchema(), messages) + @test length(rendered.conversation) == 2 # Should have user and AI messages + @test !isnothing(rendered.system) # System message should be preserved separately + @test all(msg["role"] in ["user", "assistant"] for msg in rendered.conversation) + @test !contains(rendered.system, "metadata") # Check system message + @test !any(msg -> any(content -> contains(content["text"], "metadata"), msg["content"]), rendered.conversation) + + # Test Ollama Schema + rendered = render(OllamaSchema(), messages) + @test length(rendered) == 3 # Should only have system, user, and AI messages + @test all(msg["role"] in ["system", "user", "assistant"] for msg in rendered) + @test !any(msg -> contains(msg["content"], "metadata"), rendered) + + # Test Google Schema + rendered = render(GoogleSchema(), messages) + @test length(rendered) == 2 # Google schema combines system message with first user message + @test all(msg[:role] in ["user", "model"] for msg in rendered) # Google uses "model" instead of "assistant" + @test !any(msg -> any(part -> contains(part["text"], "metadata"), msg[:parts]), rendered) + + # Test complex edge cases + @testset "Complex Edge Cases" begin + for schema in [TestEchoOpenAISchema(), AnthropicSchema(), OllamaSchema(), GoogleSchema()] + rendered = render(schema, messages_complex) + + if schema isa AnthropicSchema + @test length(rendered.conversation) == 2 # user and AI only + @test !isnothing(rendered.system) # system preserved + else + @test length(rendered) == (schema isa GoogleSchema ? 2 : 3) # Google schema combines system with user message + end + + # Test no metadata leaks through + for i in 1:5 + if schema isa GoogleSchema + @test !any(msg -> any(part -> contains(part["text"], "Metadata $i"), msg[:parts]), rendered) + elseif schema isa AnthropicSchema + @test !any(msg -> any(content -> contains(content["text"], "Metadata $i"), msg["content"]), rendered.conversation) + @test !contains(rendered.system, "Metadata $i") + else + @test !any(msg -> contains(msg["content"], "Metadata $i"), rendered) + end + end + end + end + end +end