mirror of
https://gh.wpcy.net/https://github.com/discourse/discourse.git
synced 2026-06-19 04:03:45 +08:00
226 lines
6.8 KiB
Ruby
Vendored
226 lines
6.8 KiB
Ruby
Vendored
# frozen_string_literal: true
|
|
|
|
module DiscourseAi
  module AiBot
    # Streams an AI bot reply to the given `io` as a hand-written HTTP/1.1
    # response using chunked transfer encoding. Each chunk body is a JSON
    # document followed by a blank line. The streaming work is posted to a
    # shared thread pool (see .thread_pool / .schedule_block).
    class ResponseHttpStreamer
      # Line terminator used for the status line, headers and chunk framing.
      CRLF = "\r\n"
      # Passed as `max_threads` when the shared thread pool is created.
      POOL_SIZE = 10

      # Status line, response headers and the blank line that ends the header
      # section. The bytes never change, so they are assembled once here and
      # sent with a single write by .write_headers.
      RESPONSE_HEAD =
        [
          "HTTP/1.1 200 OK",
          "Content-Type: text/plain; charset=utf-8",
          "Transfer-Encoding: chunked",
          "Cache-Control: no-cache, no-store, must-revalidate",
          "Connection: close",
          "X-Accel-Buffering: no",
          "X-Content-Type-Options: nosniff",
          "", # empty line terminating the header section
        ].map { |line| "#{line}#{CRLF}" }.join.freeze

      class << self
        # Returns the memoized thread pool used to run streaming jobs.
        def thread_pool
          # we use our thread pool implementation here for a few reasons:
          #
          # 1. Free multisite support
          # 2. Unlike Concurrent::CachedThreadPool, we spin back down to 0 threads automatically see: https://github.com/ruby-concurrency/concurrent-ruby/issues/1075
          # 3. Better internal error handling
          @thread_pool ||=
            Scheduler::ThreadPool.new(min_threads: 0, max_threads: POOL_SIZE, idle_time: 30)
        end

        # Posts +block+ to the shared thread pool. A StandardError raised by the
        # block is reported through Discourse.warn_exception instead of being
        # raised out of the pool job.
        def schedule_block(&block)
          thread_pool.post do
            block.call
          rescue StandardError => e
            Discourse.warn_exception(e, message: "Discourse AI: Unable to stream reply")
          end
        end

        # Queues a streamed reply on the thread pool.
        #
        # When +custom_tools+ or +resume_token+ is present the reply is produced
        # by .stream_custom_tool_reply; otherwise by .stream_standard_reply.
        # Errors are logged (and printed in local Rails environments), and +io+
        # is closed in all cases once the job finishes.
        #
        # keeping this in a static method so we don't capture ENV and other bits
        # this allows us to release memory earlier
        def queue_streamed_reply(
          io:,
          agent:,
          user:,
          topic:,
          query:,
          custom_instructions:,
          current_user:,
          custom_tools: nil,
          resume_token: nil,
          tool_results: nil
        )
          schedule_block do
            if custom_tools.present? || resume_token.present?
              stream_custom_tool_reply(
                io: io,
                agent: agent,
                user: user,
                topic: topic,
                query: query,
                custom_instructions: custom_instructions,
                current_user: current_user,
                custom_tools: custom_tools,
                resume_token: resume_token,
                tool_results: tool_results,
              )
            else
              stream_standard_reply(
                io: io,
                agent: agent,
                user: user,
                topic: topic,
                query: query,
                custom_instructions: custom_instructions,
                current_user: current_user,
              )
            end
          rescue StandardError => e
            # make it a tiny bit easier to debug in dev, this is tricky
            # multi-threaded code that exhibits various limitations in rails
            p e if Rails.env.local?
            Discourse.warn_exception(e, message: "Discourse AI: Unable to stream reply")
          ensure
            io.close
          end
        end

        # Creates the user's post, then streams the bot reply to +io+.
        #
        # The post is created in +topic+ when one is given; otherwise a new
        # private message addressed to +user+ and the agent's user is started.
        # The post is created before any bytes are written, so a failure in
        # PostCreator.create! happens before the response headers are sent.
        # After the headers, one metadata chunk (topic, bot user and agent ids)
        # is written, followed by one chunk per non-empty partial and the chunk
        # terminator. Errors raised after the headers are not reported in-band
        # by this method; they propagate to the caller.
        def stream_standard_reply(
          io:,
          agent:,
          user:,
          topic:,
          query:,
          custom_instructions:,
          current_user:
        )
          post_params = {
            raw: query,
            skip_validations: true,
            custom_fields: {
              DiscourseAi::AiBot::Playground::BYPASS_AI_REPLY_CUSTOM_FIELD => true,
            },
          }

          if topic
            post_params[:topic_id] = topic.id
          else
            post_params[:title] = I18n.t("discourse_ai.ai_bot.default_pm_prefix")
            post_params[:archetype] = Archetype.private_message
            post_params[:target_usernames] = "#{user.username},#{agent.user.username}"
          end

          post = PostCreator.create!(user, post_params)
          # From here on use the topic the post actually landed in (covers the
          # new private message case where no topic was passed in).
          topic = post.topic

          write_headers(io)

          agent_class = DiscourseAi::Agents::Agent.find_by(id: agent.id, user: current_user)
          bot = DiscourseAi::Agents::Bot.as(agent.user, agent: agent_class.new)

          write_chunk(io, { topic_id: topic.id, bot_user_id: agent.user.id, agent_id: agent.id })

          DiscourseAi::AiBot::Playground
            .new(bot)
            .reply_to(post, custom_instructions: custom_instructions) do |partial|
              next if partial.empty?

              write_chunk(io, { partial: partial })
            end

          finish_chunks(io)
        end

        # Streams a reply driven by a StreamReplyCustomToolsSession.
        #
        # `:partial` events are wrapped as `{ partial: payload }`; every other
        # event payload is written as-is. Failures are reported in-band as an
        # `error` event followed by the chunk terminator. Protocol errors are
        # logged and swallowed here; any other StandardError is re-raised after
        # the error frame has been attempted.
        def stream_custom_tool_reply(
          io:,
          agent:,
          user:,
          topic:,
          query:,
          custom_instructions:,
          current_user:,
          custom_tools:,
          resume_token:,
          tool_results:
        )
          # Custom-tool streams always report errors in-band using error events once headers
          # have been emitted.
          write_headers(io)

          session =
            DiscourseAi::AiBot::StreamReplyCustomToolsSession.new(
              agent: agent,
              user: user,
              topic: topic,
              query: query,
              custom_instructions: custom_instructions,
              current_user: current_user,
              custom_tools: custom_tools,
              resume_token: resume_token,
              tool_results: tool_results,
            )

          session.run do |event_type, payload|
            if event_type == :partial
              write_chunk(io, { partial: payload })
            else
              write_chunk(io, payload)
            end
          end

          finish_chunks(io)
        rescue DiscourseAi::AiBot::StreamReplyCustomToolsSession::ProtocolError => e
          Discourse.warn_exception(
            e,
            message: "Discourse AI: Stream reply custom tool protocol error",
          )
          write_chunk(io, { event: "error", error: e.message })
          finish_chunks(io)
        rescue StandardError => e
          # Headers were already sent. Emit an error frame and chunk terminator so clients can
          # safely parse this as a completed stream, then re-raise for centralized logging.
          begin
            write_chunk(
              io,
              {
                event: "error",
                error: I18n.t("discourse_ai.errors.stream_reply_unexpected_error"),
              },
            )
            finish_chunks(io)
          rescue StandardError
            # Best effort only: a failure while writing the error frame must not
            # mask the original exception, which is re-raised below.
          end
          raise e
        end

        # Writes the status line and response headers (RESPONSE_HEAD) to +io+
        # with a single write, then flushes.
        def write_headers(io)
          io.write RESPONSE_HEAD
          io.flush
        end

        # Writes +payload+ to +io+ as one chunk of a chunked HTTP body and
        # flushes. The chunk data is the payload's JSON followed by a blank
        # line; the frame is "<hex byte size>CRLF<data>CRLF".
        def write_chunk(io, payload)
          data = payload.to_json + "\n\n"
          # Tag the data as UTF-8 before it is combined with the framing so the
          # pieces are always encoding-compatible; the size is counted in bytes.
          data.force_encoding("UTF-8")

          # One write per frame rather than four separate writes.
          io.write "#{data.bytesize.to_s(16)}#{CRLF}#{data}#{CRLF}"
          io.flush
        end

        # Writes the zero-length chunk that terminates a chunked body, flushes,
        # and calls +io.done+ when +io+ responds to it.
        def finish_chunks(io)
          io.write "0#{CRLF}#{CRLF}"

          io.flush
          io.done if io.respond_to?(:done)
        end
      end
    end
  end
end
|