feat(ai): improve analytics report (#12924)
Add new AI analytics counters to the anonymous PING report

Co-authored-by: Jack Tysoe <[email protected]>
AntoineJac and tysoekong committed Apr 26, 2024
1 parent 3980a63 commit c6a8ef8
Showing 4 changed files with 279 additions and 2 deletions.
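
For orientation before the per-file diffs, here is a minimal sketch of the data flow this commit introduces. It is framed as it runs inside kong/reports.lua, reusing that file's local incr_counter and get_counter helpers shown below; the assumption that the ai-proxy plugin stores per-request token counts on kong.ctx.shared is exactly what the new report code relies on.

    -- Sketch only; counter keys and ping field names mirror the diff below.
    -- Log phase: pick up values the AI plugin is assumed to have stored on
    -- the shared per-request context, and accumulate them in the 'kong' shm.
    if kong.ctx.shared.ai_prompt_tokens then
      incr_counter("events:ai:requests") -- one AI-handled request
      incr_counter("events:ai:prompt_tokens", kong.ctx.shared.ai_prompt_tokens)
    end
    if kong.ctx.shared.ai_response_tokens then
      incr_counter("events:ai:response_tokens", kong.ctx.shared.ai_response_tokens)
    end

    -- Ping phase: attach the accumulated totals to the anonymous report,
    -- then reset the counters.
    _ping_infos.ai_prompt_tokens   = get_counter("events:ai:prompt_tokens")
    _ping_infos.ai_response_tokens = get_counter("events:ai:response_tokens")
    _ping_infos.ai_reqs            = get_counter("events:ai:requests")

The resulting ping payload therefore gains fields of the form ai_prompt_tokens=10, ai_response_tokens=8 and ai_reqs=1, which are the values the new integration spec asserts against.
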
3 changes: 3 additions & 0 deletions changelog/unreleased/kong/add-ai-data-report.yml
@@ -0,0 +1,3 @@
"message": Add `events:ai:response_tokens`, `events:ai:prompt_tokens` and `events:ai:requests` to the anonymous report to start counting AI usage
"type": feature
"scope": Core
3 changes: 3 additions & 0 deletions kong/init.lua
@@ -233,6 +233,9 @@ do
"events:streams",
"events:streams:tcp",
"events:streams:tls",
"events:ai:response_tokens",
"events:ai:prompt_tokens",
"events:ai:requests",
}

reset_kong_shm = function(config)
36 changes: 34 additions & 2 deletions kong/reports.lua
@@ -53,6 +53,11 @@ local GO_PLUGINS_REQUEST_COUNT_KEY = "events:requests:go_plugins"
local WASM_REQUEST_COUNT_KEY = "events:requests:wasm"


local AI_RESPONSE_TOKENS_COUNT_KEY = "events:ai:response_tokens"
local AI_PROMPT_TOKENS_COUNT_KEY = "events:ai:prompt_tokens"
local AI_REQUEST_COUNT_KEY = "events:ai:requests"


local ROUTE_CACHE_HITS_KEY = "route_cache_hits"
local STEAM_ROUTE_CACHE_HITS_KEY_POS = STREAM_COUNT_KEY .. ":" .. ROUTE_CACHE_HITS_KEY .. ":pos"
local STEAM_ROUTE_CACHE_HITS_KEY_NEG = STREAM_COUNT_KEY .. ":" .. ROUTE_CACHE_HITS_KEY .. ":neg"
@@ -240,8 +245,12 @@ local function reset_counter(key, amount)
end


local function incr_counter(key)
local ok, err = report_counter:incr(key, 1)
local function incr_counter(key, hit)
if not hit then
hit = 1
end

local ok, err = report_counter:incr(key, hit)
if not ok then
log(WARN, "could not increment ", key, " in 'kong' shm: ", err)
end
@@ -327,6 +336,10 @@ local function send_ping(host, port)
_ping_infos.stream_route_cache_hit_pos = get_counter(STEAM_ROUTE_CACHE_HITS_KEY_POS)
_ping_infos.stream_route_cache_hit_neg = get_counter(STEAM_ROUTE_CACHE_HITS_KEY_NEG)

_ping_infos.ai_response_tokens = get_counter(AI_RESPONSE_TOKENS_COUNT_KEY)
_ping_infos.ai_prompt_tokens = get_counter(AI_PROMPT_TOKENS_COUNT_KEY)
_ping_infos.ai_reqs = get_counter(AI_REQUEST_COUNT_KEY)

send_report("ping", _ping_infos, host, port)

reset_counter(STREAM_COUNT_KEY, _ping_infos.streams)
@@ -337,6 +350,9 @@ local function send_ping(host, port)
reset_counter(WASM_REQUEST_COUNT_KEY, _ping_infos.wasm_reqs)
reset_counter(STEAM_ROUTE_CACHE_HITS_KEY_POS, _ping_infos.stream_route_cache_hit_pos)
reset_counter(STEAM_ROUTE_CACHE_HITS_KEY_NEG, _ping_infos.stream_route_cache_hit_neg)
reset_counter(AI_RESPONSE_TOKENS_COUNT_KEY, _ping_infos.ai_response_tokens)
reset_counter(AI_PROMPT_TOKENS_COUNT_KEY, _ping_infos.ai_prompt_tokens)
reset_counter(AI_REQUEST_COUNT_KEY, _ping_infos.ai_reqs)
return
end

@@ -353,6 +369,10 @@ local function send_ping(host, port)
_ping_infos.go_plugin_reqs = get_counter(GO_PLUGINS_REQUEST_COUNT_KEY)
_ping_infos.wasm_reqs = get_counter(WASM_REQUEST_COUNT_KEY)

_ping_infos.ai_response_tokens = get_counter(AI_RESPONSE_TOKENS_COUNT_KEY)
_ping_infos.ai_prompt_tokens = get_counter(AI_PROMPT_TOKENS_COUNT_KEY)
_ping_infos.ai_reqs = get_counter(AI_REQUEST_COUNT_KEY)

_ping_infos.request_route_cache_hit_pos = get_counter(REQUEST_ROUTE_CACHE_HITS_KEY_POS)
_ping_infos.request_route_cache_hit_neg = get_counter(REQUEST_ROUTE_CACHE_HITS_KEY_NEG)

@@ -372,6 +392,9 @@ local function send_ping(host, port)
reset_counter(WASM_REQUEST_COUNT_KEY, _ping_infos.wasm_reqs)
reset_counter(REQUEST_ROUTE_CACHE_HITS_KEY_POS, _ping_infos.request_route_cache_hit_pos)
reset_counter(REQUEST_ROUTE_CACHE_HITS_KEY_NEG, _ping_infos.request_route_cache_hit_neg)
reset_counter(AI_RESPONSE_TOKENS_COUNT_KEY, _ping_infos.ai_response_tokens)
reset_counter(AI_PROMPT_TOKENS_COUNT_KEY, _ping_infos.ai_prompt_tokens)
reset_counter(AI_REQUEST_COUNT_KEY, _ping_infos.ai_reqs)
end


@@ -496,6 +519,15 @@ return {
incr_counter(WASM_REQUEST_COUNT_KEY)
end

if kong.ctx.shared.ai_prompt_tokens then
incr_counter(AI_REQUEST_COUNT_KEY)
incr_counter(AI_PROMPT_TOKENS_COUNT_KEY, kong.ctx.shared.ai_prompt_tokens)
end

if kong.ctx.shared.ai_response_tokens then
incr_counter(AI_RESPONSE_TOKENS_COUNT_KEY, kong.ctx.shared.ai_response_tokens)
end

local suffix = get_current_suffix(ctx)
if suffix then
incr_counter(count_key .. ":" .. suffix)
239 changes: 239 additions & 0 deletions spec/02-integration/22-ai_plugins/01-reports_spec.lua
@@ -0,0 +1,239 @@
local helpers = require "spec.helpers"
local constants = require "kong.constants"
local cjson = require "cjson"
local pl_file = require "pl.file"

local PLUGIN_NAME = "ai-proxy"
local MOCK_PORT = helpers.get_available_port()

for _, strategy in helpers.each_strategy() do
local admin_client
local dns_hostsfile
local reports_server

describe("anonymous reports for ai plugins #" .. strategy, function()
local reports_send_ping = function(port)
assert.eventually(function()
admin_client = helpers.admin_client()
local res = admin_client:post("/reports/send-ping" .. (port and "?port=" .. port or ""))
assert.response(res).has_status(200)
admin_client:close()
end)
.has_no_error("ping request was sent successfully")
end

lazy_setup(function()
dns_hostsfile = assert(os.tmpname() .. ".hosts")
local fd = assert(io.open(dns_hostsfile, "w"))
assert(fd:write("127.0.0.1 " .. constants.REPORTS.ADDRESS))
assert(fd:close())

local bp = assert(helpers.get_db_utils(strategy, {
"services",
"routes",
"plugins",
}, { "reports-api" }))

-- set up openai mock fixtures
local fixtures = {
http_mock = {},
}

fixtures.http_mock.openai = [[
server {
server_name openai;
listen ]]..MOCK_PORT..[[;
default_type 'application/json';
location = "/llm/v1/chat/good" {
content_by_lua_block {
local pl_file = require "pl.file"
local json = require("cjson.safe")
ngx.req.read_body()
local body, err = ngx.req.get_body_data()
body, err = json.decode(body)
local token = ngx.req.get_headers()["authorization"]
local token_query = ngx.req.get_uri_args()["apikey"]
if token == "Bearer openai-key" or token_query == "openai-key" or body.apikey == "openai-key" then
ngx.req.read_body()
local body, err = ngx.req.get_body_data()
body, err = json.decode(body)
if err or (body.messages == ngx.null) then
ngx.status = 400
ngx.print(pl_file.read("spec/fixtures/ai-proxy/openai/llm-v1-chat/responses/bad_request.json"))
else
ngx.status = 200
ngx.print(pl_file.read("spec/fixtures/ai-proxy/openai/llm-v1-chat/responses/good.json"))
end
else
ngx.status = 401
ngx.print(pl_file.read("spec/fixtures/ai-proxy/openai/llm-v1-chat/responses/unauthorized.json"))
end
}
}
}
]]

local http_srv = assert(bp.services:insert {
name = "mock-service",
host = helpers.mock_upstream_host,
port = helpers.mock_upstream_port,
})

local chat_good = assert(bp.routes:insert {
service = http_srv,
protocols = { "http" },
hosts = { "http-service.test" }
})

local chat_good_2 = assert(bp.routes:insert {
service = http_srv,
protocols = { "http" },
hosts = { "http-service.test_2" }
})

bp.plugins:insert({
name = "reports-api",
config = {}
})

bp.plugins:insert {
name = PLUGIN_NAME,
route = { id = chat_good.id },
config = {
route_type = "llm/v1/chat",
logging = {
log_payloads = false,
log_statistics = true,
},
auth = {
header_name = "Authorization",
header_value = "Bearer openai-key",
},
model = {
name = "gpt-3.5-turbo",
provider = "openai",
options = {
max_tokens = 256,
temperature = 1.0,
upstream_url = "http://"..helpers.mock_upstream_host..":"..MOCK_PORT.."/llm/v1/chat/good"
},
},
},
}

bp.plugins:insert {
name = PLUGIN_NAME,
route = { id = chat_good_2.id },
config = {
route_type = "llm/v1/chat",
logging = {
log_payloads = false,
log_statistics = false, -- reporting should also work with statistics disabled
},
auth = {
header_name = "Authorization",
header_value = "Bearer openai-key",
},
model = {
name = "gpt-3.5-turbo",
provider = "openai",
options = {
max_tokens = 256,
temperature = 1.0,
upstream_url = "http://"..helpers.mock_upstream_host..":"..MOCK_PORT.."/llm/v1/chat/good"
},
},
},
}

assert(helpers.start_kong({
nginx_conf = "spec/fixtures/custom_nginx.template",
database = strategy,
dns_hostsfile = dns_hostsfile,
plugins = "bundled,reports-api",
anonymous_reports = true,
}, nil, nil, fixtures))

end)

lazy_teardown(function()
os.remove(dns_hostsfile)

helpers.stop_kong()
end)

before_each(function()
reports_server = helpers.tcp_server(constants.REPORTS.STATS_TLS_PORT, {tls=true})
end)

describe("check report has ai data", function()
it("logs correct data for report on a request triggering a ai plugin", function()
local proxy_client = assert(helpers.proxy_client())
local res = proxy_client:get("/", {
headers = {
["content-type"] = "application/json",
["accept"] = "application/json",
["host"] = "http-service.test",
},
body = pl_file.read("spec/fixtures/ai-proxy/openai/llm-v1-chat/requests/good.json"),
})
assert.res_status(200, res)

reports_send_ping(constants.REPORTS.STATS_TLS_PORT)

proxy_client:close()

local _, reports_data = assert(reports_server:join())
reports_data = cjson.encode(reports_data)

assert.match("ai_response_tokens=8", reports_data)
assert.match("ai_prompt_tokens=10", reports_data)
assert.match("ai_reqs=1", reports_data)
end)

it("logs correct data for a different routes triggering a ai plugin", function()
local proxy_client = assert(helpers.proxy_client())
local res = proxy_client:get("/", {
headers = {
["content-type"] = "application/json",
["accept"] = "application/json",
["host"] = "http-service.test",
},
body = pl_file.read("spec/fixtures/ai-proxy/openai/llm-v1-chat/requests/good.json"),
})
assert.res_status(200, res)

local proxy_client_2 = assert(helpers.proxy_client())
local res_2 = proxy_client_2:get("/", {
headers = {
["content-type"] = "application/json",
["accept"] = "application/json",
["host"] = "http-service.test_2",
},
body = pl_file.read("spec/fixtures/ai-proxy/openai/llm-v1-chat/requests/good.json"),
})
assert.res_status(200, res_2)

reports_send_ping(constants.REPORTS.STATS_TLS_PORT)

proxy_client:close()
proxy_client_2:close()

local _, reports_data = assert(reports_server:join())
reports_data = cjson.encode(reports_data)

assert.match("ai_response_tokens=16", reports_data)
assert.match("ai_prompt_tokens=20", reports_data)
assert.match("ai_reqs=2", reports_data)
end)
end)

end)
end

1 comment on commit c6a8ef8

@github-actions
Contributor

Bazel Build

Docker image available kong/kong:c6a8ef87b4199fa0608d2fc5f41792dd46fa69a2
Artifacts available https://github.com/Kong/kong/actions/runs/8851283503
