| # |
| # Licensed to the Apache Software Foundation (ASF) under one or more |
| # contributor license agreements. See the NOTICE file distributed with |
| # this work for additional information regarding copyright ownership. |
| # The ASF licenses this file to You under the Apache License, Version 2.0 |
| # (the "License"); you may not use this file except in compliance with |
| # the License. You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, software |
| # distributed under the License is distributed on an "AS IS" BASIS, |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # See the License for the specific language governing permissions and |
| # limitations under the License. |
| # |
| |
| BEGIN { |
| $ENV{TEST_ENABLE_CONTROL_API_V1} = "0"; |
| } |
| |
| use t::APISIX 'no_plan'; |
| |
| log_level("info"); |
| repeat_each(1); |
| no_long_string(); |
| no_shuffle(); |
| no_root_location(); |
| |
| add_block_preprocessor(sub { |
| my ($block) = @_; |
| |
| if (!defined $block->request) { |
| $block->set_value("request", "GET /t"); |
| } |
| }); |
| |
| run_tests(); |
| |
| __DATA__ |
| |
| === TEST 1: schema validation - expression strategy requires cost_expr |
| --- config |
| location /t { |
| content_by_lua_block { |
| local plugin = require("apisix.plugins.ai-rate-limiting") |
| local configs = { |
| -- expression without cost_expr |
| { |
| limit = 100, |
| time_window = 60, |
| limit_strategy = "expression", |
| }, |
| -- expression with empty cost_expr |
| { |
| limit = 100, |
| time_window = 60, |
| limit_strategy = "expression", |
| cost_expr = "", |
| }, |
| -- expression with invalid cost_expr syntax |
| { |
| limit = 100, |
| time_window = 60, |
| limit_strategy = "expression", |
| cost_expr = "invalid $$$ syntax %%%", |
| }, |
| -- valid expression |
| { |
| limit = 100, |
| time_window = 60, |
| limit_strategy = "expression", |
| cost_expr = "input_tokens + output_tokens", |
| }, |
| -- valid complex expression |
| { |
| limit = 100, |
| time_window = 60, |
| limit_strategy = "expression", |
| cost_expr = "(input_tokens - cache_read_input_tokens) + cache_creation_input_tokens * 1.25 + output_tokens", |
| }, |
| } |
| for i, conf in ipairs(configs) do |
| local ok, err = plugin.check_schema(conf) |
| if ok then |
| ngx.say("config " .. i .. ": valid") |
| else |
| ngx.say("config " .. i .. ": invalid") |
| end |
| end |
| } |
| } |
| --- response_body |
| config 1: invalid |
| config 2: invalid |
| config 3: invalid |
| config 4: valid |
| config 5: valid |
| |
| |
| |
| === TEST 2: set route with expression rate limiting (non-streaming, native Anthropic) |
| --- config |
| location /t { |
| content_by_lua_block { |
| local t = require("lib.test_admin").test |
| local code, body = t('/apisix/admin/routes/1', |
| ngx.HTTP_PUT, |
| [[{ |
| "uri": "/v1/messages", |
| "plugins": { |
| "ai-proxy": { |
| "provider": "anthropic", |
| "auth": { |
| "header": { |
| "x-api-key": "test-key", |
| "anthropic-version": "2023-06-01" |
| } |
| }, |
| "options": { |
| "model": "claude-sonnet-4-20250514" |
| }, |
| "override": { |
| "endpoint": "http://127.0.0.1:1980" |
| }, |
| "ssl_verify": false |
| }, |
| "ai-rate-limiting": { |
| "limit": 500, |
| "time_window": 60, |
| "limit_strategy": "expression", |
| "cost_expr": "input_tokens + cache_creation_input_tokens + output_tokens" |
| } |
| }, |
| "upstream": { |
| "type": "roundrobin", |
| "nodes": { |
| "canbeanything.com": 1 |
| } |
| } |
| }]] |
| ) |
| |
| if code >= 300 then |
| ngx.status = code |
| end |
| ngx.say(body) |
| } |
| } |
| --- response_body |
| passed |
| |
| |
| |
| === TEST 3: non-streaming request - expression counts input_tokens + cache_creation + output_tokens |
| --- more_headers |
| X-AI-Fixture: anthropic/messages-with-cache.json |
| --- pipelined_requests eval |
| [ |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"messages":[{"role":"user","content":"Hello"}]}', |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"messages":[{"role":"user","content":"Hello"}]}', |
| ] |
| --- response_headers_like eval |
| [ |
| "X-AI-RateLimit-Remaining-ai-proxy-anthropic: 500", |
| "X-AI-RateLimit-Remaining-ai-proxy-anthropic: 320", |
| ] |
| --- no_error_log |
| [error] |
| |
| |
| |
| === TEST 4: set route with expression rate limiting (streaming, native Anthropic) |
| --- config |
| location /t { |
| content_by_lua_block { |
| local t = require("lib.test_admin").test |
| local code, body = t('/apisix/admin/routes/1', |
| ngx.HTTP_PUT, |
| [[{ |
| "uri": "/v1/messages", |
| "plugins": { |
| "ai-proxy": { |
| "provider": "anthropic", |
| "auth": { |
| "header": { |
| "x-api-key": "test-key", |
| "anthropic-version": "2023-06-01" |
| } |
| }, |
| "options": { |
| "model": "claude-sonnet-4-20250514" |
| }, |
| "override": { |
| "endpoint": "http://127.0.0.1:1980" |
| }, |
| "ssl_verify": false |
| }, |
| "ai-rate-limiting": { |
| "limit": 500, |
| "time_window": 60, |
| "limit_strategy": "expression", |
| "cost_expr": "input_tokens + cache_creation_input_tokens + output_tokens" |
| } |
| }, |
| "upstream": { |
| "type": "roundrobin", |
| "nodes": { |
| "canbeanything.com": 1 |
| } |
| } |
| }]] |
| ) |
| |
| if code >= 300 then |
| ngx.status = code |
| end |
| ngx.say(body) |
| } |
| } |
| --- response_body |
| passed |
| |
| |
| |
| === TEST 5: streaming request - verify token usage accumulation and rate limiting |
| --- more_headers |
| X-AI-Fixture: anthropic/messages-streaming-with-cache.sse |
| --- pipelined_requests eval |
| [ |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"stream":true,"messages":[{"role":"user","content":"Hello"}]}', |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"stream":true,"messages":[{"role":"user","content":"Hello"}]}', |
| ] |
| --- response_headers_like eval |
| [ |
| "X-AI-RateLimit-Remaining-ai-proxy-anthropic: 500", |
| "X-AI-RateLimit-Remaining-ai-proxy-anthropic: 320", |
| ] |
| --- no_error_log |
| [error] |
| |
| |
| |
| === TEST 6: set route with cache-aware ITPM expression (excludes cache_read_input_tokens) |
| --- config |
| location /t { |
| content_by_lua_block { |
| local t = require("lib.test_admin").test |
| local code, body = t('/apisix/admin/routes/1', |
| ngx.HTTP_PUT, |
| [[{ |
| "uri": "/v1/messages", |
| "plugins": { |
| "ai-proxy": { |
| "provider": "anthropic", |
| "auth": { |
| "header": { |
| "x-api-key": "test-key", |
| "anthropic-version": "2023-06-01" |
| } |
| }, |
| "options": { |
| "model": "claude-sonnet-4-20250514" |
| }, |
| "override": { |
| "endpoint": "http://127.0.0.1:1980" |
| }, |
| "ssl_verify": false |
| }, |
| "ai-rate-limiting": { |
| "limit": 100, |
| "time_window": 60, |
| "limit_strategy": "expression", |
| "cost_expr": "input_tokens + cache_creation_input_tokens" |
| } |
| }, |
| "upstream": { |
| "type": "roundrobin", |
| "nodes": { |
| "canbeanything.com": 1 |
| } |
| } |
| }]] |
| ) |
| |
| if code >= 300 then |
| ngx.status = code |
| end |
| ngx.say(body) |
| } |
| } |
| --- response_body |
| passed |
| |
| |
| |
| === TEST 7: cache-aware ITPM - cost=150 exceeds limit=100 after first request, second rejected |
| --- more_headers |
| X-AI-Fixture: anthropic/messages-with-cache.json |
| --- pipelined_requests eval |
| [ |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"messages":[{"role":"user","content":"Hello"}]}', |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"messages":[{"role":"user","content":"Hello"}]}', |
| ] |
| --- error_code eval |
| [200, 503] |
| --- no_error_log |
| [error] |
| |
| |
| |
| === TEST 8: set route with weighted expression (cache_read costs 10%, cache_creation costs 125%) |
| --- config |
| location /t { |
| content_by_lua_block { |
| local t = require("lib.test_admin").test |
| local code, body = t('/apisix/admin/routes/1', |
| ngx.HTTP_PUT, |
| [[{ |
| "uri": "/v1/messages", |
| "plugins": { |
| "ai-proxy": { |
| "provider": "anthropic", |
| "auth": { |
| "header": { |
| "x-api-key": "test-key", |
| "anthropic-version": "2023-06-01" |
| } |
| }, |
| "options": { |
| "model": "claude-sonnet-4-20250514" |
| }, |
| "override": { |
| "endpoint": "http://127.0.0.1:1980" |
| }, |
| "ssl_verify": false |
| }, |
| "ai-rate-limiting": { |
| "limit": 1000, |
| "time_window": 60, |
| "limit_strategy": "expression", |
| "cost_expr": "input_tokens + cache_read_input_tokens * 0.1 + cache_creation_input_tokens * 1.25 + output_tokens" |
| } |
| }, |
| "upstream": { |
| "type": "roundrobin", |
| "nodes": { |
| "canbeanything.com": 1 |
| } |
| } |
| }]] |
| ) |
| |
| if code >= 300 then |
| ngx.status = code |
| end |
| ngx.say(body) |
| } |
| } |
| --- response_body |
| passed |
| |
| |
| |
| === TEST 9: weighted expression - two requests (cost = 50 + 200*0.1 + 100*1.25 + 30 = 225 each) |
| --- more_headers |
| X-AI-Fixture: anthropic/messages-with-cache.json |
| --- pipelined_requests eval |
| [ |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"messages":[{"role":"user","content":"Hello"}]}', |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"messages":[{"role":"user","content":"Hello"}]}', |
| ] |
| --- response_headers_like eval |
| [ |
| "X-AI-RateLimit-Remaining-ai-proxy-anthropic: 1000", |
| "X-AI-RateLimit-Remaining-ai-proxy-anthropic: 775", |
| ] |
| --- no_error_log |
| [error] |
| |
| |
| |
| === TEST 10: expression with missing variables defaults to 0 |
| --- config |
| location /t { |
| content_by_lua_block { |
| local t = require("lib.test_admin").test |
| local code, body = t('/apisix/admin/routes/1', |
| ngx.HTTP_PUT, |
| [[{ |
| "uri": "/v1/messages", |
| "plugins": { |
| "ai-proxy": { |
| "provider": "anthropic", |
| "auth": { |
| "header": { |
| "x-api-key": "test-key", |
| "anthropic-version": "2023-06-01" |
| } |
| }, |
| "options": { |
| "model": "claude-sonnet-4-20250514" |
| }, |
| "override": { |
| "endpoint": "http://127.0.0.1:1980" |
| }, |
| "ssl_verify": false |
| }, |
| "ai-rate-limiting": { |
| "limit": 500, |
| "time_window": 60, |
| "limit_strategy": "expression", |
| "cost_expr": "input_tokens + nonexistent_field + output_tokens" |
| } |
| }, |
| "upstream": { |
| "type": "roundrobin", |
| "nodes": { |
| "canbeanything.com": 1 |
| } |
| } |
| }]] |
| ) |
| |
| if code >= 300 then |
| ngx.status = code |
| end |
| ngx.say(body) |
| } |
| } |
| --- response_body |
| passed |
| |
| |
| |
| === TEST 11: missing variable defaults to 0 - cost = 50 + 0 + 30 = 80 per request |
| --- more_headers |
| X-AI-Fixture: anthropic/messages-with-cache.json |
| --- pipelined_requests eval |
| [ |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"messages":[{"role":"user","content":"Hello"}]}', |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"messages":[{"role":"user","content":"Hello"}]}', |
| ] |
| --- response_headers_like eval |
| [ |
| "X-AI-RateLimit-Remaining-ai-proxy-anthropic: 500", |
| "X-AI-RateLimit-Remaining-ai-proxy-anthropic: 420", |
| ] |
| --- no_error_log |
| [error] |
| |
| |
| |
| === TEST 12: set route with expression that can yield negative cost |
| --- config |
| location /t { |
| content_by_lua_block { |
| local t = require("lib.test_admin").test |
| local code, body = t('/apisix/admin/routes/1', |
| ngx.HTTP_PUT, |
| [[{ |
| "uri": "/v1/messages", |
| "plugins": { |
| "ai-proxy": { |
| "provider": "anthropic", |
| "auth": { |
| "header": { |
| "x-api-key": "test-key", |
| "anthropic-version": "2023-06-01" |
| } |
| }, |
| "options": { |
| "model": "claude-sonnet-4-20250514" |
| }, |
| "override": { |
| "endpoint": "http://127.0.0.1:1980" |
| }, |
| "ssl_verify": false |
| }, |
| "ai-rate-limiting": { |
| "limit": 100, |
| "time_window": 60, |
| "limit_strategy": "expression", |
| "cost_expr": "input_tokens - cache_read_input_tokens" |
| } |
| }, |
| "upstream": { |
| "type": "roundrobin", |
| "nodes": { |
| "canbeanything.com": 1 |
| } |
| } |
| }]] |
| ) |
| |
| if code >= 300 then |
| ngx.status = code |
| end |
| ngx.say(body) |
| } |
| } |
| --- response_body |
| passed |
| |
| |
| |
| === TEST 13: negative expression result clamped to 0 - cost = 50 - 200 = -150, clamped to 0 |
| --- more_headers |
| X-AI-Fixture: anthropic/messages-with-cache.json |
| --- pipelined_requests eval |
| [ |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"messages":[{"role":"user","content":"Hello"}]}', |
| "POST /v1/messages\n" . '{"model":"claude-sonnet-4-20250514","max_tokens":1024,"messages":[{"role":"user","content":"Hello"}]}', |
| ] |
| --- response_headers_like eval |
| [ |
| "X-AI-RateLimit-Remaining-ai-proxy-anthropic: 100", |
| "X-AI-RateLimit-Remaining-ai-proxy-anthropic: 100", |
| ] |
| --- no_error_log |
| [error] |