chore: rectify business logic/code in ai-proxy (apache#12055)

shreemaan-abhishek · web-flow · commit 99a079258d39 · 2025-03-17T19:29:37.000+05:45
diff --git a/apisix/init.lua b/apisix/init.lua
@@ -453,6 +453,12 @@ end
 
 
 function _M.handle_upstream(api_ctx, route, enable_websocket)
+    -- some plugins(ai-proxy...) request upstream by http client directly
+    if api_ctx.bypass_nginx_upstream then
+        common_phase("before_proxy")
+        return
+    end
+
     local up_id = route.value.upstream_id
 
     -- used for the traffic-split plugin
diff --git a/apisix/plugins/ai-drivers/openai-base.lua b/apisix/plugins/ai-drivers/openai-base.lua
@@ -141,22 +141,25 @@ end
 function _M.read_response(ctx, res)
     local body_reader = res.body_reader
     if not body_reader then
-        core.log.error("AI service sent no response body")
+        core.log.warn("AI service sent no response body")
         return 500
     end
 
     local content_type = res.headers["Content-Type"]
     core.response.set_header("Content-Type", content_type)
 
-    if core.string.find(content_type, "text/event-stream") then
+    if content_type and core.string.find(content_type, "text/event-stream") then
         while true do
             local chunk, err = body_reader() -- will read chunk by chunk
             if err then
-                core.log.error("failed to read response chunk: ", err)
-                break
+                core.log.warn("failed to read response chunk: ", err)
+                if core.string.find(err, "timeout") then
+                    return 504
+                end
+                return 500
             end
             if not chunk then
-                break
+                return
             end
 
             ngx_print(chunk)
@@ -192,6 +195,8 @@ function _M.read_response(ctx, res)
 
                 -- usage field is null for non-last events, null is parsed as userdata type
                 if data and data.usage and type(data.usage) ~= "userdata" then
+                    core.log.info("got token usage from ai service: ",
+                                        core.json.delay_encode(data.usage))
                     ctx.ai_token_usage = {
                         prompt_tokens = data.usage.prompt_tokens or 0,
                         completion_tokens = data.usage.completion_tokens or 0,
@@ -202,19 +207,22 @@ function _M.read_response(ctx, res)
 
             ::CONTINUE::
         end
-        return
     end
 
     local raw_res_body, err = res:read_body()
     if not raw_res_body then
-        core.log.error("failed to read response body: ", err)
+        core.log.warn("failed to read response body: ", err)
+        if core.string.find(err, "timeout") then
+            return 504
+        end
         return 500
     end
     local res_body, err = core.json.decode(raw_res_body)
     if err then
         core.log.warn("invalid response body from ai service: ", raw_res_body, " err: ", err,
             ", it will cause token usage not available")
     else
+        core.log.info("got token usage from ai service: ", core.json.delay_encode(res_body.usage))
         ctx.ai_token_usage = {
             prompt_tokens = res_body.usage and res_body.usage.prompt_tokens or 0,
             completion_tokens = res_body.usage and res_body.usage.completion_tokens or 0,
diff --git a/apisix/plugins/ai-proxy-multi.lua b/apisix/plugins/ai-proxy-multi.lua
@@ -217,6 +217,7 @@ function _M.access(conf, ctx)
     end
     ctx.picked_ai_instance_name = name
     ctx.picked_ai_instance = ai_instance
+    ctx.bypass_nginx_upstream = true
 end
 
 
diff --git a/apisix/plugins/ai-proxy.lua b/apisix/plugins/ai-proxy.lua
@@ -47,6 +47,7 @@ end
 function _M.access(conf, ctx)
     ctx.picked_ai_instance_name = "ai-proxy"
     ctx.picked_ai_instance = conf
+    ctx.bypass_nginx_upstream = true
 end
 
 
diff --git a/apisix/plugins/ai-proxy/base.lua b/apisix/plugins/ai-proxy/base.lua
@@ -46,7 +46,10 @@ function _M.before_proxy(conf, ctx)
 
     local res, err = ai_driver:request(conf, request_body, extra_opts)
     if not res then
-        core.log.error("failed to send request to AI service: ", err)
+        core.log.warn("failed to send request to AI service: ", err)
+        if core.string.find(err, "timeout") then
+            return 504
+        end
         return internal_server_error
     end
 
diff --git a/apisix/plugins/ai-proxy/schema.lua b/apisix/plugins/ai-proxy/schema.lua
@@ -120,7 +120,7 @@ local ai_instance_schema = {
                 },
             },
         },
-        required = {"name", "provider", "auth"}
+        required = {"name", "provider", "auth", "weight"}
     },
 }
 
@@ -139,7 +139,6 @@ _M.ai_proxy_schema = {
         timeout = {
             type = "integer",
             minimum = 1,
-            maximum = 60000,
             default = 30000,
             description = "timeout in milliseconds",
         },
@@ -196,7 +195,6 @@ _M.ai_proxy_multi_schema = {
         timeout = {
             type = "integer",
             minimum = 1,
-            maximum = 60000,
             default = 30000,
             description = "timeout in milliseconds",
         },
diff --git a/t/plugin/ai-proxy-multi.balancer.t b/t/plugin/ai-proxy-multi.balancer.t
@@ -198,12 +198,6 @@ __DATA__
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
@@ -308,12 +302,6 @@ deepseek.deepseek.openai.openai.openai.openai.openai.openai.openai.openai
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
diff --git a/t/plugin/ai-proxy-multi.openai-compatible.t b/t/plugin/ai-proxy-multi.openai-compatible.t
@@ -160,12 +160,6 @@ __DATA__
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
@@ -227,12 +221,6 @@ qr/\{ "content": "1 \+ 1 = 2\.", "role": "assistant" \}/
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                  }]]
             )
diff --git a/t/plugin/ai-proxy-multi.t b/t/plugin/ai-proxy-multi.t
@@ -230,12 +230,6 @@ qr/.*property "provider" validation failed: matches none of the enum values*/
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
@@ -294,12 +288,6 @@ Unauthorized
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
@@ -417,12 +405,6 @@ request format doesn't match schema: property "messages" is required
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                  }]]
             )
@@ -492,12 +474,6 @@ options_works
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                  }]]
             )
@@ -567,12 +543,6 @@ path override works
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                  }]]
             )
diff --git a/t/plugin/ai-proxy-multi2.t b/t/plugin/ai-proxy-multi2.t
@@ -145,12 +145,6 @@ __DATA__
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                  }]]
             )
@@ -209,12 +203,6 @@ Unauthorized
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                  }]]
             )
@@ -333,12 +321,6 @@ POST /anything
                             ],
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                  }]]
             )
diff --git a/t/plugin/ai-proxy.openai-compatible.t b/t/plugin/ai-proxy.openai-compatible.t
@@ -148,12 +148,6 @@ __DATA__
                             },
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
@@ -208,12 +202,6 @@ qr/\{ "content": "1 \+ 1 = 2\.", "role": "assistant" \}/
                             },
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
@@ -277,12 +265,6 @@ path override works
                             },
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
diff --git a/t/plugin/ai-proxy.t b/t/plugin/ai-proxy.t
@@ -206,12 +206,6 @@ qr/.*property "provider" validation failed: matches none of the enum values.*/
                             },
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
@@ -264,12 +258,6 @@ Unauthorized
                             },
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
@@ -381,12 +369,6 @@ request format doesn't match schema: property "messages" is required
                             },
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
@@ -450,12 +432,6 @@ options_works
                             },
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
@@ -519,12 +495,6 @@ path override works
                             },
                             "ssl_verify": false
                         }
-                    },
-                    "upstream": {
-                        "type": "roundrobin",
-                        "nodes": {
-                            "canbeanything.com": 1
-                        }
                     }
                 }]]
             )
diff --git a/t/plugin/ai-proxy2.t b/t/plugin/ai-proxy2.t

Original file line number	Diff line number	Diff line change
`@@ -198,12 +198,6 @@ __DATA__`
`198`	`198`	`],`
`199`	`199`	`"ssl_verify": false`
`200`	`200`	`}`
`201`		`- },`
`202`		`- "upstream": {`
`203`		`- "type": "roundrobin",`
`204`		`- "nodes": {`
`205`		`- "canbeanything.com": 1`
`206`		`- }`
`207`	`201`	`}`
`208`	`202`	`}]]`
`209`	`203`	`)`
`@@ -308,12 +302,6 @@ deepseek.deepseek.openai.openai.openai.openai.openai.openai.openai.openai`
`308`	`302`	`],`
`309`	`303`	`"ssl_verify": false`
`310`	`304`	`}`
`311`		`- },`
`312`		`- "upstream": {`
`313`		`- "type": "roundrobin",`
`314`		`- "nodes": {`
`315`		`- "canbeanything.com": 1`
`316`		`- }`
`317`	`305`	`}`
`318`	`306`	`}]]`
`319`	`307`	`)`
Original file line number	Diff line number	Diff line change
`@@ -160,12 +160,6 @@ __DATA__`
`160`	`160`	`],`
`161`	`161`	`"ssl_verify": false`
`162`	`162`	`}`
`163`		`- },`
`164`		`- "upstream": {`
`165`		`- "type": "roundrobin",`
`166`		`- "nodes": {`
`167`		`- "canbeanything.com": 1`
`168`		`- }`
`169`	`163`	`}`
`170`	`164`	`}]]`
`171`	`165`	`)`
`@@ -227,12 +221,6 @@ qr/\{ "content": "1 \+ 1 = 2\.", "role": "assistant" \}/`
`227`	`221`	`],`
`228`	`222`	`"ssl_verify": false`
`229`	`223`	`}`
`230`		`- },`
`231`		`- "upstream": {`
`232`		`- "type": "roundrobin",`
`233`		`- "nodes": {`
`234`		`- "canbeanything.com": 1`
`235`		`- }`
`236`	`224`	`}`
`237`	`225`	`}]]`
`238`	`226`	`)`
Original file line number	Diff line number	Diff line change
`@@ -230,12 +230,6 @@ qr/.*property "provider" validation failed: matches none of the enum values*/`
`230`	`230`	`],`
`231`	`231`	`"ssl_verify": false`
`232`	`232`	`}`
`233`		`- },`
`234`		`- "upstream": {`
`235`		`- "type": "roundrobin",`
`236`		`- "nodes": {`
`237`		`- "canbeanything.com": 1`
`238`		`- }`
`239`	`233`	`}`
`240`	`234`	`}]]`
`241`	`235`	`)`
`@@ -294,12 +288,6 @@ Unauthorized`
`294`	`288`	`],`
`295`	`289`	`"ssl_verify": false`
`296`	`290`	`}`
`297`		`- },`
`298`		`- "upstream": {`
`299`		`- "type": "roundrobin",`
`300`		`- "nodes": {`
`301`		`- "canbeanything.com": 1`
`302`		`- }`
`303`	`291`	`}`
`304`	`292`	`}]]`
`305`	`293`	`)`
`@@ -417,12 +405,6 @@ request format doesn't match schema: property "messages" is required`
`417`	`405`	`],`
`418`	`406`	`"ssl_verify": false`
`419`	`407`	`}`
`420`		`- },`
`421`		`- "upstream": {`
`422`		`- "type": "roundrobin",`
`423`		`- "nodes": {`
`424`		`- "canbeanything.com": 1`
`425`		`- }`
`426`	`408`	`}`
`427`	`409`	`}]]`
`428`	`410`	`)`
`@@ -492,12 +474,6 @@ options_works`
`492`	`474`	`],`
`493`	`475`	`"ssl_verify": false`
`494`	`476`	`}`
`495`		`- },`
`496`		`- "upstream": {`
`497`		`- "type": "roundrobin",`
`498`		`- "nodes": {`
`499`		`- "canbeanything.com": 1`
`500`		`- }`
`501`	`477`	`}`
`502`	`478`	`}]]`
`503`	`479`	`)`
`@@ -567,12 +543,6 @@ path override works`
`567`	`543`	`],`
`568`	`544`	`"ssl_verify": false`
`569`	`545`	`}`
`570`		`- },`
`571`		`- "upstream": {`
`572`		`- "type": "roundrobin",`
`573`		`- "nodes": {`
`574`		`- "canbeanything.com": 1`
`575`		`- }`
`576`	`546`	`}`
`577`	`547`	`}]]`
`578`	`548`	`)`
Original file line number	Diff line number	Diff line change
`@@ -145,12 +145,6 @@ __DATA__`
`145`	`145`	`],`
`146`	`146`	`"ssl_verify": false`
`147`	`147`	`}`
`148`		`- },`
`149`		`- "upstream": {`
`150`		`- "type": "roundrobin",`
`151`		`- "nodes": {`
`152`		`- "canbeanything.com": 1`
`153`		`- }`
`154`	`148`	`}`
`155`	`149`	`}]]`
`156`	`150`	`)`
`@@ -209,12 +203,6 @@ Unauthorized`
`209`	`203`	`],`
`210`	`204`	`"ssl_verify": false`
`211`	`205`	`}`
`212`		`- },`
`213`		`- "upstream": {`
`214`		`- "type": "roundrobin",`
`215`		`- "nodes": {`
`216`		`- "canbeanything.com": 1`
`217`		`- }`
`218`	`206`	`}`
`219`	`207`	`}]]`
`220`	`208`	`)`
`@@ -333,12 +321,6 @@ POST /anything`
`333`	`321`	`],`
`334`	`322`	`"ssl_verify": false`
`335`	`323`	`}`
`336`		`- },`
`337`		`- "upstream": {`
`338`		`- "type": "roundrobin",`
`339`		`- "nodes": {`
`340`		`- "canbeanything.com": 1`
`341`		`- }`
`342`	`324`	`}`
`343`	`325`	`}]]`
`344`	`326`	`)`