11#include " inference_service.h"
2+ #include < drogon/HttpTypes.h>
23#include " utils/engine_constants.h"
34#include " utils/function_calling/common.h"
45
56namespace services {
6-
7- namespace {
8- constexpr const int k200OK = 200 ;
9- constexpr const int k400BadRequest = 400 ;
10- constexpr const int k409Conflict = 409 ;
11- constexpr const int k500InternalServerError = 500 ;
12- } // namespace
13-
147cpp::result<void , InferResult> InferenceService::HandleChatCompletion (
158 std::shared_ptr<SyncQueue> q, std::shared_ptr<Json::Value> json_body) {
169 std::string engine_type;
@@ -26,7 +19,7 @@ cpp::result<void, InferResult> InferenceService::HandleChatCompletion(
2619 Json::Value res;
2720 res[" message" ] = " Engine is not loaded yet" ;
2821 Json::Value stt;
29- stt[" status_code" ] = k409Conflict ;
22+ stt[" status_code" ] = drogon::k400BadRequest ;
3023 LOG_WARN << " Engine is not loaded yet" ;
3124 return cpp::fail (std::make_pair (stt, res));
3225 }
@@ -54,9 +47,9 @@ cpp::result<void, InferResult> InferenceService::HandleEmbedding(
5447 auto engine_result = engine_service_->GetLoadedEngine (engine_type);
5548 if (engine_result.has_error ()) {
5649 Json::Value res;
57- res[" message" ] = " Engine is not loaded yet" ;
5850 Json::Value stt;
59- stt[" status_code" ] = k409Conflict;
51+ res[" message" ] = " Engine is not loaded yet" ;
52+ stt[" status_code" ] = drogon::k400BadRequest;
6053 LOG_WARN << " Engine is not loaded yet" ;
6154 return cpp::fail (std::make_pair (stt, res));
6255 }
@@ -84,7 +77,7 @@ InferResult InferenceService::LoadModel(
8477
8578 r[" message" ] = " Could not load engine " + engine_type + " : " +
8679 load_engine_result.error ();
87- stt[" status_code" ] = k500InternalServerError;
80+ stt[" status_code" ] = drogon:: k500InternalServerError;
8881 return std::make_pair (stt, r);
8982 }
9083
@@ -114,7 +107,7 @@ InferResult InferenceService::UnloadModel(
114107 Json::Value res;
115108 res[" message" ] = " Engine is not loaded yet" ;
116109 Json::Value stt;
117- stt[" status_code" ] = k409Conflict ;
110+ stt[" status_code" ] = drogon::k400BadRequest ;
118111 LOG_WARN << " Engine is not loaded yet" ;
119112 return std::make_pair (stt, res);
120113 }
@@ -145,7 +138,7 @@ InferResult InferenceService::GetModelStatus(
145138 Json::Value res;
146139 res[" message" ] = " Engine is not loaded yet" ;
147140 Json::Value stt;
148- stt[" status_code" ] = k409Conflict ;
141+ stt[" status_code" ] = drogon::k400BadRequest ;
149142 LOG_WARN << " Engine is not loaded yet" ;
150143 return std::make_pair (stt, res);
151144 }
@@ -168,7 +161,7 @@ InferResult InferenceService::GetModels(
168161 auto loaded_engines = engine_service_->GetLoadedEngines ();
169162 if (loaded_engines.empty ()) {
170163 r[" message" ] = " No engine is loaded yet" ;
171- stt[" status_code" ] = k400BadRequest;
164+ stt[" status_code" ] = drogon:: k400BadRequest;
172165 return std::make_pair (stt, r);
173166 }
174167
@@ -189,7 +182,7 @@ InferResult InferenceService::GetModels(
189182 Json::Value root;
190183 root[" data" ] = resp_data;
191184 root[" object" ] = " list" ;
192- stt[" status_code" ] = k200OK;
185+ stt[" status_code" ] = drogon:: k200OK;
193186 return std::make_pair (stt, root);
194187}
195188
@@ -215,7 +208,7 @@ InferResult InferenceService::FineTuning(
215208 //
216209 // Json::Value res;
217210 // r["message"] = "Could not load engine " + ne;
218- // stt["status_code"] = k500InternalServerError;
211+ // stt["status_code"] = drogon:: k500InternalServerError;
219212 // return std::make_pair(stt, r);
220213 // }
221214 //
@@ -236,7 +229,7 @@ InferResult InferenceService::FineTuning(
236229 // } else {
237230 // LOG_WARN << "Method is not supported yet";
238231 r[" message" ] = " Method is not supported yet" ;
239- stt[" status_code" ] = k500InternalServerError;
232+ stt[" status_code" ] = drogon:: k500InternalServerError;
240233 // return std::make_pair(stt, r);
241234 // }
242235 // LOG_TRACE << "Done fine-tuning";
0 commit comments