@@ -10,7 +10,8 @@ using namespace inferences;
1010using json = nlohmann::json;
1111namespace inferences {
1212
13- server::server () {
13+ server::server (std::shared_ptr<services::InferenceService> inference_service)
14+ : inference_svc_(inference_service) {
1415#if defined(_WIN32)
1516 SetDefaultDllDirectories (LOAD_LIBRARY_SEARCH_DEFAULT_DIRS);
1617#endif
@@ -25,7 +26,7 @@ void server::ChatCompletion(
2526 auto json_body = req->getJsonObject ();
2627 bool is_stream = (*json_body).get (" stream" , false ).asBool ();
2728 auto q = std::make_shared<services::SyncQueue>();
28- auto ir = inference_svc_. HandleChatCompletion (q, json_body);
29+ auto ir = inference_svc_-> HandleChatCompletion (q, json_body);
2930 if (ir.has_error ()) {
3031 auto err = ir.error ();
3132 auto resp = cortex_utils::CreateCortexHttpJsonResponse (std::get<1 >(err));
@@ -47,7 +48,7 @@ void server::Embedding(const HttpRequestPtr& req,
4748 std::function<void (const HttpResponsePtr&)>&& callback) {
4849 LOG_TRACE << " Start embedding" ;
4950 auto q = std::make_shared<services::SyncQueue>();
50- auto ir = inference_svc_. HandleEmbedding (q, req->getJsonObject ());
51+ auto ir = inference_svc_-> HandleEmbedding (q, req->getJsonObject ());
5152 if (ir.has_error ()) {
5253 auto err = ir.error ();
5354 auto resp = cortex_utils::CreateCortexHttpJsonResponse (std::get<1 >(err));
@@ -64,7 +65,7 @@ void server::Embedding(const HttpRequestPtr& req,
6465void server::UnloadModel (
6566 const HttpRequestPtr& req,
6667 std::function<void (const HttpResponsePtr&)>&& callback) {
67- auto ir = inference_svc_. UnloadModel (req->getJsonObject ());
68+ auto ir = inference_svc_-> UnloadModel (req->getJsonObject ());
6869 auto resp = cortex_utils::CreateCortexHttpJsonResponse (std::get<1 >(ir));
6970 resp->setStatusCode (
7071 static_cast <HttpStatusCode>(std::get<0 >(ir)[" status_code" ].asInt ()));
@@ -74,7 +75,7 @@ void server::UnloadModel(
7475void server::ModelStatus (
7576 const HttpRequestPtr& req,
7677 std::function<void (const HttpResponsePtr&)>&& callback) {
77- auto ir = inference_svc_. GetModelStatus (req->getJsonObject ());
78+ auto ir = inference_svc_-> GetModelStatus (req->getJsonObject ());
7879 auto resp = cortex_utils::CreateCortexHttpJsonResponse (std::get<1 >(ir));
7980 resp->setStatusCode (
8081 static_cast <HttpStatusCode>(std::get<0 >(ir)[" status_code" ].asInt ()));
@@ -84,7 +85,7 @@ void server::ModelStatus(
8485void server::GetModels (const HttpRequestPtr& req,
8586 std::function<void (const HttpResponsePtr&)>&& callback) {
8687 LOG_TRACE << " Start to get models" ;
87- auto ir = inference_svc_. GetModels (req->getJsonObject ());
88+ auto ir = inference_svc_-> GetModels (req->getJsonObject ());
8889 auto resp = cortex_utils::CreateCortexHttpJsonResponse (std::get<1 >(ir));
8990 resp->setStatusCode (
9091 static_cast <HttpStatusCode>(std::get<0 >(ir)[" status_code" ].asInt ()));
@@ -95,15 +96,15 @@ void server::GetModels(const HttpRequestPtr& req,
9596void server::GetEngines (
9697 const HttpRequestPtr& req,
9798 std::function<void (const HttpResponsePtr&)>&& callback) {
98- auto ir = inference_svc_. GetEngines (req->getJsonObject ());
99+ auto ir = inference_svc_-> GetEngines (req->getJsonObject ());
99100 auto resp = cortex_utils::CreateCortexHttpJsonResponse (ir);
100101 callback (resp);
101102}
102103
103104void server::FineTuning (
104105 const HttpRequestPtr& req,
105106 std::function<void (const HttpResponsePtr&)>&& callback) {
106- auto ir = inference_svc_. FineTuning (req->getJsonObject ());
107+ auto ir = inference_svc_-> FineTuning (req->getJsonObject ());
107108 auto resp = cortex_utils::CreateCortexHttpJsonResponse (std::get<1 >(ir));
108109 resp->setStatusCode (
109110 static_cast <HttpStatusCode>(std::get<0 >(ir)[" status_code" ].asInt ()));
@@ -113,7 +114,7 @@ void server::FineTuning(
113114
114115void server::LoadModel (const HttpRequestPtr& req,
115116 std::function<void (const HttpResponsePtr&)>&& callback) {
116- auto ir = inference_svc_. LoadModel (req->getJsonObject ());
117+ auto ir = inference_svc_-> LoadModel (req->getJsonObject ());
117118 auto resp = cortex_utils::CreateCortexHttpJsonResponse (std::get<1 >(ir));
118119 resp->setStatusCode (
119120 static_cast <HttpStatusCode>(std::get<0 >(ir)[" status_code" ].asInt ()));
@@ -124,7 +125,7 @@ void server::LoadModel(const HttpRequestPtr& req,
124125void server::UnloadEngine (
125126 const HttpRequestPtr& req,
126127 std::function<void (const HttpResponsePtr&)>&& callback) {
127- auto ir = inference_svc_. UnloadEngine (req->getJsonObject ());
128+ auto ir = inference_svc_-> UnloadEngine (req->getJsonObject ());
128129 auto resp = cortex_utils::CreateCortexHttpJsonResponse (std::get<1 >(ir));
129130 resp->setStatusCode (
130131 static_cast <HttpStatusCode>(std::get<0 >(ir)[" status_code" ].asInt ()));
0 commit comments