Commit 26e352b

Merge pull request #325 from RedisAI/batching_threading_fix

Refactor batching mechanism, solve threading issue

2 parents 4f2e4c0 + f7e396f

In short: every backend's model_run entry point now takes an array of RAI_ModelRunCtx pointers, one per queued client request, in place of a single context that carried its own batches array; the per-file diffs below are the mechanical fallout of that signature change.

File tree

14 files changed: +114 −195 lines

src/backends.c

Lines changed: 4 additions & 4 deletions
@@ -92,7 +92,7 @@ int RAI_LoadBackend_TensorFlow(RedisModuleCtx *ctx, const char *path) {
     return REDISMODULE_ERR;
   }
 
-  backend.model_run = (int (*)(RAI_ModelRunCtx*, RAI_Error*))
+  backend.model_run = (int (*)(RAI_ModelRunCtx**, RAI_Error*))
     (unsigned long) dlsym(handle, "RAI_ModelRunTF");
   if (backend.model_run == NULL) {
     dlclose(handle);
@@ -157,7 +157,7 @@ int RAI_LoadBackend_TFLite(RedisModuleCtx *ctx, const char *path) {
     return REDISMODULE_ERR;
   }
 
-  backend.model_run = (int (*)(RAI_ModelRunCtx*, RAI_Error*))
+  backend.model_run = (int (*)(RAI_ModelRunCtx**, RAI_Error*))
     (unsigned long) dlsym(handle, "RAI_ModelRunTFLite");
   if (backend.model_run == NULL) {
     dlclose(handle);
@@ -222,7 +222,7 @@ int RAI_LoadBackend_Torch(RedisModuleCtx *ctx, const char *path) {
     return REDISMODULE_ERR;
   }
 
-  backend.model_run = (int (*)(RAI_ModelRunCtx*, RAI_Error*))
+  backend.model_run = (int (*)(RAI_ModelRunCtx**, RAI_Error*))
     (unsigned long) dlsym(handle, "RAI_ModelRunTorch");
   if (backend.model_run == NULL) {
     dlclose(handle);
@@ -311,7 +311,7 @@ int RAI_LoadBackend_ONNXRuntime(RedisModuleCtx *ctx, const char *path) {
     return REDISMODULE_ERR;
   }
 
-  backend.model_run = (int (*)(RAI_ModelRunCtx*, RAI_Error*))
+  backend.model_run = (int (*)(RAI_ModelRunCtx**, RAI_Error*))
     (unsigned long) dlsym(handle, "RAI_ModelRunORT");
   if (backend.model_run == NULL) {
     dlclose(handle);
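The cast is the only change in all four loaders: the symbol resolved via dlsym now has the batched signature. A minimal sketch of what a caller of the new vtable entry might look like, assuming the repo's arr.h growable-array helpers (array_new/array_append) and a RAI_ModelRunCtxCreate constructor; none of these caller-side lines appear in this commit:

    /* Hypothetical caller-side sketch; not code from this commit. */
    RAI_ModelRunCtx **mctxs = array_new(RAI_ModelRunCtx *, 2);
    mctxs = array_append(mctxs, RAI_ModelRunCtxCreate(model));  /* request A */
    mctxs = array_append(mctxs, RAI_ModelRunCtxCreate(model));  /* request B */

    RAI_Error err = {0};
    if (backend.model_run(mctxs, &err) != 0) {
        /* each backend returns 1 and sets err on failure */
    }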

src/backends.h

Lines changed: 1 addition & 1 deletion
@@ -14,7 +14,7 @@ typedef struct RAI_LoadedBackend {
   RAI_Model* (*model_create)(RAI_Backend, const char*, RAI_ModelOpts,
                              const char*, size_t, RAI_Error*);
   void (*model_free)(RAI_Model*, RAI_Error*);
-  int (*model_run)(RAI_ModelRunCtx*, RAI_Error*);
+  int (*model_run)(RAI_ModelRunCtx**, RAI_Error*);
   int (*model_serialize)(RAI_Model*, char**, size_t*, RAI_Error*);
 
   RAI_Script* (*script_create)(const char*, const char*, RAI_Error*);
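One line in the header, but it inverts the data layout every backend walks. A comment-style sketch of the shift, reconstructed from the call sites in the .c files below:

    /* Before: a single ctx owned the batches.
     *   mctx->batches[b].inputs[i].tensor
     * After: each queued request keeps its own ctx; the backend receives
     * the whole array and reads its length with array_len(mctxs).
     *   mctxs[b]->inputs[i].tensor
     */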

src/backends/onnxruntime.c

Lines changed: 9 additions & 9 deletions
@@ -401,28 +401,28 @@ void RAI_ModelFreeORT(RAI_Model* model, RAI_Error* error) {
   model->session = NULL;
 }
 
-int RAI_ModelRunORT(RAI_ModelRunCtx *mctx, RAI_Error *error)
+int RAI_ModelRunORT(RAI_ModelRunCtx **mctxs, RAI_Error *error)
 {
   const OrtApi* ort = OrtGetApiBase()->GetApi(1);
 
-  OrtSession *session = mctx->model->session;
+  OrtSession *session = mctxs[0]->model->session;
 
   if (session == NULL) {
     RAI_SetError(error, RAI_EMODELRUN, "ERR ONNXRuntime session was not allocated");
     return 1;
   }
 
-  const size_t nbatches = array_len(mctx->batches);
+  const size_t nbatches = array_len(mctxs);
   if (nbatches == 0) {
     RAI_SetError(error, RAI_EMODELRUN, "ERR No batches to run");
     return 1;
   }
 
   size_t batch_sizes[nbatches];
   size_t batch_offsets[nbatches];
-  if (array_len(mctx->batches[0].inputs) > 0) {
+  if (array_len(mctxs[0]->inputs) > 0) {
     for (size_t b=0; b<nbatches; ++b) {
-      batch_sizes[b] = RAI_TensorDim(mctx->batches[b].inputs[0].tensor, 0);
+      batch_sizes[b] = RAI_TensorDim(mctxs[b]->inputs[0].tensor, 0);
     }
     batch_offsets[0] = 0;
     for (size_t b=1; b<nbatches; ++b) {
@@ -457,8 +457,8 @@ int RAI_ModelRunORT(RAI_ModelRunCtx *mctx, RAI_Error *error)
   OrtValue *inputs[n_input_nodes];
   OrtValue *outputs[n_output_nodes];
 
-  const size_t ninputs = array_len(mctx->batches[0].inputs);
-  const size_t noutputs = array_len(mctx->batches[0].outputs);
+  const size_t ninputs = array_len(mctxs[0]->inputs);
+  const size_t noutputs = array_len(mctxs[0]->outputs);
 
   if (ninputs != n_input_nodes) {
     char msg[70];
@@ -485,7 +485,7 @@ int RAI_ModelRunORT(RAI_ModelRunCtx *mctx, RAI_Error *error)
 
     RAI_Tensor* batched_input_tensors[nbatches];
     for (size_t b=0; b<nbatches; b++) {
-      batched_input_tensors[b] = mctx->batches[b].inputs[i].tensor;
+      batched_input_tensors[b] = mctxs[b]->inputs[i].tensor;
     }
 
     inputs[i] = RAI_OrtValueFromTensors(batched_input_tensors, nbatches, error);
@@ -545,7 +545,7 @@ int RAI_ModelRunORT(RAI_ModelRunCtx *mctx, RAI_Error *error)
       return 1;
     }
     if (output_tensor) {
-      mctx->batches[b].outputs[i].tensor = RAI_TensorGetShallowCopy(output_tensor);
+      mctxs[b]->outputs[i].tensor = RAI_TensorGetShallowCopy(output_tensor);
       RAI_TensorFree(output_tensor);
     }
     else {
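These hunks carry the heart of the refactor's bookkeeping: batch_sizes[b] is read from dim 0 of request b's first input tensor, and batch_offsets is its exclusive prefix sum, used later to carve the single concatenated output back into per-request slices. A standalone toy of that computation, with made-up sizes (not RedisAI code):

    #include <stdio.h>

    int main(void) {
        size_t batch_sizes[] = {4, 1, 3};  /* dim 0 of each request's first input */
        size_t nbatches = sizeof(batch_sizes) / sizeof(batch_sizes[0]);
        size_t batch_offsets[3];

        /* exclusive prefix sum, exactly as in the hunks above */
        batch_offsets[0] = 0;
        for (size_t b = 1; b < nbatches; ++b)
            batch_offsets[b] = batch_offsets[b - 1] + batch_sizes[b - 1];

        /* request b's rows occupy [offset, offset + size) in the concatenated tensor */
        for (size_t b = 0; b < nbatches; ++b)
            printf("request %zu: rows [%zu, %zu)\n",
                   b, batch_offsets[b], batch_offsets[b] + batch_sizes[b]);
        return 0;
    }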

src/backends/onnxruntime.h

Lines changed: 1 addition & 1 deletion
@@ -14,7 +14,7 @@ RAI_Model *RAI_ModelCreateORT(RAI_Backend backend, const char* devicestr, RAI_M
 
 void RAI_ModelFreeORT(RAI_Model *model, RAI_Error *error);
 
-int RAI_ModelRunORT(RAI_ModelRunCtx *mctx, RAI_Error *error);
+int RAI_ModelRunORT(RAI_ModelRunCtx **mctxs, RAI_Error *error);
 
 int RAI_ModelSerializeORT(RAI_Model *model, char **buffer, size_t *len, RAI_Error *error);

src/backends/tensorflow.c

Lines changed: 11 additions & 11 deletions
@@ -419,27 +419,27 @@ void RAI_ModelFreeTF(RAI_Model* model, RAI_Error* error) {
   TF_DeleteStatus(status);
 }
 
-int RAI_ModelRunTF(RAI_ModelRunCtx* mctx, RAI_Error *error) {
+int RAI_ModelRunTF(RAI_ModelRunCtx** mctxs, RAI_Error *error) {
   TF_Status *status = TF_NewStatus();
 
-  const size_t nbatches = array_len(mctx->batches);
+  const size_t nbatches = array_len(mctxs);
   if (nbatches == 0) {
     RAI_SetError(error, RAI_EMODELRUN, "ERR No batches to run");
     return 1;
   }
 
-  const size_t ninputs = array_len(mctx->batches[0].inputs);
-  const size_t noutputs = array_len(mctx->batches[0].outputs);
+  const size_t ninputs = array_len(mctxs[0]->inputs);
+  const size_t noutputs = array_len(mctxs[0]->outputs);
   TF_Tensor* inputTensorsValues[ninputs];
   TF_Output inputs[ninputs];
   TF_Tensor* outputTensorsValues[noutputs];
   TF_Output outputs[noutputs];
 
   size_t batch_sizes[nbatches];
   size_t batch_offsets[nbatches];
-  if (array_len(mctx->batches[0].inputs) > 0) {
+  if (array_len(mctxs[0]->inputs) > 0) {
     for (size_t b=0; b<nbatches; ++b) {
-      batch_sizes[b] = RAI_TensorDim(mctx->batches[b].inputs[0].tensor, 0);
+      batch_sizes[b] = RAI_TensorDim(mctxs[b]->inputs[0].tensor, 0);
     }
     batch_offsets[0] = 0;
     for (size_t b=1; b<nbatches; ++b) {
@@ -451,12 +451,12 @@ int RAI_ModelRunTF(RAI_ModelRunCtx* mctx, RAI_Error *error) {
     RAI_Tensor* batched_input_tensors[nbatches];
 
     for (size_t b=0; b<nbatches; ++b) {
-      batched_input_tensors[b] = mctx->batches[b].inputs[i].tensor;
+      batched_input_tensors[b] = mctxs[b]->inputs[i].tensor;
     }
     // inputTensorsValues[i] = RAI_TFTensorFromTensor(mctx->inputs[i].tensor);
     inputTensorsValues[i] = RAI_TFTensorFromTensors(batched_input_tensors, nbatches);
     TF_Output port;
-    port.oper = TF_GraphOperationByName(mctx->model->model, mctx->batches[0].inputs[i].name);
+    port.oper = TF_GraphOperationByName(mctxs[0]->model->model, mctxs[0]->inputs[i].name);
     port.index = 0;
     if(port.oper == NULL){
       return 1;
@@ -466,15 +466,15 @@ int RAI_ModelRunTF(RAI_ModelRunCtx* mctx, RAI_Error *error) {
 
   for (size_t i=0 ; i<noutputs; ++i) {
     TF_Output port;
-    port.oper = TF_GraphOperationByName(mctx->model->model, mctx->batches[0].outputs[i].name);
+    port.oper = TF_GraphOperationByName(mctxs[0]->model->model, mctxs[0]->outputs[i].name);
     port.index = 0;
     if(port.oper == NULL){
       return 1;
     }
     outputs[i] = port;
   }
 
-  TF_SessionRun(mctx->model->session, NULL /* run_options */,
+  TF_SessionRun(mctxs[0]->model->session, NULL /* run_options */,
                 inputs, inputTensorsValues, ninputs,
                 outputs, outputTensorsValues, noutputs,
                 NULL /* target_opers */, 0 /* ntargets */,
@@ -496,7 +496,7 @@ int RAI_ModelRunTF(RAI_ModelRunCtx* mctx, RAI_Error *error) {
   for(size_t i=0; i<noutputs; ++i) {
     for (size_t b=0; b<nbatches; b++) {
       RAI_Tensor* output_tensor = RAI_TensorCreateFromTFTensor(outputTensorsValues[i], batch_offsets[b], batch_sizes[b]);
-      mctx->batches[b].outputs[i].tensor = RAI_TensorGetShallowCopy(output_tensor);
+      mctxs[b]->outputs[i].tensor = RAI_TensorGetShallowCopy(output_tensor);
       RAI_TensorFree(output_tensor);
     }
     TF_DeleteTensor(outputTensorsValues[i]);
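Note that TF_SessionRun is now driven off mctxs[0] for both graph and session, presumably safe because only requests against the same model get batched together. The routine's overall shape is gather, run once, scatter; here is a self-contained toy of just that data movement (plain C, nothing here is RedisAI or TensorFlow code):

    #include <stdio.h>
    #include <string.h>

    int main(void) {
        float req_a[2][3] = {{1,2,3},{4,5,6}};   /* request A: batch of 2 rows */
        float req_b[1][3] = {{7,8,9}};           /* request B: batch of 1 row  */

        /* gather: stack both requests along dim 0 (offsets {0, 2}, sizes {2, 1}) */
        float stacked[3][3];
        memcpy(stacked[0], req_a, sizeof(req_a));
        memcpy(stacked[2], req_b, sizeof(req_b));

        /* ... a single model run over `stacked` would happen here ... */

        /* scatter: slice the result back per request using the same offsets */
        float *out_a = stacked[0], *out_b = stacked[2];
        printf("A row0 first=%g, B row0 first=%g\n", out_a[0], out_b[0]);
        return 0;
    }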

src/backends/tensorflow.h

Lines changed: 1 addition & 1 deletion
@@ -16,7 +16,7 @@ RAI_Model *RAI_ModelCreateTF(RAI_Backend backend, const char* devicestr, RAI_Mod
 
 void RAI_ModelFreeTF(RAI_Model *model, RAI_Error *error);
 
-int RAI_ModelRunTF(RAI_ModelRunCtx *mctx, RAI_Error *error);
+int RAI_ModelRunTF(RAI_ModelRunCtx **mctxs, RAI_Error *error);
 
 int RAI_ModelSerializeTF(RAI_Model *model, char **buffer, size_t *len, RAI_Error *error);
2222

src/backends/tflite.c

Lines changed: 11 additions & 11 deletions
@@ -82,16 +82,16 @@ void RAI_ModelFreeTFLite(RAI_Model* model, RAI_Error *error) {
   model->model = NULL;
 }
 
-int RAI_ModelRunTFLite(RAI_ModelRunCtx* mctx, RAI_Error *error) {
+int RAI_ModelRunTFLite(RAI_ModelRunCtx** mctxs, RAI_Error *error) {
 
-  const size_t nbatches = array_len(mctx->batches);
+  const size_t nbatches = array_len(mctxs);
   if (nbatches == 0) {
     RAI_SetError(error, RAI_EMODELRUN, "ERR No batches to run");
     return 1;
   }
 
-  const size_t ninputs = array_len(mctx->batches[0].inputs);
-  const size_t noutputs = array_len(mctx->batches[0].outputs);
+  const size_t ninputs = array_len(mctxs[0]->inputs);
+  const size_t noutputs = array_len(mctxs[0]->outputs);
 
   RAI_Tensor* inputs[ninputs];
 
@@ -103,9 +103,9 @@ int RAI_ModelRunTFLite(RAI_ModelRunCtx* mctx, RAI_Error *error) {
   size_t total_batch_size = 0;
 
   if (nbatches > 1) {
-    if (array_len(mctx->batches[0].inputs) > 0) {
+    if (array_len(mctxs[0]->inputs) > 0) {
       for (size_t b=0; b<nbatches; ++b) {
-        batch_sizes[b] = RAI_TensorDim(mctx->batches[b].inputs[0].tensor, 0);
+        batch_sizes[b] = RAI_TensorDim(mctxs[b]->inputs[0].tensor, 0);
         total_batch_size += batch_sizes[b];
       }
       batch_offsets[0] = 0;
@@ -118,7 +118,7 @@ int RAI_ModelRunTFLite(RAI_ModelRunCtx* mctx, RAI_Error *error) {
       RAI_Tensor* batch[nbatches];
 
       for (size_t b=0; b<nbatches; b++) {
-        batch[b] = mctx->batches[b].inputs[i].tensor;
+        batch[b] = mctxs[b]->inputs[i].tensor;
      }
 
      inputs[i] = RAI_TensorCreateByConcatenatingTensors(batch, nbatches);
@@ -127,7 +127,7 @@ int RAI_ModelRunTFLite(RAI_ModelRunCtx* mctx, RAI_Error *error) {
   }
   else {
     for (size_t i=0 ; i<ninputs; ++i) {
-      inputs[i] = RAI_TensorGetShallowCopy(mctx->batches[0].inputs[i].tensor);
+      inputs[i] = RAI_TensorGetShallowCopy(mctxs[0]->inputs[i].tensor);
       inputs_dl[i] = &inputs[i]->tensor;
     }
   }
@@ -137,7 +137,7 @@ int RAI_ModelRunTFLite(RAI_ModelRunCtx* mctx, RAI_Error *error) {
   }
 
   char* error_descr = NULL;
-  tfliteRunModel(mctx->model->model,
+  tfliteRunModel(mctxs[0]->model->model,
                  ninputs, inputs_dl, noutputs, outputs_dl,
                  &error_descr, RedisModule_Alloc);
 
@@ -160,11 +160,11 @@ int RAI_ModelRunTFLite(RAI_ModelRunCtx* mctx, RAI_Error *error) {
     }
     if (nbatches > 1) {
       for (size_t b=0; b<nbatches; b++) {
-        mctx->batches[b].outputs[i].tensor = RAI_TensorCreateBySlicingTensor(output_tensor, batch_offsets[b], batch_sizes[b]);
+        mctxs[b]->outputs[i].tensor = RAI_TensorCreateBySlicingTensor(output_tensor, batch_offsets[b], batch_sizes[b]);
      }
    }
    else {
-      mctx->batches[0].outputs[i].tensor = RAI_TensorGetShallowCopy(output_tensor);
+      mctxs[0]->outputs[i].tensor = RAI_TensorGetShallowCopy(output_tensor);
    }
    RAI_TensorFree(output_tensor);
    RedisModule_Free(outputs_dl[i]);
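Both output branches end in the same ownership dance: create output_tensor, store a shallow copy into each run ctx, then free the backend's local reference. The create/copy/free sequence suggests these helpers are refcount-based, though this commit does not show their implementation; a toy model of that contract (illustrative types, not RedisAI code):

    #include <stdio.h>
    #include <stdlib.h>

    typedef struct { int refcount; float *data; } Tensor;

    static Tensor *tensor_new(void) {
        Tensor *t = calloc(1, sizeof(*t));
        t->refcount = 1;                    /* creator owns one reference */
        return t;
    }
    static Tensor *shallow_copy(Tensor *t) { t->refcount++; return t; }
    static void tensor_free(Tensor *t) {
        if (--t->refcount == 0) { free(t->data); free(t); }
    }

    int main(void) {
        Tensor *output_tensor = tensor_new();          /* backend's reference   */
        Tensor *stored = shallow_copy(output_tensor);  /* run ctx takes a ref   */
        tensor_free(output_tensor);                    /* backend drops its ref */
        printf("ctx still holds a live tensor: refcount=%d\n", stored->refcount);
        tensor_free(stored);                           /* ctx teardown          */
        return 0;
    }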

src/backends/tflite.h

Lines changed: 1 addition & 1 deletion
@@ -14,7 +14,7 @@ RAI_Model *RAI_ModelCreateTFLite(RAI_Backend backend, const char* devicestr, RAI
 
 void RAI_ModelFreeTFLite(RAI_Model *model, RAI_Error *error);
 
-int RAI_ModelRunTFLite(RAI_ModelRunCtx *mctx, RAI_Error *error);
+int RAI_ModelRunTFLite(RAI_ModelRunCtx **mctxs, RAI_Error *error);
 
 int RAI_ModelSerializeTFLite(RAI_Model *model, char **buffer, size_t *len, RAI_Error *error);

src/backends/torch.c

Lines changed: 11 additions & 11 deletions
@@ -68,15 +68,15 @@ void RAI_ModelFreeTorch(RAI_Model* model, RAI_Error *error) {
   torchDeallocContext(model->model);
 }
 
-int RAI_ModelRunTorch(RAI_ModelRunCtx* mctx, RAI_Error *error) {
-  const size_t nbatches = array_len(mctx->batches);
+int RAI_ModelRunTorch(RAI_ModelRunCtx** mctxs, RAI_Error *error) {
+  const size_t nbatches = array_len(mctxs);
   if (nbatches == 0) {
     RAI_SetError(error, RAI_EMODELRUN, "ERR No batches to run");
     return 1;
   }
 
-  const size_t ninputs = array_len(mctx->batches[0].inputs);
-  const size_t noutputs = array_len(mctx->batches[0].outputs);
+  const size_t ninputs = array_len(mctxs[0]->inputs);
+  const size_t noutputs = array_len(mctxs[0]->outputs);
 
   RAI_Tensor* inputs[ninputs];
 
@@ -88,9 +88,9 @@ int RAI_ModelRunTorch(RAI_ModelRunCtx* mctx, RAI_Error *error) {
 
   if (nbatches > 1) {
     size_t total_batch_size = 0;
-    if (array_len(mctx->batches[0].inputs) > 0) {
+    if (array_len(mctxs[0]->inputs) > 0) {
       for (size_t b=0; b<nbatches; ++b) {
-        batch_sizes[b] = RAI_TensorDim(mctx->batches[b].inputs[0].tensor, 0);
+        batch_sizes[b] = RAI_TensorDim(mctxs[b]->inputs[0].tensor, 0);
         total_batch_size += batch_sizes[b];
       }
       batch_offsets[0] = 0;
@@ -103,7 +103,7 @@ int RAI_ModelRunTorch(RAI_ModelRunCtx* mctx, RAI_Error *error) {
       RAI_Tensor* batch[nbatches];
 
       for (size_t b=0; b<nbatches; b++) {
-        batch[b] = mctx->batches[b].inputs[i].tensor;
+        batch[b] = mctxs[b]->inputs[i].tensor;
      }
 
      inputs[i] = RAI_TensorCreateByConcatenatingTensors(batch, nbatches);
@@ -112,7 +112,7 @@ int RAI_ModelRunTorch(RAI_ModelRunCtx* mctx, RAI_Error *error) {
   }
   else {
     for (size_t i=0 ; i<ninputs; ++i) {
-      inputs[i] = RAI_TensorGetShallowCopy(mctx->batches[0].inputs[i].tensor);
+      inputs[i] = RAI_TensorGetShallowCopy(mctxs[0]->inputs[i].tensor);
       inputs_dl[i] = &inputs[i]->tensor;
     }
   }
@@ -122,7 +122,7 @@ int RAI_ModelRunTorch(RAI_ModelRunCtx* mctx, RAI_Error *error) {
   }
 
   char* error_descr = NULL;
-  torchRunModel(mctx->model->model,
+  torchRunModel(mctxs[0]->model->model,
                 ninputs, inputs_dl, noutputs, outputs_dl,
                 &error_descr, RedisModule_Alloc);
 
@@ -140,11 +140,11 @@ int RAI_ModelRunTorch(RAI_ModelRunCtx* mctx, RAI_Error *error) {
    RAI_Tensor* output_tensor = RAI_TensorCreateFromDLTensor(outputs_dl[i]);
    if (nbatches > 1) {
      for (size_t b=0; b<nbatches; b++) {
-       mctx->batches[b].outputs[i].tensor = RAI_TensorCreateBySlicingTensor(output_tensor, batch_offsets[b], batch_sizes[b]);
+       mctxs[b]->outputs[i].tensor = RAI_TensorCreateBySlicingTensor(output_tensor, batch_offsets[b], batch_sizes[b]);
      }
    }
    else {
-     mctx->batches[0].outputs[i].tensor = RAI_TensorGetShallowCopy(output_tensor);
+     mctxs[0]->outputs[i].tensor = RAI_TensorGetShallowCopy(output_tensor);
    }
    RAI_TensorFree(output_tensor);
 }
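torch.c receives the identical treatment to tflite.c: a fast path that shallow-copies a lone request's tensors straight through, and a concatenate/slice path for real batches. Reduced to control flow (only the branch structure comes from the diffs above; everything else is illustrative):

    #include <stdio.h>

    /* Minimal shape of the shared TFLite/Torch run loop. */
    static void run_batched(size_t nbatches) {
        if (nbatches > 1) {
            /* gather: concatenate each request's inputs along dim 0,
             * run the model once, then slice outputs back per request
             * using batch_offsets/batch_sizes */
            printf("%zu requests: concatenate, run once, slice\n", nbatches);
        } else {
            /* fast path: shallow-copy the single request's tensors through */
            printf("1 request: no concatenation needed\n");
        }
    }

    int main(void) {
        run_batched(1);
        run_batched(3);
        return 0;
    }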

src/backends/torch.h

Lines changed: 1 addition & 1 deletion
@@ -15,7 +15,7 @@ RAI_Model *RAI_ModelCreateTorch(RAI_Backend backend, const char* devicestr, RAI_
 
 void RAI_ModelFreeTorch(RAI_Model *model, RAI_Error *error);
 
-int RAI_ModelRunTorch(RAI_ModelRunCtx *mctx, RAI_Error *error);
+int RAI_ModelRunTorch(RAI_ModelRunCtx **mctxs, RAI_Error *error);
 
 int RAI_ModelSerializeTorch(RAI_Model *model, char **buffer, size_t *len, RAI_Error *error);
