RedisAI
diff --git a/src/CMakeLists.txt b/src/CMakeLists.txt
Lines changed: 5 additions & 0 deletions
diff --git a/src/backends/backends.c b/src/backends/backends.c
Lines changed: 10 additions & 10 deletions
diff --git a/src/backends/backends.h b/src/backends/backends.h
Lines changed: 8 additions & 7 deletions
diff --git a/src/backends/onnxruntime.c b/src/backends/onnxruntime.c
Lines changed: 10 additions & 12 deletions
diff --git a/src/backends/onnxruntime.h b/src/backends/onnxruntime.h
Lines changed: 3 additions & 3 deletions
diff --git a/src/backends/tensorflow.c b/src/backends/tensorflow.c
Lines changed: 22 additions & 15 deletions
diff --git a/src/backends/tensorflow.h b/src/backends/tensorflow.h
Lines changed: 3 additions & 3 deletions
@@ -17,8 +17,12 @@ file (GLOB BACKEND_COMMON_SRC
         util/dict.c
         util/dictionaries.c
         redis_ai_objects/tensor.c
+        redis_ai_objects/model.c
+        redis_ai_objects/stats.c
+        redis_ai_objects/script.c
         util/string_utils.c
         execution/utils.c
+        execution/execution_contexts/execution_ctx.c
         serialization/ai_datatypes.c)
 
 ADD_LIBRARY(redisai_obj OBJECT
@@ -41,6 +45,7 @@ ADD_LIBRARY(redisai_obj OBJECT
         execution/DAG/dag_builder.c
         execution/DAG/dag_execute.c
         execution/DAG/dag_op.c
+        execution/execution_contexts/execution_ctx.c
         execution/execution_contexts/modelRun_ctx.c
         execution/execution_contexts/scriptRun_ctx.c
         backends/backends.c
 
@@ -111,8 +111,8 @@ int RAI_LoadBackend_TensorFlow(RedisModuleCtx *ctx, const char *path) {
         return REDISMODULE_ERR;
     }
 
-    backend.model_run =
-        (int (*)(RAI_ModelRunCtx **, RAI_Error *))(unsigned long)dlsym(handle, "RAI_ModelRunTF");
+    backend.model_run = (int (*)(RAI_Model * model, RAI_ExecutionCtx * *ectxs, RAI_Error * error))(
+        unsigned long)dlsym(handle, "RAI_ModelRunTF");
     if (backend.model_run == NULL) {
         dlclose(handle);
         RedisModule_Log(ctx, "warning",
@@ -202,8 +202,8 @@ int RAI_LoadBackend_TFLite(RedisModuleCtx *ctx, const char *path) {
         return REDISMODULE_ERR;
     }
 
-    backend.model_run = (int (*)(RAI_ModelRunCtx **, RAI_Error *))(unsigned long)dlsym(
-        handle, "RAI_ModelRunTFLite");
+    backend.model_run = (int (*)(RAI_Model * model, RAI_ExecutionCtx * *ectxs, RAI_Error * error))(
+        unsigned long)dlsym(handle, "RAI_ModelRunTFLite");
     if (backend.model_run == NULL) {
         dlclose(handle);
         RedisModule_Log(ctx, "warning",
@@ -294,8 +294,8 @@ int RAI_LoadBackend_Torch(RedisModuleCtx *ctx, const char *path) {
         return REDISMODULE_ERR;
     }
 
-    backend.model_run =
-        (int (*)(RAI_ModelRunCtx **, RAI_Error *))(unsigned long)dlsym(handle, "RAI_ModelRunTorch");
+    backend.model_run = (int (*)(RAI_Model * model, RAI_ExecutionCtx * *ectxs, RAI_Error * error))(
+        unsigned long)dlsym(handle, "RAI_ModelRunTorch");
     if (backend.model_run == NULL) {
         dlclose(handle);
         RedisModule_Log(ctx, "warning",
@@ -338,8 +338,8 @@ int RAI_LoadBackend_Torch(RedisModuleCtx *ctx, const char *path) {
         return REDISMODULE_ERR;
     }
 
-    backend.script_run = (int (*)(RAI_ScriptRunCtx *, RAI_Error *))(unsigned long)dlsym(
-        handle, "RAI_ScriptRunTorch");
+    backend.script_run = (int (*)(RAI_Script *, const char *, RAI_ExecutionCtx *, RAI_Error *))(
+        unsigned long)dlsym(handle, "RAI_ScriptRunTorch");
     if (backend.script_run == NULL) {
         dlclose(handle);
         RedisModule_Log(ctx, "warning",
@@ -418,8 +418,8 @@ int RAI_LoadBackend_ONNXRuntime(RedisModuleCtx *ctx, const char *path) {
         return REDISMODULE_ERR;
     }
 
-    backend.model_run =
-        (int (*)(RAI_ModelRunCtx **, RAI_Error *))(unsigned long)dlsym(handle, "RAI_ModelRunORT");
+    backend.model_run = (int (*)(RAI_Model * model, RAI_ExecutionCtx * *ectxs, RAI_Error * error))(
+        unsigned long)dlsym(handle, "RAI_ModelRunORT");
     if (backend.model_run == NULL) {
         dlclose(handle);
         RedisModule_Log(ctx, "warning",
 
@@ -11,8 +11,9 @@
 #include "config/config.h"
 #include "redis_ai_objects/err.h"
 #include "redis_ai_objects/tensor.h"
-#include "redis_ai_objects/model_struct.h"
-#include "redis_ai_objects/script_struct.h"
+#include "redis_ai_objects/model.h"
+#include "redis_ai_objects/script.h"
+#include "execution/execution_contexts/execution_ctx.h"
 
 /*
  * To register a new backend to be loaded by the module, the backend needs to
@@ -25,7 +26,7 @@
  * the RAI_ModelOpts.
  *
  * * ** model_run **:  A callback function pointer that runs a model given the
- * RAI_ModelRunCtx pointer.
+ * RAI_Model pointer and an array of RAI_ExecutionCtx pointers.
  *
  * * ** model_serialize **:  A callback function pointer that serializes a model
  * given the RAI_Model pointer.
@@ -36,7 +37,7 @@
  * the RAI_Script pointer.
  *
  * * ** script_run **:  A callback function pointer that runs a model given the
- * RAI_ScriptRunCtx pointer.
+ * RAI_Script pointer, the function name and an RAI_ExecutionCtx pointer.
  */
 typedef struct RAI_LoadedBackend {
     // ** model_create_with_nodes **:  A callback function pointer that creates a
@@ -55,8 +56,8 @@ typedef struct RAI_LoadedBackend {
     void (*model_free)(RAI_Model *, RAI_Error *);
 
     // ** model_run **:  A callback function pointer that runs a model given the
-    // RAI_ModelRunCtx pointer
-    int (*model_run)(RAI_ModelRunCtx **, RAI_Error *);
+    // RAI_Model pointer and an array of RAI_ExecutionCtx pointers
+    int (*model_run)(RAI_Model *, RAI_ExecutionCtx **, RAI_Error *);
 
     // ** model_serialize **:  A callback function pointer that serializes a model
     // given the RAI_Model pointer
@@ -71,7 +72,7 @@ typedef struct RAI_LoadedBackend {
 
     // ** script_run **:  A callback function pointer that runs a model given the
     // RAI_ScriptRunCtx pointer
-    int (*script_run)(RAI_ScriptRunCtx *, RAI_Error *);
+    int (*script_run)(RAI_Script *, const char *function, RAI_ExecutionCtx *, RAI_Error *);
 
     // Returns the backend version.
     const char *(*get_version)(void);
 
@@ -482,16 +482,16 @@ void RAI_ModelFreeORT(RAI_Model *model, RAI_Error *error) {
     ort->ReleaseStatus(status);
 }
 
-int RAI_ModelRunORT(RAI_ModelRunCtx **mctxs, RAI_Error *error) {
+int RAI_ModelRunORT(RAI_Model *model, RAI_ExecutionCtx **ectxs, RAI_Error *error) {
     const OrtApi *ort = OrtGetApiBase()->GetApi(1);
 
-    OrtSession *session = mctxs[0]->model->session;
+    OrtSession *session = RAI_ModelGetSession(model);
     if (session == NULL) {
         RAI_SetError(error, RAI_EMODELRUN, "ERR ONNXRuntime session was not allocated");
         return REDISMODULE_ERR;
     }
 
-    const size_t nbatches = array_len(mctxs);
+    const size_t nbatches = array_len(ectxs);
     if (nbatches == 0) {
         RAI_SetError(error, RAI_EMODELRUN, "ERR No batches to run");
         return REDISMODULE_ERR;
@@ -500,9 +500,11 @@ int RAI_ModelRunORT(RAI_ModelRunCtx **mctxs, RAI_Error *error) {
     size_t batch_sizes[nbatches];
     size_t batch_offsets[nbatches];
     size_t total_batch_size = 0;
-    if (array_len(mctxs[0]->inputs) > 0) {
+    const size_t ninputs = RAI_ExecutionCtx_NumInputs(ectxs[0]);
+    const size_t noutputs = RAI_ExecutionCtx_NumOutputs(ectxs[0]);
+    if (ninputs > 0) {
         for (size_t b = 0; b < nbatches; ++b) {
-            batch_sizes[b] = RAI_TensorDim(mctxs[b]->inputs[0].tensor, 0);
+            batch_sizes[b] = RAI_TensorDim(RAI_ExecutionCtx_GetInput(ectxs[b], 0), 0);
             total_batch_size += batch_sizes[b];
         }
         batch_offsets[0] = 0;
@@ -512,8 +514,6 @@ int RAI_ModelRunORT(RAI_ModelRunCtx **mctxs, RAI_Error *error) {
     }
 
     OrtStatus *status = NULL;
-    const size_t ninputs = array_len(mctxs[0]->inputs);
-    const size_t noutputs = array_len(mctxs[0]->outputs);
     array_new_on_stack(const char *, 5, input_names);
     array_new_on_stack(const char *, 5, output_names);
     array_new_on_stack(OrtValue *, 5, inputs);
@@ -547,7 +547,7 @@ int RAI_ModelRunORT(RAI_ModelRunCtx **mctxs, RAI_Error *error) {
 
             RAI_Tensor *batched_input_tensors[nbatches];
             for (size_t b = 0; b < nbatches; b++) {
-                batched_input_tensors[b] = mctxs[b]->inputs[i].tensor;
+                batched_input_tensors[b] = RAI_ExecutionCtx_GetInput(ectxs[b], i);
             }
             OrtValue *input;
             if (RAI_OrtValueFromTensors(batched_input_tensors, nbatches, &input, &status) !=
@@ -600,8 +600,7 @@ int RAI_ModelRunORT(RAI_ModelRunCtx **mctxs, RAI_Error *error) {
                         goto error;
                     }
                     if (output_tensor) {
-                        mctxs[b]->outputs[i].tensor = RAI_TensorGetShallowCopy(output_tensor);
-                        RAI_TensorFree(output_tensor);
+                        RAI_ExecutionCtx_SetOutput(ectxs[b], output_tensor, i);
                     } else {
                         RedisModule_Log(NULL, "warning",
                                         "non-tensor output from ONNX models, ignoring (currently "
@@ -614,8 +613,7 @@ int RAI_ModelRunORT(RAI_ModelRunCtx **mctxs, RAI_Error *error) {
                     goto error;
                 }
                 if (output_tensor) {
-                    mctxs[0]->outputs[i].tensor = RAI_TensorGetShallowCopy(output_tensor);
-                    RAI_TensorFree(output_tensor);
+                    RAI_ExecutionCtx_SetOutput(ectxs[0], output_tensor, i);
                 } else {
                     RedisModule_Log(NULL, "warning",
                                     "non-tensor output from ONNX models, ignoring (currently "
 
@@ -2,8 +2,8 @@
 
 #include "config/config.h"
 #include "redis_ai_objects/err.h"
-#include "redis_ai_objects/tensor_struct.h"
-#include "redis_ai_objects/model_struct.h"
+#include "redis_ai_objects/model.h"
+#include "execution/execution_contexts/execution_ctx.h"
 
 unsigned long long RAI_GetMemoryInfoORT(void);
 
@@ -16,7 +16,7 @@ RAI_Model *RAI_ModelCreateORT(RAI_Backend backend, const char *devicestr, RAI_Mo
 
 void RAI_ModelFreeORT(RAI_Model *model, RAI_Error *error);
 
-int RAI_ModelRunORT(RAI_ModelRunCtx **mctxs, RAI_Error *error);
+int RAI_ModelRunORT(RAI_Model *model, RAI_ExecutionCtx **ectxs, RAI_Error *error);
 
 int RAI_ModelSerializeORT(RAI_Model *model, char **buffer, size_t *len, RAI_Error *error);
 
 
@@ -2,6 +2,7 @@
 #include "backends/util.h"
 #include "backends/tensorflow.h"
 #include "util/arr.h"
+#include "execution/execution_contexts/modelRun_ctx.h"
 #include "redis_ai_objects/model.h"
 #include "redis_ai_objects/tensor.h"
 
@@ -461,17 +462,17 @@ void RAI_ModelFreeTF(RAI_Model *model, RAI_Error *error) {
     TF_DeleteStatus(status);
 }
 
-int RAI_ModelRunTF(RAI_ModelRunCtx **mctxs, RAI_Error *error) {
+int RAI_ModelRunTF(RAI_Model *model, RAI_ExecutionCtx **ectxs, RAI_Error *error) {
     TF_Status *status = TF_NewStatus();
 
-    const size_t nbatches = array_len(mctxs);
+    const size_t nbatches = array_len(ectxs);
     if (nbatches == 0) {
         RAI_SetError(error, RAI_EMODELRUN, "ERR No batches to run");
         return 1;
     }
 
-    const size_t ninputs = array_len(mctxs[0]->inputs);
-    const size_t noutputs = array_len(mctxs[0]->outputs);
+    const size_t ninputs = RAI_ExecutionCtx_NumInputs(ectxs[0]);
+    const size_t noutputs = RAI_ExecutionCtx_NumOutputs(ectxs[0]);
     TF_Tensor *inputTensorsValues[ninputs];
     TF_Output inputs[ninputs];
     TF_Tensor *outputTensorsValues[noutputs];
@@ -482,7 +483,7 @@ int RAI_ModelRunTF(RAI_ModelRunCtx **mctxs, RAI_Error *error) {
     size_t total_batch_size = 0;
     if (ninputs > 0) {
         for (size_t b = 0; b < nbatches; ++b) {
-            batch_sizes[b] = RAI_TensorDim(mctxs[b]->inputs[0].tensor, 0);
+            batch_sizes[b] = RAI_TensorDim(RAI_ExecutionCtx_GetInput(ectxs[b], 0), 0);
             total_batch_size += batch_sizes[b];
         }
         batch_offsets[0] = 0;
@@ -491,15 +492,18 @@ int RAI_ModelRunTF(RAI_ModelRunCtx **mctxs, RAI_Error *error) {
         }
     }
 
+    void *tfGraph = RAI_ModelGetModel(model);
+    void *tfSession = RAI_ModelGetSession(model);
+
     for (size_t i = 0; i < ninputs; ++i) {
         RAI_Tensor *batched_input_tensors[nbatches];
 
         for (size_t b = 0; b < nbatches; ++b) {
-            batched_input_tensors[b] = mctxs[b]->inputs[i].tensor;
+            batched_input_tensors[b] = RAI_ExecutionCtx_GetInput(ectxs[b], i);
         }
         inputTensorsValues[i] = RAI_TFTensorFromTensors(batched_input_tensors, nbatches);
         TF_Output port;
-        port.oper = TF_GraphOperationByName(mctxs[0]->model->model, mctxs[0]->inputs[i].name);
+        port.oper = TF_GraphOperationByName(tfGraph, RAI_ModelGetInputName(model, i));
         port.index = 0;
         if (port.oper == NULL) {
             return 1;
@@ -509,17 +513,17 @@ int RAI_ModelRunTF(RAI_ModelRunCtx **mctxs, RAI_Error *error) {
 
     for (size_t i = 0; i < noutputs; ++i) {
         TF_Output port;
-        port.oper = TF_GraphOperationByName(mctxs[0]->model->model, mctxs[0]->outputs[i].name);
+        port.oper = TF_GraphOperationByName(tfGraph, RAI_ModelGetOutputName(model, i));
         port.index = 0;
         if (port.oper == NULL) {
             return 1;
         }
         outputs[i] = port;
     }
 
-    TF_SessionRun(mctxs[0]->model->session, NULL /* run_options */, inputs, inputTensorsValues,
-                  ninputs, outputs, outputTensorsValues, noutputs, NULL /* target_opers */,
-                  0 /* ntargets */, NULL /* run_Metadata */, status);
+    TF_SessionRun(tfSession, NULL /* run_options */, inputs, inputTensorsValues, ninputs, outputs,
+                  outputTensorsValues, noutputs, NULL /* target_opers */, 0 /* ntargets */,
+                  NULL /* run_Metadata */, status);
 
     for (size_t i = 0; i < ninputs; ++i) {
         TF_DeleteTensor(inputTensorsValues[i]);
@@ -547,12 +551,15 @@ int RAI_ModelRunTF(RAI_ModelRunCtx **mctxs, RAI_Error *error) {
             }
 
             for (size_t b = 0; b < nbatches; b++) {
-                mctxs[b]->outputs[i].tensor = RAI_TensorCreateFromTFTensor(
-                    outputTensorsValues[i], batch_offsets[b], batch_sizes[b]);
+                RAI_ExecutionCtx_SetOutput(ectxs[b],
+                                           RAI_TensorCreateFromTFTensor(outputTensorsValues[i],
+                                                                        batch_offsets[b],
+                                                                        batch_sizes[b]),
+                                           i);
             }
         } else {
-            mctxs[0]->outputs[i].tensor =
-                RAI_TensorCreateFromTFTensor(outputTensorsValues[i], 0, -1);
+            RAI_ExecutionCtx_SetOutput(
+                ectxs[0], RAI_TensorCreateFromTFTensor(outputTensorsValues[i], 0, -1), i);
         }
         TF_DeleteTensor(outputTensorsValues[i]);
     }
 
@@ -2,8 +2,8 @@
 
 #include "config/config.h"
 #include "redis_ai_objects/err.h"
-#include "redis_ai_objects/tensor_struct.h"
-#include "redis_ai_objects/model_struct.h"
+#include "redis_ai_objects/model.h"
+#include "execution/execution_contexts/execution_ctx.h"
 
 int RAI_InitBackendTF(int (*get_api_fn)(const char *, void *));
 
@@ -14,7 +14,7 @@ RAI_Model *RAI_ModelCreateTF(RAI_Backend backend, const char *devicestr, RAI_Mod
 
 void RAI_ModelFreeTF(RAI_Model *model, RAI_Error *error);
 
-int RAI_ModelRunTF(RAI_ModelRunCtx **mctxs, RAI_Error *error);
+int RAI_ModelRunTF(RAI_Model *model, RAI_ExecutionCtx **ectxs, RAI_Error *error);
 
 int RAI_ModelSerializeTF(RAI_Model *model, char **buffer, size_t *len, RAI_Error *error);