gizatechxyz · canacechan · Mar 27, 2024 · Mar 28, 2024 · Mar 31, 2024 · Apr 1, 2024
diff --git a/docgen/src/main.rs b/docgen/src/main.rs
@@ -59,6 +59,14 @@ fn main() {
     doc_trait(trait_path, doc_path, label);
     doc_functions(trait_path, doc_path, trait_name, label);
 
+    // TREE ENSEMBLE DOC
+    let trait_path = "src/operators/ml/tree_ensemble/tree_ensemble.cairo";
+    let doc_path = "docs/framework/operators/machine-learning/tree-ensemble";
+    let label = "tree_ensemble";
+    let trait_name: &str = "TreeEnsembleTrait";
+    doc_trait(trait_path, doc_path, label);
+    doc_functions(trait_path, doc_path, trait_name, label);
+
     // LINEAR REGRESSOR DOC
     let trait_path = "src/operators/ml/linear/linear_regressor.cairo";
     let doc_path = "docs/framework/operators/machine-learning/linear-regressor";

diff --git a/docs/framework/operators/machine-learning/tree-ensemble/README.md b/docs/framework/operators/machine-learning/tree-ensemble/README.md
@@ -0,0 +1,22 @@
+# Tree Ensemble 
+
+`TreeEnsembleTrait` provides a trait definition for tree ensemble problem.
+
+```rust
+use orion::operators::ml::TreeEnsembleTrait;
+```
+
+### Data types
+
+Orion supports currently only fixed point data types for `TreeEnsembleTrait`.
+
+| Data type            | dtype                                                         |
+| -------------------- | ------------------------------------------------------------- |
+| Fixed point (signed) | `TreeEnsembleTrait<FP8x23 \| FP16x16 \| FP64x64 \| FP32x32>` |
+
+
+***
+
+| function | description |
+| --- | --- |
+| [`tree_ensemble.predict`](tree_ensemble.predict.md) | Returns the regressed values for each input in a batch. |
diff --git a/docs/framework/operators/machine-learning/tree-ensemble/tree_ensemble.predict.md b/docs/framework/operators/machine-learning/tree-ensemble/tree_ensemble.predict.md
@@ -0,0 +1,139 @@
+# TreeEnsemble::predict
+
+```rust 
+   fn predict(X: @Tensor<T>,
+                  nodes_splits: Tensor<T>,
+                  nodes_featureids: Span<usize>,
+                  nodes_modes: Span<MODE>,
+                  nodes_truenodeids: Span<usize>,
+                  nodes_falsenodeids: Span<usize>,
+                  nodes_trueleafs: Span<usize>,
+                  nodes_falseleafs: Span<usize>,
+                  leaf_targetids: Span<usize>,
+                  leaf_weights: Tensor<T>,
+                  tree_roots: Span<usize>,
+                  post_transform: POST_TRANSFORM,
+                  aggregate_function: AGGREGATE_FUNCTION,
+                  nodes_hitrates: Option<Tensor<T>>,
+                  nodes_missing_value_tracks_true: Option<Span<usize>>,
+                  membership_values: Option<Tensor<T>>,
+                  n_targets: usize
+              ) -> MutMatrix::<T>;
+```
+
+Tree Ensemble operator. Returns the regressed values for each input in a batch. Inputs have dimensions [N, F] where N is the input batch size and F is the number of input features. Outputs have dimensions [N, num_targets] where N is the batch size and num_targets is the number of targets, which is a configurable attribute.
+
+## Args
+
+* `X`:  Input 2D tensor.
+* `nodes_splits`: Thresholds to do the splitting on for each node with mode that is not 'BRANCH_MEMBER'.
+* `nodes_featureids`: Feature id for each node.
+* `nodes_modes`: The comparison operation performed by the node. This is encoded as an enumeration of 'NODE_MODE::LEQ', 'NODE_MODE::LT', 'NODE_MODE::GTE', 'NODE_MODE::GT', 'NODE_MODE::EQ', 'NODE_MODE::NEQ', and 'NODE_MODE::MEMBER'
+* `nodes_truenodeids`: If `nodes_trueleafs` is 0 (false) at an entry, this represents the position of the true branch node. 
+* `nodes_falsenodeids`: If `nodes_falseleafs` is 0 (false) at an entry, this represents the position of the false branch node.
+* `nodes_trueleafs`: 1 if true branch is leaf for each node and 0 an interior node.
+* `nodes_falseleafs`: 1 if true branch is leaf for each node and 0 an interior node.
+* `leaf_targetids`: The index of the target that this leaf contributes to (this must be in range `[0, n_targets)`).
+* `leaf_weights`: The weight for each leaf.
+* `tree_roots`: Index into `nodes_*` for the root of each tree. The tree structure is derived from the branching of each node.
+* `post_transform`: Indicates the transform to apply to the score.One of 'POST_TRANSFORM::NONE', 'POST_TRANSFORM::SOFTMAX', 'POST_TRANSFORM::LOGISTIC', 'POST_TRANSFORM::SOFTMAX_ZERO'  or 'POST_TRANSFORM::PROBIT' ,
+* `aggregate_function`: Defines how to aggregate leaf values within a target. One of 'AGGREGATE_FUNCTION::AVERAGE', 'AGGREGATE_FUNCTION::SUM', 'AGGREGATE_FUNCTION::MIN', 'AGGREGATE_FUNCTION::MAX` defaults to 'AGGREGATE_FUNCTION::SUM' 
+* `nodes_hitrates`: Popularity of each node, used for performance and may be omitted.
+* `nodes_missing_value_tracks_true`: For each node, define whether to follow the true branch (if attribute value is 1) or false branch (if attribute value is 0) in the presence of a NaN input feature. This attribute may be left undefined and the default value is false (0) for all nodes.
+* `membership_values`: Members to test membership of for each set membership node. List all of the members to test again in the order that the 'BRANCH_MEMBER' mode appears in `node_modes`, delimited by `NaN`s. Will have the same number of sets of values as nodes with mode 'BRANCH_MEMBER'. This may be omitted if the node doesn't contain any 'BRANCH_MEMBER' nodes.
+* `n_targets`: The total number of targets.
+
+
+## Returns
+
+* Output of shape [Batch Size, Number of targets]
+
+## Type Constraints
+
+`TreeEnsembleClassifier` and `X` must be fixed points
+
+## Examples
+
+```rust
+use orion::numbers::FP16x16;
+use orion::operators::tensor::{Tensor, TensorTrait, FP16x16Tensor, U32Tensor};
+use orion::operators::ml::{TreeEnsembleTrait,POST_TRANSFORM, AGGREGATE_FUNCTION, NODE_MODE};
+use orion::operators::matrix::{MutMatrix, MutMatrixImpl};
+use orion::numbers::NumberTrait;
+
+fn example_tree_ensemble_one_tree() ->  MutMatrix::<FP16x16> {
+    let mut shape = ArrayTrait::<usize>::new();
+    shape.append(3);
+    shape.append(2);
+
+    let mut data = ArrayTrait::new();
+    data.append(FP16x16 { mag: 78643, sign: false });
+    data.append(FP16x16 { mag: 222822, sign: false });
+    data.append(FP16x16 { mag: 7864, sign: true });
+    data.append(FP16x16 { mag: 108789, sign: false });
+    data.append(FP16x16 { mag: 271319, sign: false });
+    data.append(FP16x16 { mag: 115998, sign: false });
+    let mut X = TensorTrait::new(shape.span(), data.span());
+
+    let mut shape = ArrayTrait::<usize>::new();
+    shape.append(4);
+
+    let mut data = ArrayTrait::new();
+    data.append(FP16x16 { mag: 342753, sign: false });
+    data.append(FP16x16 { mag: 794296, sign: false });
+    data.append(FP16x16 { mag: 801505, sign: true });
+    data.append(FP16x16 { mag: 472514, sign: false });
+    let leaf_weights = TensorTrait::new(shape.span(), data.span());
+
+    let mut shape = ArrayTrait::<usize>::new();
+    shape.append(3);
+
+    let mut data = ArrayTrait::new();
+    data.append(FP16x16 { mag: 205783, sign: false });
+    data.append(FP16x16 { mag: 78643, sign: false });
+    data.append(FP16x16 { mag: 275251, sign: false });
+    let nodes_splits = TensorTrait::new(shape.span(), data.span());
+
+    let membership_values = Option::None;
+
+    let n_targets = 2;
+    let aggregate_function = AGGREGATE_FUNCTION::SUM;
+    let nodes_missing_value_tracks_true = Option::None;
+    let nodes_hitrates = Option::None;
+    let post_transform = POST_TRANSFORM::NONE;
+
+    let tree_roots: Span<usize> = array![0].span();
+    let nodes_modes: Span<MODE> = array![MODE::LEQ, MODE::LEQ, MODE::LEQ].span();
+
+    let nodes_featureids: Span<usize> = array![0, 0, 0].span();
+    let nodes_truenodeids: Span<usize> = array![1, 0, 1].span();
+    let nodes_trueleafs: Span<usize> = array![0, 1, 1].span();
+    let nodes_falsenodeids: Span<usize> = array![2, 2, 3].span();
+    let nodes_falseleafs: Span<usize> = array![0, 1, 1].span();
+    let leaf_targetids: Span<usize> = array![0, 1, 0, 1].span();
+
+    return TreeEnsembleTrait::predict(
+        @X,
+        nodes_splits,
+        nodes_featureids,
+        nodes_modes,
+        nodes_truenodeids,
+        nodes_falsenodeids,
+        nodes_trueleafs,
+        nodes_falseleafs,
+        leaf_targetids,
+        leaf_weights,
+        tree_roots,
+        post_transform,
+        aggregate_function,
+        nodes_hitrates,
+        nodes_missing_value_tracks_true,
+        membership_values,
+        n_targets
+    );
+}
+
+>>> [[ 5.23  0.  ]
+     [ 5.23  0.  ]
+     [ 0.   12.12]]    
+```
diff --git a/docs/framework/operators/tensor/README.md b/docs/framework/operators/tensor/README.md
@@ -132,6 +132,7 @@ use orion::operators::tensor::TensorTrait;
 | [`tensor.dynamic_quantize_linear`](tensor.dynamic\_quantize\_linear.md) | Computes the Scale, Zero Point and FP32->8Bit conversion of FP32 Input data.  |
 | [`tensor.scatter_nd`](tensor.scatter\_nd.md) | The output of the operation is produced by creating a copy of the input data, and then updating its value to values specified by updates at specific index positions specified by indices. Its output shape is the same as the shape of data |
 | [`tensor.label_encoder`](tensor.label\_encoder.md) | Maps each element in the input tensor to another value. |
+| [`tensor.mean`](tensor.mean.md) | Element-wise mean of each of the input tensors. |
 
 ## Arithmetic Operations
 

diff --git a/docs/framework/operators/tensor/tensor.mean.md b/docs/framework/operators/tensor/tensor.mean.md
@@ -0,0 +1,52 @@
+# tensor.mean
+
+```rust 
+   fn mean(args: Span<Tensor<T>>) -> Tensor<T>;
+```
+
+Element-wise mean of each of the input tensors.
+
+
+* `args`(`Span<Tensor<T>>`) - List of tensors for mean.
+
+## Returns
+
+Output tensor. 
+
+## Examples
+
+```rust
+use orion::operators::tensor::{FP8x23Tensor, FP8x23TensorAdd};
+use core::array::{ArrayTrait, SpanTrait};
+use orion::operators::tensor::{TensorTrait, Tensor};
+use orion::utils::{assert_eq, assert_seq_eq};
+use orion::operators::tensor::FP8x23TensorPartialEq;
+use orion::numbers::{FixedTrait, FP8x23};
+
+
+fn example() -> Tensor<FP8x23> {
+    let mut shape = ArrayTrait::<usize>::new();
+    shape.append(2);
+    shape.append(2);
+
+    let mut data = ArrayTrait::new();
+    data.append(FP8x23 { mag: 16777216, sign: true });
+    data.append(FP8x23 { mag: 16777216, sign: false });
+    data.append(FP8x23 { mag: 16777216, sign: true });
+    data.append(FP8x23 { mag: 16777216, sign: false });
+    let tensor1 = TensorTrait::new(shape.span(), data.span());
+
+    let mut shape2 = ArrayTrait::<usize>::new();
+    shape2.append(2);
+    shape2.append(2);
+
+    let mut data2 = ArrayTrait::new();
+    data2.append(FP8x23 { mag: 8388608, sign: false });
+    data2.append(FP8x23 { mag: 0, sign: false });
+    data2.append(FP8x23 { mag: 0, sign: false });
+    data2.append(FP8x23 { mag: 8388608, sign: false });
+    let tensor2 = TensorTrait::new(shape2.span(), data2.span());
+    return TensorTrait::mean(array![tensor1, tensor2].span());
+}
+>>> [FP8x23 { mag: 4194304, sign: false }, FP8x23 { mag: 8388608, sign: true }, FP8x23 { mag: 8388608, sign: false }, FP8x23 { mag: 12582912, sign: true }]
+```
diff --git a/nodegen/node/mean.py b/nodegen/node/mean.py
@@ -0,0 +1,94 @@
+import numpy as np
+from nodegen.node import RunAll
+from ..helpers import make_test, to_fp, Tensor, Dtype, FixedImpl, Trait, get_data_statement
+
+def mean(*args) -> np.ndarray:  # type: ignore
+    res = args[0].copy()
+    for m in args[1:]:
+        res += m
+    return (res / len(args)).astype(args[0].dtype)
+
+class Mean(RunAll):
+
+    @staticmethod
+    # We test here with fp8x23 implementation.
+    def fp8x23():
+        x = np.random.randint(-3, 3, (2, 2)).astype(np.float64)
+        y = np.random.randint(-3, 3, (2, 2)).astype(np.float64)
+        z = mean(x, y)
+
+        x = Tensor(Dtype.FP8x23, x.shape, to_fp(
+            x.flatten(), FixedImpl.FP8x23))
+        y = Tensor(Dtype.FP8x23, y.shape,  to_fp(
+            y.flatten(), FixedImpl.FP8x23))
+        z = Tensor(Dtype.FP8x23, z.shape,  to_fp(
+            z.flatten(), FixedImpl.FP8x23))
+
+        name = "mean_fp8x23"
+        make_test([x, y], z, "TensorTrait::mean(array![input_0, input_1].span())", name)
+
+    @staticmethod
+    # We test here with fp16x16 implementation.
+    def fp16x16():
+        x = np.random.randint(-3, 3, (2, 2)).astype(np.float64)
+        y = np.random.randint(-3, 3, (2, 2)).astype(np.float64)
+        z = mean(x, y)
+
+        x = Tensor(Dtype.FP16x16, x.shape, to_fp(
+            x.flatten(), FixedImpl.FP16x16))
+        y = Tensor(Dtype.FP16x16, y.shape,  to_fp(
+            y.flatten(), FixedImpl.FP16x16))
+        z = Tensor(Dtype.FP16x16, z.shape,  to_fp(
+            z.flatten(), FixedImpl.FP16x16))
+
+        name = "mean_fp16x16"
+        make_test([x, y], z, "TensorTrait::mean(array![input_0, input_1].span())", name)
+
+    @staticmethod
+    # We test here with i8 implementation.
+    def i8():
+        x = np.random.randint(0, 6, (2, 2)).astype(np.int8)
+        y = np.random.randint(0, 6, (2, 2)).astype(np.int8)
+        z = np.random.randint(0, 6, (2, 2)).astype(np.int8)
+        m = mean(x, y, z)
+
+        x = Tensor(Dtype.I8, x.shape, x.flatten())
+        y = Tensor(Dtype.I8, y.shape, y.flatten())
+        z = Tensor(Dtype.I8, z.shape, z.flatten())
+        m = Tensor(Dtype.I8, m.shape, m.flatten())
+
+        name = "mean_i8"
+        make_test([x, y, z], m, "TensorTrait::mean(array![input_0, input_1, input_2].span())", name)
+
+    @staticmethod
+    # We test here with i32 implementation.
+    def i32():
+        x = np.random.randint(0, 6, (2, 2)).astype(np.int32)
+        y = np.random.randint(0, 6, (2, 2)).astype(np.int32)
+        z = np.random.randint(0, 6, (2, 2)).astype(np.int32)
+        m = mean(x, y, z)
+
+        x = Tensor(Dtype.I32, x.shape, x.flatten())
+        y = Tensor(Dtype.I32, y.shape, y.flatten())
+        z = Tensor(Dtype.I32, z.shape, z.flatten())
+        m = Tensor(Dtype.I32, m.shape, m.flatten())
+
+        name = "mean_i32"
+        make_test([x, y, z], m, "TensorTrait::mean(array![input_0, input_1, input_2].span())", name)
+
+    @staticmethod
+    # We test here with u32 implementation.
+    def u32():
+        x = np.random.randint(0, 6, (2, 2)).astype(np.uint32)
+        y = np.random.randint(0, 6, (2, 2)).astype(np.uint32)
+        z = np.random.randint(0, 6, (2, 2)).astype(np.uint32)
+        m = mean(x, y, z)
+
+        x = Tensor(Dtype.U32, x.shape, x.flatten())
+        y = Tensor(Dtype.U32, y.shape, y.flatten())
+        z = Tensor(Dtype.U32, z.shape, z.flatten())
+        m = Tensor(Dtype.U32, m.shape, m.flatten())
+
+        name = "mean_u32"
+        make_test([x, y, z], m, "TensorTrait::mean(array![input_0, input_1, input_2].span())", name)
+
diff --git a/src/operators/ml.cairo b/src/operators/ml.cairo
@@ -3,6 +3,8 @@ mod linear;
 mod svm;
 mod normalizer;
 
+use orion::operators::ml::tree_ensemble::tree_ensemble::{TreeEnsembleTrait};
+
 use orion::operators::ml::tree_ensemble::core::{
     TreeEnsemble, TreeEnsembleAttributes, TreeEnsembleImpl, NODE_MODES
 };
@@ -32,3 +34,4 @@ enum POST_TRANSFORM {
     SOFTMAXZERO,
     PROBIT,
 }
+
diff --git a/src/operators/ml/tree_ensemble.cairo b/src/operators/ml/tree_ensemble.cairo
@@ -1,3 +1,4 @@
 mod core;
 mod tree_ensemble_classifier;
 mod tree_ensemble_regressor;
+mod tree_ensemble;