diff --git a/daal4py/_images/d4p-kmeans-scale.jpg b/daal4py/_images/d4p-kmeans-scale.jpg deleted file mode 100755 index 5366add..0000000 Binary files a/daal4py/_images/d4p-kmeans-scale.jpg and /dev/null differ diff --git a/daal4py/_images/d4p-linreg-scale.jpg b/daal4py/_images/d4p-linreg-scale.jpg deleted file mode 100755 index 4d68a43..0000000 Binary files a/daal4py/_images/d4p-linreg-scale.jpg and /dev/null differ diff --git a/daal4py/_modules/index.html b/daal4py/_modules/index.html deleted file mode 100755 index eadb05b..0000000 --- a/daal4py/_modules/index.html +++ /dev/null @@ -1,129 +0,0 @@ - - -
- - -' + - '' + - _("Hide Search Matches") + - "
" - ) - ); - }, - - /** - * helper function to hide the search marks again - */ - hideSearchWords: () => { - document - .querySelectorAll("#searchbox .highlight-link") - .forEach((el) => el.remove()); - document - .querySelectorAll("span.highlighted") - .forEach((el) => el.classList.remove("highlighted")); - localStorage.removeItem("sphinx_highlight_terms") - }, - - initEscapeListener: () => { - // only install a listener if it is really needed - if (!DOCUMENTATION_OPTIONS.ENABLE_SEARCH_SHORTCUTS) return; - - document.addEventListener("keydown", (event) => { - // bail for input elements - if (BLACKLISTED_KEY_CONTROL_ELEMENTS.has(document.activeElement.tagName)) return; - // bail with special keys - if (event.shiftKey || event.altKey || event.ctrlKey || event.metaKey) return; - if (DOCUMENTATION_OPTIONS.ENABLE_SEARCH_SHORTCUTS && (event.key === "Escape")) { - SphinxHighlight.hideSearchWords(); - event.preventDefault(); - } - }); - }, -}; - -_ready(SphinxHighlight.highlightSearchWords); -_ready(SphinxHighlight.initEscapeListener); diff --git a/daal4py/_static/style.css b/daal4py/_static/style.css deleted file mode 100755 index 0ef87ff..0000000 --- a/daal4py/_static/style.css +++ /dev/null @@ -1,120 +0,0 @@ -/* override table width restrictions */ -@media screen and (min-width: 767px) { - - .wy-table-responsive table td { - /* !important prevents the common CSS stylesheets from overriding - this as on RTD they are loaded after this stylesheet */ - - white-space: normal !important; - } -} - -.code-block-caption { - color: #000; - font: italic 85%/1 arial,sans-serif; - padding: 1em 0; - text-align: center; -} - - -.collapsible { - margin-left: -10px; - background-color: #f1f1f1; - cursor: pointer; - padding: 18px 18px 18px 10px; - width: 100%; - border: none; - text-align: left; - outline: none; - font-weight: 700; - font-family: "Roboto Slab","ff-tisa-web-pro","Georgia",Arial,sans-serif; -} - -code.sig-name.descname { - white-space: initial; -} - -table.optimization-notice td { - white-space: initial; -} - -table.optimization-notice td p:last-child { - text-align: right; -} - -img.with-border { - border:1px solid #021a40; -} - -div.column { - float: left; - width: 50%; - padding: 10px; - } - -/* Clear floats after the columns */ -.column:after { - content: ""; - display: table; - clear: both; -} - -.comparison:after { - content: ""; - display: table; - clear: both; - } - -div.admonition-container { - width: 49%; - padding: 0 3px 0 0; -} - -/* Clear floats after the columns */ -.admonition-container:after { - content: ""; - display: table; - clear: both; -} - -div.quotation { - background-color: #fffff1; - padding: 1em 0 0 1em; -} - -.rst-content div[class^='highlight'] pre { - white-space: pre-wrap; -} - -/* A workaround for https://github.com/readthedocs/sphinx_rtd_theme/issues/647 - * Override display for function signatures so that there is spacing between - * types and arguments */ - .rst-content dl:not(.docutils) dt { - display: table-cell !important; -} -.rst-content dl:not(.docutils) dd { - margin-top: 6px; -} - -/* -.rst-content tt.literal, .rst-content code.literal, .highlight { - background: #f0f0f0; -} -.rst-content tt.literal, .rst-content code.literal { - color: #000000; -}*/ - - -.eqno { - margin-left: 5px; - float: right; -} -.math .headerlink { - display: none; - visibility: hidden; -} -.math:hover .headerlink { - display: inline-block; - visibility: visible; - margin-right: -0.7em; -} diff --git a/daal4py/algorithms.html b/daal4py/algorithms.html old mode 100755 new mode 100644 index ac85082..6551e43 --- a/daal4py/algorithms.html +++ b/daal4py/algorithms.html @@ -1,6757 +1,14 @@ - + - - - -Note
-Scikit-learn patching functionality in daal4py was deprecated and moved to a separate package, Intel(R) Extension for Scikit-learn*. -All future patches will be available only in Intel(R) Extension for Scikit-learn*. Use the scikit-learn-intelex package instead of daal4py for the scikit-learn acceleration.
-See also Intel(R) oneAPI Data Analytics Library Classification.
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Classification Decision Forest.
-Examples:
-Single-Process Decision Forest Classification Default Dense method
Single-Process Decision Forest Classification Histogram method
nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for Decision forest, double or float
method (str) – [optional, default: “defaultDense”] Decision forest computation method
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
nTrees (size_t) – [optional, default: -1] Number of trees in the forest. Default is 10
observationsPerTreeFraction (double) – [optional, default: get_nan64()] Fraction of observations used for a training of one tree, 0 to 1. Default is 1 (sampling with replacement)
featuresPerNode (size_t) – [optional, default: -1] Number of features tried as possible splits per node. If 0 then sqrt(p) for classification, p/3 for regression, where p is the total number of features.
maxTreeDepth (size_t) – [optional, default: -1] Maximal tree depth. Default is 0 (unlimited)
minObservationsInLeafNode (size_t) – [optional, default: -1] Minimal number of observations in a leaf node. Default is 1 for classification, 5 for regression.
engine (engines_batchbase__iface__) – [optional, default: None] Engine for the random numbers generator used by the algorithms
impurityThreshold (double) – [optional, default: get_nan64()] Threshold value used as stopping criteria: if the impurity value in the node is smaller than the threshold then the node is not split anymore.
varImportance (str) – [optional, default: “”] Variable importance computation mode
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
memorySavingMode (bool) – [optional, default: False] If true then use memory saving (but slower) mode
bootstrap (bool) – [optional, default: False] If true then training set for a tree is a bootstrap of the whole training set
minObservationsInSplitNode (size_t) – [optional, default: -1] Minimal number of observations in a split node. Default 2
minWeightFractionInLeafNode (double) – [optional, default: get_nan64()] The minimum weighted fraction of the sum total of weights (of all the input observations) required to be at a leaf node, 0.0 to 0.5. Default is 0.0
minImpurityDecreaseInSplitNode (double) – [optional, default: get_nan64()] A node will be split if this split induces a decrease of the impurity greater than or equal to the value, non-negative. Default is 0.0
maxLeafNodes (size_t) – [optional, default: -1] Maximum number of leaf node. Default is 0 (unlimited)
maxBins (size_t) – [optional, default: -1] Used with ‘hist’ split finding method only. Maximal number of discrete bins to bucket continuous features. Default is 256. Increasing the number results in higher computation costs
minBinSize (size_t) – [optional, default: -1] Used with ‘hist’ split finding method only. Minimal number of observations in a bin. Default is 5
splitter (str) – [optional, default: “”] Sets node splitting method. Default is best
binningStrategy (str) – [optional, default: “”] Used with ‘hist’ split finding method only. Selects the strategy to group data points into bins. Allowed values are ‘quantiles’ (default), ‘averages’
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – Labels of the training data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
Properties:
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the decision_forest algorithm, double or float
method (str) – [optional, default: “defaultDense”] decision_forest computation method
votingMethod (str) – [optional, default: “”]
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (decision_forest_classification_modelptr) – Input model trained by the classification algorithm
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Classification Decision Tree.
-Examples:
- -nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for Decision tree model-based training, double or float
method (str) – [optional, default: “defaultDense”] Decision tree training method
pruning (str) – [optional, default: “”] Pruning method for Decision tree
maxTreeDepth (size_t) – [optional, default: -1] Maximum tree depth. 0 means unlimited depth.
minObservationsInLeafNodes (size_t) – [optional, default: -1] Minimum number of observations in the leaf node. Can be any positive number.
nBins (size_t) – [optional, default: -1] The number of bins used to compute probabilities of the observations belonging to the class. The only supported value for current version of the library is 1.
splitCriterion (str) – [optional, default: “”] Split criterion for Decision tree classification
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – Labels of the training data set
dataForPruning (data_or_file) – Pruning data set
labelsForPruning (data_or_file) – Labels of the pruning data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
Properties:
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for Decision tree model-based prediction
method (str) – [optional, default: “defaultDense”] Computation method in the batch processing mode
pruning (str) – [optional, default: “”] Pruning method for Decision tree
maxTreeDepth (size_t) – [optional, default: -1] Maximum tree depth. 0 means unlimited depth.
minObservationsInLeafNodes (size_t) – [optional, default: -1] Minimum number of observations in the leaf node. Can be any positive number.
nBins (size_t) – [optional, default: -1] The number of bins used to compute probabilities of the observations belonging to the class. The only supported value for current version of the library is 1.
splitCriterion (str) – [optional, default: “”] Split criterion for Decision tree classification
nClasses (size_t) – [optional, default: -1] Number of classes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (decision_tree_classification_modelptr) – Input model trained by the classification algorithm
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Classification Gradient Boosted Tree.
-Examples:
- -nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for Gradient Boosted Trees, double or float
method (str) – [optional, default: “defaultDense”] Gradient Boosted Trees computation method
loss (str) – [optional, default: “”] Loss function type
varImportance (str) – [optional, default: “”] 64 bit integer flag VariableImportanceModes that indicates the variable importance computation modes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
splitMethod (str) – [optional, default: “”] Split finding method. Default is exact
maxIterations (size_t) – [optional, default: -1] Maximal number of iterations of the gradient boosted trees training algorithm. Default is 50
maxTreeDepth (size_t) – [optional, default: -1] Maximal tree depth, 0 for unlimited. Default is 6
shrinkage (double) – [optional, default: get_nan64()] Learning rate of the boosting procedure. Scales the contribution of each tree by a factor (0, 1]. Default is 0.3
minSplitLoss (double) – [optional, default: get_nan64()] Loss regularization parameter. Min loss reduction required to make a further partition on a leaf node of the tree. Range: [0, inf). Default is 0
lambda (double) – [optional, default: get_nan64()] L2 regularization parameter on weights. Range: [0, inf). Default is 1
observationsPerTreeFraction (double) – [optional, default: get_nan64()] Fraction of observations used for a training of one tree, sampling without replacement. Range: (0, 1]. Default is 1 (no sampling, entire dataset is used)
featuresPerNode (size_t) – [optional, default: -1] Number of features tried as possible splits per node. Range : [0, p] where p is the total number of features. Default is 0 (use all features)
minObservationsInLeafNode (size_t) – [optional, default: -1] Minimal number of observations in a leaf node. Default is 5.
memorySavingMode (bool) – [optional, default: False] If true then use memory saving (but slower) mode. Default is false
engine (engines_batchbase__iface__) – [optional, default: None] Engine for the random numbers generator used by the algorithms
maxBins (size_t) – [optional, default: -1] Used with ‘inexact’ split finding method only. Maximal number of discrete bins to bucket continuous features. Default is 256. Increasing the number results in higher computation costs
minBinSize (size_t) – [optional, default: -1] Used with ‘inexact’ split finding method only. Minimal number of observations in a bin. Default is 5
internalOptions (int) – [optional, default: -1] Internal options
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – Labels of the training data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
Properties:
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the gbt algorithm, double or float
method (str) – [optional, default: “defaultDense”] gradient boosted trees computation method
nIterations (size_t) – [optional, default: -1] Number of iterations of the trained model to be used for prediction
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (gbt_classification_modelptr) – Input model trained by the classification algorithm
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library k-Nearest Neighbors (kNN).
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for KD-tree based kNN model-based training, double or float
method (str) – [optional, default: “defaultDense”] KD-tree based kNN training method
k (size_t) – [optional, default: -1] Number of neighbors
dataUseInModel (str) – [optional, default: “”] The option to enable/disable an usage of the input dataset in kNN model
engine (engines_batchbase__iface__) – [optional, default: None] Engine for random choosing elements from training dataset
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
voteWeights (str) – [optional, default: “”] Weight function used in prediction
nClasses (size_t) – [optional, default: -1] Number of classes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – [optional, default: None] Labels of the training data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
Properties:
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for KD-tree based kNN model-based prediction
method (str) – [optional, default: “defaultDense”] Computation method in the batch processing mode
k (size_t) – [optional, default: -1] Number of neighbors
dataUseInModel (str) – [optional, default: “”] The option to enable/disable an usage of the input dataset in kNN model
engine (engines_batchbase__iface__) – [optional, default: None] Engine for random choosing elements from training dataset
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
voteWeights (str) – [optional, default: “”] Weight function used in prediction
nClasses (size_t) – [optional, default: -1] Number of classes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (kdtree_knn_classification_modelptr) – Input model trained by the classification algorithm
kdtree_knn_classification_prediction_result
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library k-Nearest Neighbors (kNN).
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for BF kNN model-based training, double or float
method (str) – [optional, default: “defaultDense”] BF kNN training method
k (size_t) – [optional, default: -1] Number of neighbors
dataUseInModel (str) – [optional, default: “”] The option to enable/disable an usage of the input dataset in kNN model
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
voteWeights (str) – [optional, default: “”] Weight function used in prediction
engine (engines_batchbase__iface__) – [optional, default: None] Engine for random choosing elements from training dataset
nClasses (size_t) – [optional, default: -1] Number of classes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – [optional, default: None] Labels of the training data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
Properties:
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for BF kNN model-based prediction
method (str) – [optional, default: “defaultDense”] Computation method in the batch processing mode
k (size_t) – [optional, default: -1] Number of neighbors
dataUseInModel (str) – [optional, default: “”] The option to enable/disable an usage of the input dataset in kNN model
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
voteWeights (str) – [optional, default: “”] Weight function used in prediction
engine (engines_batchbase__iface__) – [optional, default: None] Engine for random choosing elements from training dataset
nClasses (size_t) – [optional, default: -1] Number of classes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (bf_knn_classification_modelptr) – Input model trained by the classification algorithm
bf_knn_classification_prediction_result
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Classification AdaBoost.
-Examples:
- -nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the AdaBoost, double or float
method (str) – [optional, default: “defaultDense”] AdaBoost computation method
weakLearnerTraining (classifier_training_batch__iface__) – [optional, default: None] The algorithm for weak learner model training
weakLearnerPrediction (classifier_prediction_batch__iface__) – [optional, default: None] The algorithm for prediction based on a weak learner model
accuracyThreshold (double) – [optional, default: get_nan64()] Accuracy of the AdaBoost training algorithm
maxIterations (size_t) – [optional, default: -1] Maximal number of iterations of the AdaBoost training algorithm
learningRate (double) – [optional, default: get_nan64()] Multiplier for each classifier to shrink its contribution
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – Labels of the training data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
Properties:
-Numpy array
-nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the AdaBoost, double or float
method (str) – [optional, default: “defaultDense”] AdaBoost computation method
weakLearnerTraining (classifier_training_batch__iface__) – [optional, default: None] The algorithm for weak learner model training
weakLearnerPrediction (classifier_prediction_batch__iface__) – [optional, default: None] The algorithm for prediction based on a weak learner model
accuracyThreshold (double) – [optional, default: get_nan64()] Accuracy of the AdaBoost training algorithm
maxIterations (size_t) – [optional, default: -1] Maximal number of iterations of the AdaBoost training algorithm
learningRate (double) – [optional, default: get_nan64()] Multiplier for each classifier to shrink its contribution
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (adaboost_modelptr) – Input model trained by the classification algorithm
Properties:
-Numpy array
-Numpy array
-Numpy array
-Properties:
-Numpy array
-size_t
-size_t
-size_t
-classifier_model (or derived)
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Classification BrownBoost.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for BrownBoost, double or float
method (str) – [optional, default: “defaultDense”] BrownBoost computation method
weakLearnerTraining (classifier_training_batch__iface__) – [optional, default: None] The algorithm for weak learner model training
weakLearnerPrediction (classifier_prediction_batch__iface__) – [optional, default: None] The algorithm for prediction based on a weak learner model
accuracyThreshold (double) – [optional, default: get_nan64()] Accuracy of the BrownBoost training algorithm
maxIterations (size_t) – [optional, default: -1] Maximal number of iterations of the BrownBoost training algorithm
newtonRaphsonAccuracyThreshold (double) – [optional, default: get_nan64()] Accuracy threshold for Newton-Raphson iterations in the BrownBoost training algorithm
newtonRaphsonMaxIterations (size_t) – [optional, default: -1] Maximal number of Newton-Raphson iterations in the BrownBoost training algorithm
degenerateCasesThreshold (double) – [optional, default: get_nan64()] Threshold needed to avoid degenerate cases in the BrownBoost training algorithm
nClasses (size_t) – [optional, default: -1] Number of classes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – Labels of the training data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the BrownBoost algorithm, double or float
method (str) – [optional, default: “defaultDense”] BrownBoost computation method
weakLearnerTraining (classifier_training_batch__iface__) – [optional, default: None] The algorithm for weak learner model training
weakLearnerPrediction (classifier_prediction_batch__iface__) – [optional, default: None] The algorithm for prediction based on a weak learner model
accuracyThreshold (double) – [optional, default: get_nan64()] Accuracy of the BrownBoost training algorithm
maxIterations (size_t) – [optional, default: -1] Maximal number of iterations of the BrownBoost training algorithm
newtonRaphsonAccuracyThreshold (double) – [optional, default: get_nan64()] Accuracy threshold for Newton-Raphson iterations in the BrownBoost training algorithm
newtonRaphsonMaxIterations (size_t) – [optional, default: -1] Maximal number of Newton-Raphson iterations in the BrownBoost training algorithm
degenerateCasesThreshold (double) – [optional, default: get_nan64()] Threshold needed to avoid degenerate cases in the BrownBoost training algorithm
nClasses (size_t) – [optional, default: -1] Number of classes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (brownboost_modelptr) – Input model trained by the classification algorithm
Properties:
-Numpy array
-Numpy array
-Numpy array
-Properties:
-Numpy array
-size_t
-size_t
-size_t
-classifier_model (or derived)
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Classification LogitBoost.
-Examples:
- -nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for LogitBoost, double or float
method (str) – [optional, default: “friedman”] LogitBoost computation method
weakLearnerTraining (regression_training_batch__iface__) – [optional, default: None] The algorithm for weak learner model training
weakLearnerPrediction (regression_prediction_batch__iface__) – [optional, default: None] The algorithm for prediction based on a weak learner model
accuracyThreshold (double) – [optional, default: get_nan64()] Accuracy of the LogitBoost training algorithm
maxIterations (size_t) – [optional, default: -1] Maximal number of terms in additive regression
weightsDegenerateCasesThreshold (double) – [optional, default: get_nan64()] Threshold to avoid degenerate cases when calculating weights W
responsesDegenerateCasesThreshold (double) – [optional, default: get_nan64()] Threshold to avoid degenerate cases when calculating responses Z
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – Labels of the training data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the LogitBoost algorithm, double or float
method (str) – [optional, default: “defaultDense”] LogitBoost computation method
weakLearnerTraining (regression_training_batch__iface__) – [optional, default: None] The algorithm for weak learner model training
weakLearnerPrediction (regression_prediction_batch__iface__) – [optional, default: None] The algorithm for prediction based on a weak learner model
accuracyThreshold (double) – [optional, default: get_nan64()] Accuracy of the LogitBoost training algorithm
maxIterations (size_t) – [optional, default: -1] Maximal number of terms in additive regression
weightsDegenerateCasesThreshold (double) – [optional, default: get_nan64()] Threshold to avoid degenerate cases when calculating weights W
responsesDegenerateCasesThreshold (double) – [optional, default: get_nan64()] Threshold to avoid degenerate cases when calculating responses Z
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (logitboost_modelptr) – Input model trained by the classification algorithm
Properties:
-Numpy array
-Numpy array
-Numpy array
-Properties:
-size_t
-size_t
-size_t
-size_t
-regression_model (or derived)
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Classification Weak Learner Stump.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the the decision stump training method, double or float
method (str) – [optional, default: “defaultDense”] Decision stump training method
splitCriterion (str) – [optional, default: “”] Split criterion for stump classification
varImportance (str) – [optional, default: “”] Variable importance computation mode
nClasses (size_t) – [optional, default: -1] Number of classes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – Labels of the training data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
Properties:
-Numpy array
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the decision stump prediction algorithm, double or float
method (str) – [optional, default: “defaultDense”] Decision stump model-based prediction method
nClasses (size_t) – [optional, default: -1] Number of classes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (stump_classification_modelptr) – Input model trained by the classification algorithm
Properties:
-Numpy array
-Numpy array
-Numpy array
-Properties:
-double
-size_t
-size_t
-double
-size_t
-double
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Naive Bayes.
-Examples:
- -nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for multinomial naive Bayes training, double or float
method (str) – [optional, default: “defaultDense”] Computation method
priorClassEstimates (array) – [optional, default: None] Prior class estimates
alpha (array) – [optional, default: None] Imagined occurrences of the each word
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
distributed (bool) – [optional, default: False] enable distributed computation (SPMD)
streaming (bool) – [optional, default: False] enable streaming
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – Labels of the training data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
Properties:
-nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for prediction based on the multinomial naive Bayes model, double or float
method (str) – [optional, default: “defaultDense”] Multinomial naive Bayes prediction method
priorClassEstimates (array) – [optional, default: None] Prior class estimates
alpha (array) – [optional, default: None] Imagined occurrences of the each word
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (multinomial_naive_bayes_modelptr) – Input model trained by the classification algorithm
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library SVM.
-Note: For the labels parameter, data is formatted as -1s and 1s
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the SVM training algorithm, double or float
method (str) – [optional, default: “boser”] SVM training method
C (double) – [optional, default: get_nan64()] Upper bound in constraints of the quadratic optimization problem
accuracyThreshold (double) – [optional, default: get_nan64()] Training accuracy
tau (double) – [optional, default: get_nan64()] Tau parameter of the working set selection scheme
maxIterations (size_t) – [optional, default: -1] Maximal number of iterations for the algorithm
cacheSize (size_t) – [optional, default: -1] Size of cache in bytes to store values of the kernel matrix. A non-zero value enables use of a cache optimization technique
doShrinking (bool) – [optional, default: False] Flag that enables use of the shrinking optimization technique
shrinkingStep (size_t) – [optional, default: -1] Number of iterations between the steps of shrinking optimization technique
kernel (kernel_function_kerneliface__iface__) – [optional, default: None] Kernel function
nClasses (size_t) – [optional, default: -1] Number of classes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – Labels of the training data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
fptype (str) – [optional, default: “double”]
method (str) – [optional, default: “defaultDense”]
C (double) – [optional, default: get_nan64()] Upper bound in constraints of the quadratic optimization problem
accuracyThreshold (double) – [optional, default: get_nan64()] Training accuracy
tau (double) – [optional, default: get_nan64()] Tau parameter of the working set selection scheme
maxIterations (size_t) – [optional, default: -1] Maximal number of iterations for the algorithm
cacheSize (size_t) – [optional, default: -1] Size of cache in bytes to store values of the kernel matrix. A non-zero value enables use of a cache optimization technique
doShrinking (bool) – [optional, default: False] Flag that enables use of the shrinking optimization technique
shrinkingStep (size_t) – [optional, default: -1] Number of iterations between the steps of shrinking optimization technique
kernel (kernel_function_kerneliface__iface__) – [optional, default: None] Kernel function
nClasses (size_t) – [optional, default: -1] Number of classes
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (svm_modelptr) – Input model trained by the classification algorithm
Properties:
-Numpy array
-Numpy array
-Numpy array
-Properties:
-double
-Numpy array
-size_t
-size_t
-Numpy array
-Numpy array
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Logistic Regression.
-Examples:
- -nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for logistic regression, double or float
method (str) – [optional, default: “defaultDense”] logistic regression computation method
interceptFlag (bool) – [optional, default: False] Whether the intercept needs to be computed
penaltyL1 (float) – [optional, default: get_nan32()] L1 regularization coefficient. Default is 0 (not applied)
penaltyL2 (float) – [optional, default: get_nan32()] L2 regularization coefficient. Default is 0 (not applied)
optimizationSolver (optimization_solver_iterative_solver_batch__iface__) – [optional, default: None] Default is sgd momentum solver
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Training data set
labels (data_or_file) – Labels of the training data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
nClasses (size_t) – Number of classes
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the logistic regression algorithm, double or float
method (str) – [optional, default: “defaultDense”] logistic regression computation method
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data set
model (logistic_regression_modelptr) – Input model trained by the classification algorithm
See also Intel(R) oneAPI Data Analytics Library Regression.
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Regression Decision Forest.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for decision forest model-based training, double or float
method (str) – [optional, default: “defaultDense”] decision forest training method
nTrees (size_t) – [optional, default: -1] Number of trees in the forest. Default is 10
observationsPerTreeFraction (double) – [optional, default: get_nan64()] Fraction of observations used for a training of one tree, 0 to 1. Default is 1 (sampling with replacement)
featuresPerNode (size_t) – [optional, default: -1] Number of features tried as possible splits per node. If 0 then sqrt(p) for classification, p/3 for regression, where p is the total number of features.
maxTreeDepth (size_t) – [optional, default: -1] Maximal tree depth. Default is 0 (unlimited)
minObservationsInLeafNode (size_t) – [optional, default: -1] Minimal number of observations in a leaf node. Default is 1 for classification, 5 for regression.
engine (engines_batchbase__iface__) – [optional, default: None] Engine for the random numbers generator used by the algorithms
impurityThreshold (double) – [optional, default: get_nan64()] Threshold value used as stopping criteria: if the impurity value in the node is smaller than the threshold then the node is not split anymore.
varImportance (str) – [optional, default: “”] Variable importance computation mode
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
memorySavingMode (bool) – [optional, default: False] If true then use memory saving (but slower) mode
bootstrap (bool) – [optional, default: False] If true then training set for a tree is a bootstrap of the whole training set
minObservationsInSplitNode (size_t) – [optional, default: -1] Minimal number of observations in a split node. Default 2
minWeightFractionInLeafNode (double) – [optional, default: get_nan64()] The minimum weighted fraction of the sum total of weights (of all the input observations) required to be at a leaf node, 0.0 to 0.5. Default is 0.0
minImpurityDecreaseInSplitNode (double) – [optional, default: get_nan64()] A node will be split if this split induces a decrease of the impurity greater than or equal to the value, non-negative. Default is 0.0
maxLeafNodes (size_t) – [optional, default: -1] Maximum number of leaf node. Default is 0 (unlimited)
maxBins (size_t) – [optional, default: -1] Used with ‘hist’ split finding method only. Maximal number of discrete bins to bucket continuous features. Default is 256. Increasing the number results in higher computation costs
minBinSize (size_t) – [optional, default: -1] Used with ‘hist’ split finding method only. Minimal number of observations in a bin. Default is 5
splitter (str) – [optional, default: “”] Sets node splitting method. Default is best
binningStrategy (str) – [optional, default: “”] Used with ‘hist’ split finding method only. Selects the strategy to group data points into bins. Allowed values are ‘quantiles’ (default), ‘averages’
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
dependentVariable (data_or_file) – Values of the dependent variable for the input data
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
Properties:
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for decision forest model-based prediction
method (str) – [optional, default: “defaultDense”] Computation method in the batch processing mode
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
model (decision_forest_regression_modelptr) – Trained decision tree model
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Regression Decision Tree.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for Decision tree model-based training, double or float
method (str) – [optional, default: “defaultDense”] Decision tree training method
pruning (str) – [optional, default: “”] Pruning method for Decision tree
maxTreeDepth (size_t) – [optional, default: -1] Maximum tree depth. 0 means unlimited depth.
minObservationsInLeafNodes (size_t) – [optional, default: -1] Minimum number of observations in the leaf node. Can be any positive number.
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
dependentVariables (data_or_file) – Values of the dependent variable for the input data
dataForPruning (data_or_file) – Pruning data set
dependentVariablesForPruning (data_or_file) – Labels of the pruning data set
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set
Properties:
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for Decision tree model-based prediction
method (str) – [optional, default: “defaultDense”] Computation method in the batch processing mode
pruning (str) – [optional, default: “”] Pruning method for Decision tree
maxTreeDepth (size_t) – [optional, default: -1] Maximum tree depth. 0 means unlimited depth.
minObservationsInLeafNodes (size_t) – [optional, default: -1] Minimum number of observations in the leaf node. Can be any positive number.
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
model (decision_tree_regression_modelptr) – Trained decision tree model
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Regression Gradient Boosted Tree.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for model-based training, double or float
method (str) – [optional, default: “defaultDense”] gradient boosted trees training method
loss (str) – [optional, default: “”] Loss function type
varImportance (str) – [optional, default: “”] 64 bit integer flag VariableImportanceModes that indicates the variable importance computation modes
splitMethod (str) – [optional, default: “”] Split finding method. Default is exact
maxIterations (size_t) – [optional, default: -1] Maximal number of iterations of the gradient boosted trees training algorithm. Default is 50
maxTreeDepth (size_t) – [optional, default: -1] Maximal tree depth, 0 for unlimited. Default is 6
shrinkage (double) – [optional, default: get_nan64()] Learning rate of the boosting procedure. Scales the contribution of each tree by a factor (0, 1]. Default is 0.3
minSplitLoss (double) – [optional, default: get_nan64()] Loss regularization parameter. Min loss reduction required to make a further partition on a leaf node of the tree. Range: [0, inf). Default is 0
lambda (double) – [optional, default: get_nan64()] L2 regularization parameter on weights. Range: [0, inf). Default is 1
observationsPerTreeFraction (double) – [optional, default: get_nan64()] Fraction of observations used for a training of one tree, sampling without replacement. Range: (0, 1]. Default is 1 (no sampling, entire dataset is used)
featuresPerNode (size_t) – [optional, default: -1] Number of features tried as possible splits per node. Range : [0, p] where p is the total number of features. Default is 0 (use all features)
minObservationsInLeafNode (size_t) – [optional, default: -1] Minimal number of observations in a leaf node. Default is 5.
memorySavingMode (bool) – [optional, default: False] If true then use memory saving (but slower) mode. Default is false
engine (engines_batchbase__iface__) – [optional, default: None] Engine for the random numbers generator used by the algorithms
maxBins (size_t) – [optional, default: -1] Used with ‘inexact’ split finding method only. Maximal number of discrete bins to bucket continuous features. Default is 256. Increasing the number results in higher computation costs
minBinSize (size_t) – [optional, default: -1] Used with ‘inexact’ split finding method only. Minimal number of observations in a bin. Default is 5
internalOptions (int) – [optional, default: -1] Internal options
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
dependentVariable (data_or_file) – Values of the dependent variable for the input data
Properties:
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for model-based prediction
method (str) – [optional, default: “defaultDense”] Computation method in the batch processing mode
nIterations (size_t) – [optional, default: -1] Number of iterations of the trained model to be uses for prediction
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
model (gbt_regression_modelptr) – Trained gradient boosted trees model
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Linear Regression.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for linear regression model-based training, double or float
method (str) – [optional, default: “normEqDense”] Linear regression training method
interceptFlag (bool) – [optional, default: False] Flag that indicates whether the intercept needs to be computed
distributed (bool) – [optional, default: False] enable distributed computation (SPMD)
streaming (bool) – [optional, default: False] enable streaming
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
dependentVariables (data_or_file) – Values of the dependent variable for the input data
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for linear regression model-based prediction
method (str) – [optional, default: “defaultDense”] Computation method in the batch processing mode
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
model (linear_regression_modelptr) – Trained linear regression model
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Least Absolute Shrinkage and Selection Operator.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for lasso regression model-based training, double or float
method (str) – [optional, default: “defaultDense”] LASSO regression training method
lassoParameters (array) – [optional, default: None] Numeric table that contains values of lasso parameters
optimizationSolver (optimization_solver_iterative_solver_batch__iface__) – [optional, default: None] Default is coordinate descent solver
dataUseInComputation (str) – [optional, default: “”] The flag allows to corrupt input data
optResultToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the optional results to compute
interceptFlag (bool) – [optional, default: False] Flag that indicates whether the intercept needs to be computed
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
dependentVariables (data_or_file) – Values of the dependent variable for the input data
weights (data_or_file) – [optional, default: None] NumericTable of size 1 x n with weights of samples. Applied for all method
gramMatrix (data_or_file) – [optional, default: None] NumericTable of size p x p with last iteration number. Applied for all method
Properties:
-Numpy array
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for lasso regression model-based prediction
method (str) – [optional, default: “defaultDense”]
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
model (lasso_regression_modelptr) – Trained lasso regression model
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Ridge Regression.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for ridge regression model-based training, double or float
method (str) – [optional, default: “normEqDense”] Ridge regression training method
ridgeParameters (array) – [optional, default: None] Numeric table that contains values of ridge parameters
interceptFlag (bool) – [optional, default: False] Flag that indicates whether the intercept needs to be computed
distributed (bool) – [optional, default: False] enable distributed computation (SPMD)
streaming (bool) – [optional, default: False] enable streaming
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
dependentVariables (data_or_file) – Values of the dependent variable for the input data
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for ridge regression model-based prediction
method (str) – [optional, default: “defaultDense”] Computation method in the batch processing mode
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
model (ridge_regression_modelptr) – Trained ridge regression model
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Regression Stump.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the the decision stump training method, double or float
method (str) – [optional, default: “defaultDense”] Decision stump training method
varImportance (str) – [optional, default: “”] Variable importance mode. Variable importance computation is not supported for current version of the library
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
dependentVariables (data_or_file) – Values of the dependent variable for the input data
weights (data_or_file) – [optional, default: None] Optional. Weights of the observations in the training data set. Some values are skipped for backward compatibility.
Properties:
-Numpy array
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the decision stump prediction algorithm, double or float
method (str) – [optional, default: “defaultDense”] Decision stump model-based prediction method
varImportance (str) – [optional, default: “”] Variable importance mode. Variable importance computation is not supported for current version of the library
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
model (stump_regression_modelptr) – Trained regression model
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library PCA.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for PCA, double or float
method (str) – [optional, default: “correlationDense”] PCA computation method
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
nComponents (size_t) – [optional, default: -1] number of components for reduced implementation
isDeterministic (bool) – [optional, default: False] sign flip if required
doScale (bool) – [optional, default: False] scaling if required
isCorrelation (bool) – [optional, default: False] correlation is provided
normalization (normalization_zscore_batchimpl__iface__) – [optional, default: None] Pointer to batch covariance
distributed (bool) – [optional, default: False] enable distributed computation (SPMD)
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
correlation (data_or_file) – [optional, default: None] Input correlation table
Properties:
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library PCA Transform.
-Examples:
- -fptype (str) – [optional, default: “double”]
method (str) – [optional, default: “defaultDense”]
nComponents (size_t) – [optional, default: -1]
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
eigenvectors (data_or_file) – Transformation matrix of eigenvectors
dataForTransform (dict_numerictableptr) – Data for transform
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library K-Means Clustering.
-Examples:
- -Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library K-Means Initialization.
-nClusters (size_t) – Number of clusters
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of initial clusters for K-Means algorithm, double or float
method (str) – [optional, default: “defaultDense”] Method of computing initial clusters for the algorithm
nTrials (size_t) – [optional, default: -1] Kmeans++ only. The number of trials to generate all clusters but the first initial cluster.
oversamplingFactor (double) – [optional, default: get_nan64()] Kmeans|| only. A fraction of nClusters being chosen in each of nRounds of kmeans||.L = nClusters* oversamplingFactor points are sampled in a round.
nRounds (size_t) – [optional, default: -1] Kmeans|| only. Number of rounds for k-means||. (oversamplingFactor*nRounds) > 1 is a requirement.
engine (engines_batchbase__iface__) – [optional, default: None] Engine to be used for generating random numbers for the initialization
distributed (bool) – [optional, default: False] enable distributed computation (SPMD)
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library K-Means Computation.
-nClusters (size_t) – Number of clusters
maxIterations (size_t) – Number of iterations
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of K-Means, double or float
method (str) – [optional, default: “lloydDense”] Computation method of the algorithm
accuracyThreshold (double) – [optional, default: get_nan64()] Threshold for the termination of the algorithm
gamma (double) – [optional, default: get_nan64()] Weight used in distance computation for categorical features
distanceType (str) – [optional, default: “”] Distance used in the algorithm
resultsToEvaluate (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
assignFlag (bool) – [optional, default: False] Do data points assignment :param bool distributed: [optional, default: False] enable distributed computation (SPMD)
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
inputCentroids (data_or_file) – Initial centroids for the algorithm
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Density-Based Spatial Clustering of Applications with Noise.
-Examples:
- -epsilon (double) – Radius of neighborhood
minObservations (size_t) – Minimal total weight of observations in neighborhood of core observation
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of DBSCAN, double or float
method (str) – [optional, default: “defaultDense”] Computation method of the algorithm
memorySavingMode (bool) – [optional, default: False] If true then use memory saving (but slower) mode
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
blockIndex (size_t) – [optional, default: -1] Unique identifier of block initially passed for computation on the local node
nBlocks (size_t) – [optional, default: -1] Number of blocks initially passed for computation on all nodes
leftBlocks (size_t) – [optional, default: -1] Number of blocks that will process observations with value of selected split feature lesser than selected split value
rightBlocks (size_t) – [optional, default: -1] Number of blocks that will process observations with value of selected split feature greater than selected split value
distributed (bool) – [optional, default: False] enable distributed computation (SPMD)
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
weights (data_or_file) – [optional, default: None] Input weights of observations
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Multivariate Outlier Detection.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the multivariate outlier detection, double or float
method (str) – [optional, default: “defaultDense”] Multivariate outlier detection computation method
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
location (data_or_file) – [optional, default: None] Vector of mean estimates of size 1 x p
scatter (data_or_file) – [optional, default: None] Measure of spread, the variance-covariance matrix of size p x p
threshold (data_or_file) – [optional, default: None] Limit that defines the outlier region, the array of size 1 x 1 containing a non-negative number
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Univariate Outlier Detection.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the univariate outlier detection algorithm, double or float
method (str) – [optional, default: “defaultDense”] univariate outlier detection computation method
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
location (data_or_file) – [optional, default: None] Vector of mean estimates of size 1 x p
scatter (data_or_file) – [optional, default: None] Measure of spread, the array of standard deviations of size 1 x p
threshold (data_or_file) – [optional, default: None] Limit that defines the outlier region, the array of non-negative numbers of size 1 x p
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Multivariate Bacon Outlier Detection.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the BACON outlier detection, double or float
method (str) – [optional, default: “defaultDense”] BACON outlier detection computation method
initMethod (str) – [optional, default: “”] Initialization method
alpha (double) – [optional, default: get_nan64()] One-tailed probability that defines the (1 - lpha) quantile of the chi^2 distribution with p degrees of freedom. Recommended value: lpha / n, where n is the number of observations.
toleranceToConverge (double) – [optional, default: get_nan64()] Stopping criterion: the algorithm is terminated if the size of the basic subset is changed by less than the threshold
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library MSE.
-Examples:
-numberOfTerms (size_t) – The number of terms in the function
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the Mean squared error objective function, double or float
method (str) – [optional, default: “defaultDense”] The Mean squared error objective function computation method
interceptFlag (bool) – [optional, default: False] Whether the intercept needs to be computed. Default is true
penaltyL1 (array) – [optional, default: None] L1 regularization coefficients. Default is 0 (not applied)
penaltyL2 (array) – [optional, default: None] L2 regularization coefficients. Default is 0 (not applied)
batchIndices (array) – [optional, default: None] Numeric table of size 1 x m where m is batch size that represent a batch of indices used to compute the function results, e.g., value of the sum of the functions. If no indices are provided, all terms will be used in the computations.
featureId (size_t) – [optional, default: -1] The feature index to compute part of gradient/hessian/proximal projection
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Numeric table of size n x p with data
dependentVariables (data_or_file) – Numeric table of size n x 1 with dependent variables
argument (data_or_file) – Numeric table of size 1 x p with input argument of the objective function
weights (data_or_file) – NumericTable of size 1 x n with samples weights. Applied for all method
gramMatrix (data_or_file) – NumericTable of size p x p with last iteration number. Applied for all method
optimization_solver_objective_function_result
-Setup (partial) input data for using algorithm object in other algorithms.
-data (data_or_file) – Numeric table of size n x p with data
dependentVariables (data_or_file) – Numeric table of size n x 1 with dependent variables
argument (data_or_file) – Numeric table of size 1 x p with input argument of the objective function
weights (data_or_file) – NumericTable of size 1 x n with samples weights. Applied for all method
gramMatrix (data_or_file) – NumericTable of size p x p with last iteration number. Applied for all method
None
-alias of optimization_solver_objective_function_result
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Logistic Loss.
-Examples:
-numberOfTerms (size_t) – The number of terms in the function
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the Logistic loss objective function, double or float
method (str) – [optional, default: “defaultDense”] The Logistic loss objective function computation method
interceptFlag (bool) – [optional, default: False] Whether the intercept needs to be computed. Default is true
penaltyL1 (float) – [optional, default: get_nan32()] L1 regularization coefficient. Default is 0 (not applied)
penaltyL2 (float) – [optional, default: get_nan32()] L2 regularization coefficient. Default is 0 (not applied)
batchIndices (array) – [optional, default: None] Numeric table of size 1 x m where m is batch size that represent a batch of indices used to compute the function results, e.g., value of the sum of the functions. If no indices are provided, all terms will be used in the computations.
featureId (size_t) – [optional, default: -1] The feature index to compute part of gradient/hessian/proximal projection
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Numeric table of size n x p with data
dependentVariables (data_or_file) – Numeric table of size n x 1 with dependent variables
argument (data_or_file) – Numeric table of size 1 x p with input argument of the objective function
optimization_solver_objective_function_result
-Setup (partial) input data for using algorithm object in other algorithms.
-data (data_or_file) – Numeric table of size n x p with data
dependentVariables (data_or_file) – Numeric table of size n x 1 with dependent variables
argument (data_or_file) – Numeric table of size 1 x p with input argument of the objective function
None
-alias of optimization_solver_objective_function_result
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Cross Entropy Loss.
-Examples:
-nClasses (size_t) – Number of classes (different values of dependent variable)
numberOfTerms (size_t) – The number of terms in the function
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the Cross-entropy loss objective function, double or float
method (str) – [optional, default: “defaultDense”] The Cross-entropy loss objective function computation method
interceptFlag (bool) – [optional, default: False] Whether the intercept needs to be computed. Default is true
penaltyL1 (float) – [optional, default: get_nan32()] L1 regularization coefficient. Default is 0 (not applied)
penaltyL2 (float) – [optional, default: get_nan32()] L2 regularization coefficient. Default is 0 (not applied)
batchIndices (array) – [optional, default: None] Numeric table of size 1 x m where m is batch size that represent a batch of indices used to compute the function results, e.g., value of the sum of the functions. If no indices are provided, all terms will be used in the computations.
featureId (size_t) – [optional, default: -1] The feature index to compute part of gradient/hessian/proximal projection
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
Do the actual computation on provided input data.
-data (data_or_file) – Numeric table of size n x p with data
dependentVariables (data_or_file) – Numeric table of size n x 1 with dependent variables
argument (data_or_file) – Numeric table of size 1 x p with input argument of the objective function
optimization_solver_objective_function_result
-Setup (partial) input data for using algorithm object in other algorithms.
-data (data_or_file) – Numeric table of size n x p with data
dependentVariables (data_or_file) – Numeric table of size n x 1 with dependent variables
argument (data_or_file) – Numeric table of size 1 x p with input argument of the objective function
None
-alias of optimization_solver_objective_function_result
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library SGD.
-Examples:
- -function (optimization_solver_sum_of_functions_batch__iface__) – Objective function represented as sum of functions
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the Stochastic gradient descent algorithm,
method (str) – [optional, default: “defaultDense”] Stochastic gradient descent computation method
batchIndices (array) – [optional, default: None] Numeric table that represents 32 bit integer indices of terms in the objective function. If no indices are provided, the implementation will generate random indices.
learningRateSequence (array) – [optional, default: None] Numeric table that contains values of the learning rate sequence
engine (engines_batchbase__iface__) – [optional, default: None] Engine for random generation of 32 bit integer indices of terms in the objective function.
nIterations (size_t) – [optional, default: -1] Maximal number of iterations of the algorithm
accuracyThreshold (double) – [optional, default: get_nan64()] Accuracy of the algorithm. The algorithm terminates when this accuracy is achieved
optionalResultRequired (bool) – [optional, default: False] Indicates whether optional result is required
batchSize (size_t) – [optional, default: -1] Number of batch indices to compute the stochastic gradient. If batchSize is equal to the number of terms in objective function then no random sampling is performed, and all terms are used to calculate the gradient. This parameter is ignored if batchIndices is provided.
conservativeSequence (array) – [optional, default: None] Numeric table of values of the conservative coefficient sequence
innerNIterations (size_t) – [optional, default: -1]
momentum (double) – [optional, default: get_nan64()] Momentum value
Do the actual computation on provided input data.
-inputArgument (data_or_file) – Initial value to start optimization
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library LBFGS.
-Examples:
-function (optimization_solver_sum_of_functions_batch__iface__) – Objective function represented as sum of functions
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the LBFGS algorithm,
method (str) – [optional, default: “defaultDense”] LBFGS computation method
m (size_t) – [optional, default: -1] Memory parameter of LBFGS. The maximum number of correction pairs that define the approximation of inverse Hessian matrix.
L (size_t) – [optional, default: -1] The number of iterations between the curvature estimates calculations
engine (engines_batchbase__iface__) – [optional, default: None] Engine for random choosing terms from objective function.
batchIndices (array) – [optional, default: None]
correctionPairBatchSize (size_t) – [optional, default: -1] Number of observations to compute the sub-sampled Hessian for correction pairs computation
correctionPairBatchIndices (array) – [optional, default: None]
stepLengthSequence (array) – [optional, default: None]
nIterations (size_t) – [optional, default: -1] Maximal number of iterations of the algorithm
accuracyThreshold (double) – [optional, default: get_nan64()] Accuracy of the algorithm. The algorithm terminates when this accuracy is achieved
optionalResultRequired (bool) – [optional, default: False] Indicates whether optional result is required
batchSize (size_t) – [optional, default: -1] Number of batch indices to compute the stochastic gradient. If batchSize is equal to the number of terms in objective function then no random sampling is performed, and all terms are used to calculate the gradient. This parameter is ignored if batchIndices is provided.
Do the actual computation on provided input data.
-inputArgument (data_or_file) – Initial value to start optimization
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library AdaGrad.
-Examples:
-function (optimization_solver_sum_of_functions_batch__iface__) – Objective function represented as sum of functions
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the Adaptive gradient descent algorithm,
method (str) – [optional, default: “defaultDense”] Adaptive gradient descent computation method
batchIndices (array) – [optional, default: None] Numeric table that represents 32 bit integer indices of terms in the objective function. If no indices are provided, the implementation will generate random indices.
learningRate (array) – [optional, default: None] Numeric table that contains value of the learning rate
degenerateCasesThreshold (double) – [optional, default: get_nan64()] Value needed to avoid degenerate cases in square root computing.
engine (engines_batchbase__iface__) – [optional, default: None] Engine for random generation of 32 bit integer indices of terms in the objective function.
nIterations (size_t) – [optional, default: -1] Maximal number of iterations of the algorithm
accuracyThreshold (double) – [optional, default: get_nan64()] Accuracy of the algorithm. The algorithm terminates when this accuracy is achieved
optionalResultRequired (bool) – [optional, default: False] Indicates whether optional result is required
batchSize (size_t) – [optional, default: -1] Number of batch indices to compute the stochastic gradient. If batchSize is equal to the number of terms in objective function then no random sampling is performed, and all terms are used to calculate the gradient. This parameter is ignored if batchIndices is provided.
Do the actual computation on provided input data.
-inputArgument (data_or_file) – Initial value to start optimization
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Stochastic Average Gradient Descent SAGA.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the Stochastic average gradient descent algorithm,
method (str) – [optional, default: “defaultDense”] Stochastic average gradient descent computation method
batchIndices (array) – [optional, default: None] Numeric table that represents 32 bit integer indices of terms in the objective function. If no indices are provided, the implementation will generate random indices.
learningRateSequence (array) – [optional, default: None] Numeric table that contains value of the learning rate
engine (engines_batchbase__iface__) – [optional, default: None] Engine for random generation of 32 bit integer indices of terms in the objective function.
function (optimization_solver_sum_of_functions_batch__iface__) – [optional, default: None] Objective function represented as sum of functions
nIterations (size_t) – [optional, default: -1] Maximal number of iterations of the algorithm
accuracyThreshold (double) – [optional, default: get_nan64()] Accuracy of the algorithm. The algorithm terminates when this accuracy is achieved
optionalResultRequired (bool) – [optional, default: False] Indicates whether optional result is required
batchSize (size_t) – [optional, default: -1] Number of batch indices to compute the stochastic gradient. If batchSize is equal to the number of terms in objective function then no random sampling is performed, and all terms are used to calculate the gradient. This parameter is ignored if batchIndices is provided.
Do the actual computation on provided input data.
-inputArgument (data_or_file) – Initial value to start optimization
gradientsTable (data_or_file) – Numeric table of size p x 1 with the values of G, where each value is an accumulated sum of squares of corresponding gradient’s coordinate values.
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Cosine Distance.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the cosine distance, double or float
method (str) – [optional, default: “defaultDense”] Cosine distance computation method
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Correlation Distance.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the correlation distance algorithm, double or float
method (str) – [optional, default: “defaultDense”] Correlation distance computation method
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Expectation-Maximization.
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Expectation-Maximization Initialization.
-Examples:
- -nComponents (size_t) – Number of components in the Gaussian mixture model
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of initial values for the EM for GMM algorithm, double or float
method (str) – [optional, default: “defaultDense”]
nTrials (size_t) – [optional, default: -1] Number of trials of short EM runs
nIterations (size_t) – [optional, default: -1] Number of iterations in every short EM run
accuracyThreshold (double) – [optional, default: get_nan64()] Threshold for the termination of the algorithm
covarianceStorage (str) – [optional, default: “”] Type of covariance in the Gaussian mixture model.
engine (engines_batchbase__iface__) – [optional, default: None] Engine to be used for randomly generating data points to start the initialization of short EM
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Expectation-Maximization for the Gaussian Mixture Model.
-Examples:
- -nComponents (size_t) – Number of components in the Gaussian mixture model
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the EM for GMM algorithm, double or float
method (str) – [optional, default: “defaultDense”] EM for GMM computation method
maxIterations (size_t) – [optional, default: -1] Maximal number of iterations of the algorithm.
accuracyThreshold (double) – [optional, default: get_nan64()] Threshold for the termination of the algorithm.
regularizationFactor (double) – [optional, default: get_nan64()] Factor for covariance regularization in case of ill-conditional data
covarianceStorage (str) – [optional, default: “”] Type of covariance in the Gaussian mixture model.
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
inputWeights (data_or_file) – Input weights
inputMeans (data_or_file) – Input means
inputCovariances (list_numerictableptr) – Collection of input covariances
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library QR Decomposition.
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library QR Decomposition without pivoting.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the QR decomposition algorithm, double or float
method (str) – [optional, default: “defaultDense”] Computation method of the algorithm
distributed (bool) – [optional, default: False] enable distributed computation (SPMD)
streaming (bool) – [optional, default: False] enable streaming
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Pivoted QR Decomposition.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of the pivoted QR algorithm, double or float
method (str) – [optional, default: “defaultDense”] Computation method
permutedColumns (array) – [optional, default: None] On entry, if i-th element of permutedColumns != 0, * the i-th column of input matrix is moved to the beginning of Data * P before * the computation, and fixed in place during the computation. * If i-th element of permutedColumns = 0, the i-th column of input data * is a free column (that is, it may be interchanged during the * computation with any other free column).
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Normalization.
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Z-Score.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the z-score normalization, double or float
method (str) – [optional, default: “defaultDense”] Z-score normalization computation method
resultsToCompute (str) – [optional, default: “”] 64 bit integer flag that indicates the results to compute
doScale (bool) – [optional, default: False] boolean flag that indicates the mode of computation. If true both centering and scaling, otherwise only centering.
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Min-Max.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the min-max normalization, double or float
method (str) – [optional, default: “defaultDense”] Min-max normalization computation method
lowerBound (double) – [optional, default: get_nan64()] The lower bound of the features value will be obtained during normalization.
upperBound (double) – [optional, default: get_nan64()] The upper bound of the features value will be obtained during normalization.
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Engines.
- - -Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library mt19937.
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of mt19937 engine, double or float
method (str) – [optional, default: “defaultDense”] Computation method of the engine
seed (size_t) – [optional, default: -1] seed
Do the actual computation on provided input data.
-tableToFill (data_or_file) – Input table to fill with random numbers
-alias of engines_result
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library mt2203.
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of mt2203 engine, double or float
method (str) – [optional, default: “defaultDense”] Computation method of the engine
seed (size_t) – [optional, default: -1] seed
Do the actual computation on provided input data.
-tableToFill (data_or_file) – Input table to fill with random numbers
-alias of engines_result
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library mcg59.
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of mcg59 engine, double or float
method (str) – [optional, default: “defaultDense”] Computation method of the engine
seed (size_t) – [optional, default: -1] seed
Do the actual computation on provided input data.
-tableToFill (data_or_file) – Input table to fill with random numbers
-alias of engines_result
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Distributions.
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Bernoulli Distribution.
-Examples:
- -p (double) – Success probability of a trial, value from [0.0; 1.0]
fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of bernoulli distribution, double or float
method (str) – [optional, default: “defaultDense”] Computation method of the distribution
engine (engines_batchbase__iface__) – [optional, default: None] Pointer to the engine
Do the actual computation on provided input data.
-tableToFill (data_or_file) – Input table to fill with random numbers
-distributions_result
-alias of distributions_result
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Normal Distribution.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of normal distribution, double or float
method (str) – [optional, default: “defaultDense”] Computation method of the distribution
a (double) – [optional, default: get_nan64()] Mean
sigma (double) – [optional, default: get_nan64()] Standard deviation
engine (engines_batchbase__iface__) – [optional, default: None] Pointer to the engine
Do the actual computation on provided input data.
-tableToFill (data_or_file) – Input table to fill with random numbers
-distributions_result
-alias of distributions_result
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Uniform Distribution.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of uniform distribution, double or float
method (str) – [optional, default: “defaultDense”] Computation method of the distribution
a (double) – [optional, default: get_nan64()] Left bound a
b (double) – [optional, default: get_nan64()] Right bound b
engine (engines_batchbase__iface__) – [optional, default: None] Pointer to the engine
Do the actual computation on provided input data.
-tableToFill (data_or_file) – Input table to fill with random numbers
-distributions_result
-alias of distributions_result
Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Association Rules.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the association rules algorithm, double or float
method (str) – [optional, default: “apriori”] Association rules algorithm computation method
minSupport (double) – [optional, default: get_nan64()] Minimum support 0.0 <= minSupport < 1.0
minConfidence (double) – [optional, default: get_nan64()] Minimum confidence 0.0 <= minConfidence < 1.0
nUniqueItems (size_t) – [optional, default: -1] Number of unique items
nTransactions (size_t) – [optional, default: -1] Number of transactions
discoverRules (bool) – [optional, default: False] Flag. If true, association rules are built from large itemsets
itemsetsOrder (str) – [optional, default: “”] Format of the resulting itemsets
rulesOrder (str) – [optional, default: “”] Format of the resulting association rules
minItemsetSize (size_t) – [optional, default: -1] Minimum number of items in a large itemset
maxItemsetSize (size_t) – [optional, default: -1] Maximum number of items in a large itemset. Set to zero to not limit the upper boundary for the size of large itemsets
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Properties:
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Cholesky Decomposition.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the Cholesky decomposition algorithm,
method (str) – [optional, default: “defaultDense”] Cholesky decomposition computation method
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Correlation and Variance-Covariance Matrices.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of the correlation or variance-covariance matrix, double or float
method (str) – [optional, default: “defaultDense”] Computation method
outputMatrixType (str) – [optional, default: “”] Type of the computed matrix
distributed (bool) – [optional, default: False] enable distributed computation (SPMD)
streaming (bool) – [optional, default: False] enable streaming
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Implicit Alternating Least Squares.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for implicit ALS model training, double or float
method (str) – [optional, default: “defaultDense”] Implicit ALS training method
nFactors (size_t) – [optional, default: -1] Number of factors
maxIterations (size_t) – [optional, default: -1] Maximum number of iterations of the implicit ALS training algorithm
alpha (double) – [optional, default: get_nan64()] Confidence parameter of the implicit ALS training algorithm
lambda (double) – [optional, default: get_nan64()] Regularization parameter
preferenceThreshold (double) – [optional, default: get_nan64()] Threshold used to define preference values
Do the actual computation on provided input data.
-data (data_or_file) – Input data table that contains ratings
inputModel (implicit_als_modelptr) – Initial model that contains initialized factors
Properties:
-Numpy array
-Numpy array
-fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for implicit ALS model-based prediction, double or float
method (str) – [optional, default: “defaultDense”] Implicit ALS prediction method
nFactors (size_t) – [optional, default: -1] Number of factors
maxIterations (size_t) – [optional, default: -1] Maximum number of iterations of the implicit ALS training algorithm
alpha (double) – [optional, default: get_nan64()] Confidence parameter of the implicit ALS training algorithm
lambda (double) – [optional, default: get_nan64()] Regularization parameter
preferenceThreshold (double) – [optional, default: get_nan64()] Threshold used to define preference values
Do the actual computation on provided input data.
-model (implicit_als_modelptr) – Input model trained by the ALS algorithm
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Moments of Low Order.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations of the low order moments, double or float
method (str) – [optional, default: “defaultDense”] Computation method of the algorithm
estimatesToCompute (str) – [optional, default: “”] Estimates to be computed by the algorithm
distributed (bool) – [optional, default: False] enable distributed computation (SPMD)
streaming (bool) – [optional, default: False] enable streaming
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Properties:
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Numpy array
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Quantiles.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the quantile algorithms, double or float
method (str) – [optional, default: “defaultDense”] Quantiles computation method
quantileOrders (array) – [optional, default: None] Numeric table with quantile orders. Default value is 0.5 (median)
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library SVD.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the SVD algorithm, double or float
method (str) – [optional, default: “defaultDense”] SVD computation method
leftSingularMatrix (str) – [optional, default: “”] Format of the matrix of left singular vectors >
rightSingularMatrix (str) – [optional, default: “”] Format of the matrix of right singular vectors >
distributed (bool) – [optional, default: False] enable distributed computation (SPMD)
streaming (bool) – [optional, default: False] enable streaming
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Parameters and semantics are described in Intel(R) oneAPI Data Analytics Library Sorting.
-Examples:
- -fptype (str) – [optional, default: “double”] Data type to use in intermediate computations for the sorting, double or float
method (str) – [optional, default: “defaultDense”] Sorting computation method
Do the actual computation on provided input data.
-data (data_or_file) – Input data table
-Examples:
- -The daal4py algorithms documentation has moved. You should be redirected automatically to the API reference. If not, please visit:
+ - \ No newline at end of file + diff --git a/daal4py/contents.html b/daal4py/contents.html old mode 100755 new mode 100644 index 0312250..e2a7296 --- a/daal4py/contents.html +++ b/daal4py/contents.html @@ -1,218 +1,14 @@ - + - - - -Note
-Scikit-learn patching functionality in daal4py was deprecated and moved to a separate package, Intel(R) Extension for Scikit-learn*. -All future patches will be available only in Intel(R) Extension for Scikit-learn*. Use the scikit-learn-intelex package instead of daal4py for the scikit-learn acceleration.
-Contents:
-The daal4py documentation has moved. You should be redirected automatically. If not, please visit:
+ - \ No newline at end of file + diff --git a/daal4py/data.html b/daal4py/data.html old mode 100755 new mode 100644 index 32dc657..1fd8f9b --- a/daal4py/data.html +++ b/daal4py/data.html @@ -1,176 +1,14 @@ - + - - - -Note
-Scikit-learn patching functionality in daal4py was deprecated and moved to a separate package, Intel(R) Extension for Scikit-learn*. -All future patches will be available only in Intel(R) Extension for Scikit-learn*. Use the scikit-learn-intelex package instead of daal4py for the scikit-learn acceleration.
-All array arguments to compute functions and to algorithm constructors can be -provided in different formats. daal4py will automatically do its best to work on -the provided data with minimal overhead, most notably without copying the data.
-daal4py can directly handle all types of numpy arrays with numerical data -without copying the entire data. Arrays can be homogeneous (e.g. simple dtype) or -heterogeneous (structured array) as well as contiguous or non-contiguous.
-daal4py directly accepts pandas DataFrames with columns of numerical data. No -extra full copy is required.
-daal4py can directly handle matrices of type scipy.sparse.csr_matrix without -copying the entire data.
-Note: some algorithms can be configured to use an optimized compute path for CSR -data. It is required to explicitly specify the CSR method, otherwise the default -and less efficient method is used.
-The compute functions daal4py’s algorithms additionally accept -CSV-filenames. Internally, daal4py will use DAAL’s fast CSV reader to create -contiguous homogeneous tables.
-The data handling documentation has moved. You should be redirected automatically to the API reference. If not, please visit:
+ - \ No newline at end of file + diff --git a/daal4py/examples.html b/daal4py/examples.html old mode 100755 new mode 100644 index 7a83945..54d979c --- a/daal4py/examples.html +++ b/daal4py/examples.html @@ -1,287 +1,14 @@ - + - - - -Note
-Scikit-learn patching functionality in daal4py was deprecated and moved to a separate package, Intel(R) Extension for Scikit-learn*. -All future patches will be available only in Intel(R) Extension for Scikit-learn*. Use the scikit-learn-intelex package instead of daal4py for the scikit-learn acceleration.
-Below are examples on how to utilize daal4py for various usage styles.
-Building models from Gradient Boosting frameworks
- -Principal Component Analysis (PCA) Transform
- -Singular Value Decomposition (SVD)
- -Moments of Low Order
- -Correlation and Variance-Covariance Matrices
- -Decision Forest Classification
-Single-Process Decision Forest Classification Default Dense method
Single-Process Decision Forest Classification Histogram method
Decision Tree Classification
- -Gradient Boosted Classification
- -k-Nearest Neighbors (kNN)
- -Multinomial Naive Bayes
- -Support Vector Machine (SVM)
- -Logistic Regression
- -Decision Forest Regression
- -Gradient Boosted Regression
- -Linear Regression
- -Ridge Regression
- -K-Means Clustering
- -Multivariate Outlier Detection
- -Univariate Outlier Detection
- -Optimization Solvers-Mean Squared Error Algorithm (MSE)
- -Logistic Loss
- -Stochastic Gradient Descent Algorithm
-Limited-Memory Broyden-Fletcher-Goldfarb-Shanno Algorithm
- -Adaptive Subgradient Method
- -Cosine Distance Matrix
- -Correlation Distance Matrix
- -Trees
- -The examples documentation has moved. You should be redirected automatically. If not, please visit:
+ - \ No newline at end of file + diff --git a/daal4py/genindex.html b/daal4py/genindex.html old mode 100755 new mode 100644 index 54c6a39..060ef5c --- a/daal4py/genindex.html +++ b/daal4py/genindex.html @@ -1,1287 +1,14 @@ - + - - -| - | - |
| - | - |
| - | - |
| - | - |
| - | - |
| - | - |
| - |
| - | - |
| - | - |
The daal4py index has moved. You should be redirected automatically to the API reference. If not, please visit:
+ - \ No newline at end of file + diff --git a/daal4py/index.html b/daal4py/index.html index 56fad40..0f067bc 100755 --- a/daal4py/index.html +++ b/daal4py/index.html @@ -1,333 +1,15 @@ - + - - - -Note
-Scikit-learn patching functionality in daal4py was deprecated and moved to a separate package, Intel(R) Extension for Scikit-learn*. -All future patches will be available only in Intel(R) Extension for Scikit-learn*. Use the scikit-learn-intelex package instead of daal4py for the scikit-learn acceleration.
-Daal4py makes your Machine Learning algorithms in Python lightning fast and easy to use. It provides -highly configurable Machine Learning kernels, some of which support streaming input data and/or can -be easily and efficiently scaled out to clusters of workstations. Internally it uses Intel(R) -oneAPI Data Analytics Library to deliver the best performance.
-daal4py was created to give data scientists the easiest way to utilize Intel(R) oneAPI Data Analytics -Library powerful machine learning building blocks directly in a high-productivity manner. A -simplified API gives high-level abstractions to the user with minimal boilerplate, allowing for -quick to write and easy to maintain code when utilizing Jupyter Notebooks. For scaling capabilities, -daal4py also provides the ability to do distributed machine learning, giving a quick way to scale -out. Its streaming mode provides a flexible mechanism for processing large amounts of data and/or -non-contiguous input data.
-For framework designers, daal4py has been fashioned to be built under other frameworks from both an -API and feature perspective. The machine learning models split the training and inference classes, -allowing the model to be exported and serialized if desired. This design also gives the flexibility -to work directly with the model and associated primitives, allowing one to customize the behavior of -the model itself. The daal4py package can be built with customized algorithm loadouts, allowing for -a smaller footprint of dependencies when necessary.
-As an example of the type of API that would be used in a data science context, -the linear regression workflow is showcased below:
-import daal4py as d4p
-# train, test, and target are Pandas dataframes
-
-d4p_lm = d4p.linear_regression_training(interceptFlag=True)
-lm_trained = d4p_lm.compute(train, target)
-
-lm_predictor_component = d4p.linear_regression_prediction()
-result = lm_predictor_component.compute(test, lm_trained.model)
-In the example above, it can be seen that model is divided into training and -prediction. This gives flexibility when writing custom grid searches and custom -functions that modify model behavior or use it as a parameter. Daal4py also -allows for direct usage of NumPy arrays and pandas DataFrames instead of oneDAL -NumericTables, which allow for better integration with the pandas/NumPy/SciPy stack.
-Daal4py machine learning algorithms are constructed with a rich set of -parameters. Assuming we want to find the initial set of centroids for kmeans, -we first create an algorithm and configure it for 10 clusters using the ‘PlusPlus’ method:
-kmi = kmeans_init(10, method="plusPlusDense")
-Assuming we have all our data in a CSV file we can now call it:
-result = kmi.compute('data.csv')
-Our result will hold the computed centroids in the ‘centroids’ attribute:
-print(result.centroids)
-The full example could look like this:
-from daal4py import kmeans_init
-result = kmeans_init(10, method="plusPlusDense").compute('data.csv')
-print(result.centroids)
-One can even run this on a cluster by simply -adding initializing/finalizing the network and adding a keyword-parameter:
-from daal4py import daalinit, daalfini, kmeans_init
-daalinit()
-result = kmeans_init(10, method="plusPlusDense", distributed=True).compute(my_file)
-daalfini()
-Last but not least, daal4py allows getting input data from streams:
-from daal4py import svd
-algo = svd(streaming=True)
-for input in stream_or_filelist:
- algo.compute(input)
-result = algo.finalize()
-daal4py oneAPI and GPU support is deprecated. Use scikit-learn-intelex -instead.
-The design of daal4py utilizes several different technologies to deliver Intel(R) oneAPI Data -Analytics Library performance in a flexible design to Data Scientists and Framework designers. The -package uses Jinja templates to generate Cython-wrapped oneDAL C++ headers, with Cython as a bridge -between the generated oneDAL code and the Python layer. This design allows for quicker development -cycles and acts as a reference design to those looking to tailor their build of daal4py. Cython -also allows for good Python behavior, both for compatibility to different frameworks and for -pickling and serialization.
-Besides superior (e.g. close to native C++ Intel(R) oneAPI Data Analytics Library) performance on a -single node, the distribution mechanics of daal4py provides excellent strong and weak scaling. It -nicely handles distributing a fixed input size on increasing clusters sizes (strong scaling: orange) -which addresses possible response time requirements. It also scales with growing input size (weak -scaling: yellow) which is needed if the data no longer fits into memory of a single node.
-
-On a 32-node cluster (1280 cores) daal4py computed linear regression -of 2.15 TB of data in 1.18 seconds and 68.66 GB of data in less than -48 milliseconds.
-
-On a 32-node cluster (1280 cores) daal4py computed K-Means (10 -clusters) of 1.12 TB of data in 107.4 seconds and 35.76 GB of data -in 4.8 seconds.
-Configuration: Intel(R) Xeon(R) Gold 6148 CPU @ 2.40GHz, EIST/Turbo on 2 -sockets, 20 cores per socket, 192 GB RAM, 16 nodes connected with Infiniband, -Oracle Linux Server release 7.4, using 64-bit floating point numbers
-daal4py is available at the Python Package Index, -on Anaconda Cloud in Conda Forge channel -and in Intel channel. -Sources and build instructions are available in -daal4py repository.
-The daal4py package is available via same distribution channels and platforms as scikit-learn-intelex. -See -scikit-learn-intelex requirements <https://intel.github.io/scikit-learn-intelex/latest/system-requirements.html> _
-Install from PyPI:
-pip install daal4py
-Install from Anaconda Cloud: Conda-Forge channel:
-сonda install daal4py -c conda-forge
-Install using conda from the Intel repository:
-conda install daal4py -c https://software.repos.intel.com/python/conda/
-We recommend to use PyPi. If you are using Intel® Distribution for Python, -we recommend using conda from the Intel Repository. -In other cases, use Anaconda Cloud: conda-forge channel.
-All algorithms in daal4py work the same way:
-Instantiate and parameterize
Run/compute on input data
The below tables list the accepted arguments. Those with no default (None) are
-required arguments. All other arguments with defaults are optional and can be
-provided as keyword arguments (like optarg=77). Each algorithm returns a
-class-like object with properties as its result.
For algorithms with training and prediction, simply extract the model
-property from the result returned by the training and pass it in as the (second)
-input argument.
Note that all input objects and the result/model properties are native types, -e.g. standard types (integer, float, Numpy arrays, Pandas DataFrames, -…). Additionally, if you provide the name of a csv-file as an input argument -daal4py will work on the entire file content.
-Tip
-We recommend using -the ‘scikit-learn-intelex package patching <https://intel.github.io/scikit-learn-intelex/latest/what-is-patching.html>’ _ for the scikit-learn patching.
-daal4py exposes some oneDAL solvers using a scikit-learn compatible API.
-daal4py can furthermore monkey-patch the sklearn package to use the DAAL
-solvers as drop-in replacement without any code change.
Please refer to the section on scikit-learn API and patching -for more details.
-The daal4py documentation has moved. You should be redirected automatically. If not, please visit:
+https://uxlfoundation.github.io/scikit-learn-intelex/2025.5/about_daal4py.html
+Note: daal4py is now part of the scikit-learn-intelex package and has been deprecated in favor of sklearnex.
- \ No newline at end of file + diff --git a/daal4py/model-builders.html b/daal4py/model-builders.html index b927b07..7926fcd 100644 --- a/daal4py/model-builders.html +++ b/daal4py/model-builders.html @@ -1,273 +1,14 @@ - + - - - -Note
-Scikit-learn patching functionality in daal4py was deprecated and moved to a separate package, Intel(R) Extension for Scikit-learn*. -All future patches will be available only in Intel(R) Extension for Scikit-learn*. Use the scikit-learn-intelex package instead of daal4py for the scikit-learn acceleration.
-Gradient boosting on decision trees is one of the most accurate and efficient -machine learning algorithms for classification and regression. -The most popular implementations of it are:
-XGBoost*
LightGBM*
CatBoost*
daal4py Model Builders deliver the accelerated -models inference of those frameworks. The inference is performed by the oneDAL GBT implementation tuned -for the best performance on the Intel(R) Architecture.
-Note
-Currently, experimental support for XGBoost* and LightGBM* categorical data is not supported. -For the model conversion to work with daal4py, convert non-numeric data to numeric data -before training and converting the model.
-The first step is to convert already trained model. The -API usage for different frameworks is the same:
-XGBoost:
-import daal4py as d4p
-d4p_model = d4p.mb.convert_model(xgb_model)
-LightGBM:
-import daal4py as d4p
-d4p_model = d4p.mb.convert_model(lgb_model)
-CatBoost:
-import daal4py as d4p
-d4p_model = d4p.mb.convert_model(cb_model)
-Note
-Convert model only once and then use it for the inference.
-The API is the same for classification and regression inference.
-Based on the original model passed to the convert_model(), d4p_prediction is either the classification or regression output.
----d4p_prediction = d4p_model.predict(test_data) -
Here, the predict() method of d4p_model is being used to make predictions on the test_data dataset.
-The d4p_prediction variable stores the predictions made by the predict() method.
SHAP contribution and interaction value calculation are natively supported by models created with daal4py Model Builders.
-For these models, the predict() method takes additional keyword arguments:
----d4p_model.predict(test_data, pred_contribs=True) # for SHAP contributions -d4p_model.predict(test_data, pred_interactions=True) # for SHAP interactions -
The returned prediction has the shape:
----
-- -
(n_rows, n_features + 1)for SHAP contributions- -
(n_rows, n_features + 1, n_features + 1)for SHAP interactions
Here, n_rows is the number of rows (i.e., observations) in
-test_data, and n_features is the number of features in the dataset.
The prediction result for SHAP contributions includes a feature attribution value for each feature and a bias term for each observation.
-The prediction result for SHAP interactions comprises (n_features + 1) x (n_features + 1) values for all possible
-feature combinations, along with their corresponding bias terms.
Note
-The shapes of SHAP contributions and interactions are consistent with the XGBoost results. -In contrast, the SHAP Python package drops bias terms, resulting -in SHAP contributions (SHAP interactions) with one fewer column (one fewer column and row) per observation.
-You can also use the scikit-learn-style classes GBTDAALClassifier and GBTDAALRegressor to convert and infer your models. For example:
from daal4py.sklearn.ensemble import GBTDAALRegressor
-reg = xgb.XGBRegressor()
-reg.fit(X, y)
-d4p_predt = GBTDAALRegressor.convert_model(reg).predict(X)
-Model Builders support only base inference with prediction and probabilities prediction. The functionality is to be extended. -Therefore, there are the following limitations: -- The categorical features are not supported for conversion and prediction. -- The multioutput models are not supported for conversion and prediction. -- SHAP values can be calculated for regression models only.
-Model Builders models conversion
- -The model builders documentation has moved. You should be redirected automatically. If not, please visit:
+Serving GBT Models from Other Libraries
- \ No newline at end of file + diff --git a/daal4py/objects.inv b/daal4py/objects.inv deleted file mode 100755 index 052223d..0000000 Binary files a/daal4py/objects.inv and /dev/null differ diff --git a/daal4py/scaling.html b/daal4py/scaling.html old mode 100755 new mode 100644 index a06d5eb..4c51fdc --- a/daal4py/scaling.html +++ b/daal4py/scaling.html @@ -1,243 +1,14 @@ - + - - - -Note
-Scikit-learn patching functionality in daal4py was deprecated and moved to a separate package, Intel(R) Extension for Scikit-learn*. -All future patches will be available only in Intel(R) Extension for Scikit-learn*. Use the scikit-learn-intelex package instead of daal4py for the scikit-learn acceleration.
-daal4py operates in SPMD style (Single Program Multiple Data), which means your -program is executed on several processes (e.g. similar to MPI). The use of MPI is -not required for daal4py’s SPMD-mode to work, all necessary communication and -synchronization happens under the hood of daal4py. It is possible to use daal4py and -mpi4py in the same program, though.
-Only very minimal changes are needed to your daal4py code to allow daal4py to -run on a cluster of workstations. Initialize the distribution engine:
-daalinit()
-Add the distribution parameter to the algorithm construction:
-kmi = kmeans_init(10, method="plusPlusDense", distributed=True)
-When calling the actual computation each process expects an input file or input -array/DataFrame. Your program needs to tell each process which -file/array/DataFrame it should operate on. Like with other SPMD programs this is -usually done conditionally on the process id/rank (‘daal4py.my_procid()’). Assume -we have one file for each process, all having the same prefix ‘file’ and being -suffixed by a number. The code could then look like this:
-result = kmi.compute("file{}.csv", daal4py.my_procid())
-The result of the computation will now be available on all processes.
-Finally stop the distribution engine:
-daalfini()
-That’s all for the python code:
-from daal4py import daalinit, daalfini, kmeans_init
-daalinit()
-kmi = kmeans_init(10, method="plusPlusDense", distributed=True)
-result = kmi.compute("file{}.csv", daal4py.my_procid())
-daalfini()
-To actually get it executed on several processes use standard MPI mechanics, -like:
-mpirun -n 4 python ./kmeans.py
-The binaries provided by Intel use the Intel® MPI library, but -daal4py can also be compiled for any other MPI implementation.
-The following algorithms support distribution:
-PCA (pca)
-SVD (svd)
-Linear Regression Training (linear_regression_training)
- -Ridge Regression Training (ridge_regression_training)
- -Multinomial Naive Bayes Training (multinomial_naive_bayes_training)
-K-Means (kmeans_init and kmeans)
-Correlation and Variance-Covariance Matrices (covariance)
-Moments of Low Order (low_order_moments)
- -QR Decomposition (qr)
-The distributed/scaling documentation has moved. You should be redirected automatically. If not, please visit:
+Distributed Mode (daal4py, CPU)
- \ No newline at end of file + diff --git a/daal4py/search.html b/daal4py/search.html old mode 100755 new mode 100644 index 06bb76c..5215a77 --- a/daal4py/search.html +++ b/daal4py/search.html @@ -1,148 +1,15 @@ - + - - -The daal4py documentation has moved. You should be redirected automatically. If not, please visit:
+ +Use the search function on the new documentation site to find what you need.
- \ No newline at end of file + diff --git a/daal4py/searchindex.js b/daal4py/searchindex.js deleted file mode 100755 index 18aacda..0000000 --- a/daal4py/searchindex.js +++ /dev/null @@ -1,2 +0,0 @@ -Search.setIndex({"docnames": ["algorithms", "contents", "data", "examples", "index", "model-builders", "scaling", "sklearn", "streaming"], "filenames": ["algorithms.rst", "contents.rst", "data.rst", "examples.rst", "index.rst", "model-builders.rst", "scaling.rst", "sklearn.rst", "streaming.rst"], "titles": ["Algorithms", "Contents", "Input Data", "Examples", "Fast, Scalable and Easy Machine Learning With DAAL4PY", "Model Builders for the Gradient Boosting Frameworks", "Scaling on Distributed Memory (Multiprocessing)", "Scikit-Learn API and patching", "Streaming Data"], "terms": {"scikit": [0, 1, 2, 3, 6, 8], "learn": [0, 1, 2, 3, 6, 8], "patch": [0, 1, 2, 3, 5, 6, 8], "daal4pi": [0, 1, 2, 3, 5, 6, 7, 8], "wa": [0, 1, 2, 3, 4, 5, 6, 7, 8], "deprec": [0, 1, 2, 3, 4, 5, 6, 8], "move": [0, 1, 2, 3, 4, 5, 6, 7, 8], "separ": [0, 1, 2, 3, 4, 5, 6, 7, 8], "packag": [0, 1, 2, 3, 4, 5, 6, 7, 8], "intel": [0, 1, 2, 3, 4, 5, 6, 7, 8], "r": [0, 1, 2, 3, 4, 5, 6, 7, 8], "extens": [0, 1, 2, 3, 4, 5, 6, 7, 8], "all": [0, 1, 2, 3, 4, 5, 6, 7, 8], "futur": [0, 1, 2, 3, 4, 5, 6, 7, 8], "avail": [0, 1, 2, 3, 4, 5, 6, 7, 8], "onli": [0, 1, 2, 3, 4, 5, 6, 7, 8], "us": [0, 1, 2, 3, 4, 5, 6, 7, 8], "intelex": [0, 1, 2, 3, 4, 5, 6, 7, 8], "instead": [0, 1, 2, 3, 4, 5, 6, 7, 8], "acceler": [0, 1, 2, 3, 4, 5, 6, 8], "see": [0, 4], "also": [0, 4, 5, 6, 7, 8], "oneapi": [0, 1, 7], "data": [0, 1, 5, 6, 7], "analyt": [0, 4, 7], "librari": [0, 4, 6, 7], "paramet": [0, 4, 6, 7], "semant": 0, "ar": [0, 3, 4, 5, 6, 7], "describ": 0, "exampl": [0, 1, 4, 7], "singl": [0, 3, 4, 6], "process": [0, 3, 4, 6, 8], "default": [0, 2, 3, 4], "dens": [0, 3, 7], "histogram": [0, 3], "class": [0, 3, 4, 5, 7], "decision_forest_classification_train": 0, "nclass": 0, "size_t": 0, "fptype": 0, "str": 0, "option": [0, 4], "doubl": 0, "type": [0, 2, 4], "intermedi": 0, "comput": [0, 2, 4, 6, 8], "float": [0, 4], "defaultdens": 0, "resultstoevalu": 0, "64": [0, 4], "bit": [0, 4], "integ": [0, 4], "flag": [0, 7], "indic": [0, 7], "result": [0, 4, 5, 6, 8], "ntree": 0, "1": [0, 4, 5, 7], "i": [0, 2, 4, 5, 6, 7, 8], "10": [0, 4, 6], "observationspertreefract": 0, "get_nan64": 0, "fraction": 0, "observ": [0, 5, 7], "train": [0, 4, 5, 6, 8], "one": [0, 4, 5, 6, 7], "0": [0, 7], "sampl": 0, "replac": [0, 4], "featurespernod": 0, "featur": [0, 4, 5, 7], "tri": 0, "possibl": [0, 4, 5, 6, 7], "split": [0, 4], "per": [0, 4, 5], "node": [0, 4], "If": [0, 4, 7], "sqrt": 0, "p": [0, 7], "3": 0, "where": 0, "total": 0, "maxtreedepth": 0, "depth": 0, "unlimit": 0, "minobservationsinleafnod": 0, "minim": [0, 2, 4, 6], "leaf": 0, "5": [0, 7], "engines_batchbase__iface__": 0, "none": [0, 4, 7], "gener": [0, 1, 4, 8], "impuritythreshold": 0, "threshold": 0, "stop": [0, 6], "criteria": 0, "impur": 0, "smaller": [0, 4], "than": [0, 4, 8], "anymor": 0, "varimport": 0, "variabl": [0, 5, 7], "import": [0, 4, 5, 6, 7], "mode": [0, 1, 4, 6, 8], "resultstocomput": 0, "memorysavingmod": 0, "bool": 0, "fals": [0, 7], "true": [0, 4, 5, 6, 7, 8], "save": 0, "slower": 0, "bootstrap": 0, "set": [0, 4, 7], "whole": 0, "minobservationsinsplitnod": 0, "2": [0, 4, 7], "minweightfractioninleafnod": 0, "The": [0, 2, 4, 5, 6, 7, 8], "minimum": 0, "weight": 0, "sum": 0, "input": [0, 4, 6, 8], "requir": [0, 2, 4, 6], "minimpuritydecreaseinsplitnod": 0, "A": [0, 4], "thi": [0, 4, 6, 7, 8], "induc": 0, "decreas": 0, "greater": 0, "equal": 0, "non": [0, 2, 4, 5], "neg": 0, "maxleafnod": 0, "maximum": 0, "maxbin": 0, "hist": 0, "find": [0, 4, 7], "discret": 0, "bin": 0, "bucket": 0, "continu": 0, "256": 0, "increas": [0, 4], "higher": 0, "cost": 0, "minbins": 0, "splitter": 0, "best": [0, 2, 4, 5], "binningstrategi": 0, "strategi": 0, "group": 0, "point": [0, 4], "allow": [0, 4, 6, 7, 8], "label": 0, "do": [0, 2, 4, 7], "actual": [0, 6, 8], "provid": [0, 2, 4, 6, 7, 8], "data_or_fil": 0, "return": [0, 4, 5], "decision_forest_classification_training_result": 0, "properti": [0, 4], "decision_forest_classification_model": 0, "outofbagerror": 0, "numpi": [0, 1, 4], "arrai": [0, 1, 4, 6, 8], "outofbagerroraccuraci": 0, "outofbagerrordecisionfunct": 0, "outofbagerrorperobserv": 0, "variableimport": 0, "decision_forest_classification_predict": 0, "decision_forest": 0, "votingmethod": 0, "decision_forest_classification_modelptr": 0, "classifier_prediction_result": 0, "logprob": 0, "predict": [0, 4, 5], "probabl": [0, 5], "nfeatur": 0, "numberofclass": 0, "numberoffeatur": 0, "numberoftre": 0, "decision_tree_classification_train": 0, "prune": 0, "can": [0, 2, 4, 5, 6, 7, 8], "ani": [0, 4, 6], "posit": 0, "nbin": 0, "belong": 0, "current": [0, 5, 7], "version": [0, 7], "splitcriterion": 0, "criterion": [0, 7], "dataforprun": 0, "labelsforprun": 0, "decision_tree_classification_training_result": 0, "decision_tree_classification_model": 0, "decision_tree_classification_predict": 0, "batch": 0, "decision_tree_classification_modelptr": 0, "gbt_classification_train": 0, "variableimportancemod": 0, "splitmethod": 0, "exact": 0, "maxiter": 0, "50": 0, "6": 0, "rate": 0, "procedur": 0, "scale": [0, 4, 7], "contribut": [0, 5], "each": [0, 4, 5, 6], "factor": 0, "minsplitloss": 0, "regular": 0, "reduct": [0, 7], "make": [0, 4, 5], "further": 0, "partit": 0, "rang": 0, "inf": 0, "lambda": 0, "l2": 0, "entir": [0, 2, 4], "dataset": [0, 5, 7], "inexact": 0, "internalopt": 0, "int": 0, "intern": [0, 2, 4], "gbt_classification_training_result": 0, "gbt_classification_model": 0, "variableimportancebycov": 0, "variableimportancebygain": 0, "variableimportancebytotalcov": 0, "variableimportancebytotalgain": 0, "variableimportancebyweight": 0, "gbt_classification_predict": 0, "gbt": [0, 5], "niter": 0, "gbt_classification_modelptr": 0, "predictionbia": 0, "kdtree_knn_classification_train": 0, "kd": 0, "datauseinmodel": 0, "enabl": [0, 7], "disabl": [0, 7], "an": [0, 2, 4, 5, 6, 7, 8], "usag": [0, 1, 5], "choos": 0, "element": 0, "from": [0, 3, 4, 5, 6, 7, 8], "voteweight": 0, "kdtree_knn_classification_training_result": 0, "kdtree_knn_classification_model": 0, "kdtree_knn_classification_predict": 0, "kdtree_knn_classification_modelptr": 0, "kdtree_knn_classification_prediction_result": 0, "bf_knn_classification_train": 0, "bf": 0, "bf_knn_classification_training_result": 0, "bf_knn_classification_model": 0, "bf_knn_classification_predict": 0, "bf_knn_classification_modelptr": 0, "bf_knn_classification_prediction_result": 0, "adaboost_train": 0, "weaklearnertrain": 0, "classifier_training_batch__iface__": 0, "weaklearnerpredict": 0, "classifier_prediction_batch__iface__": 0, "accuracythreshold": 0, "accuraci": 0, "learningr": 0, "multipli": 0, "classifi": 0, "shrink": 0, "its": [0, 2, 4], "adaboost_training_result": 0, "adaboost_model": 0, "weaklearnerserror": 0, "adaboost_predict": 0, "adaboost_modelptr": 0, "alpha": 0, "numberofweaklearn": 0, "weaklearnermodel": 0, "idx": 0, "classifier_model": 0, "deriv": 0, "brownboost_train": 0, "newtonraphsonaccuracythreshold": 0, "newton": [0, 7], "raphson": 0, "newtonraphsonmaxiter": 0, "degeneratecasesthreshold": 0, "need": [0, 4, 6], "avoid": 0, "degener": 0, "case": [0, 4, 8], "brownboost_training_result": 0, "brownboost_model": 0, "brownboost_predict": 0, "brownboost_modelptr": 0, "logitboost_train": 0, "friedman": 0, "regression_training_batch__iface__": 0, "regression_prediction_batch__iface__": 0, "term": [0, 5], "addit": [0, 5, 7], "weightsdegeneratecasesthreshold": 0, "when": [0, 4, 6, 8], "calcul": [0, 1], "w": 0, "responsesdegeneratecasesthreshold": 0, "respons": [0, 4], "logitboost_training_result": 0, "logitboost_model": 0, "logitboost_predict": 0, "logitboost_modelptr": 0, "regression_model": 0, "stump_classification_train": 0, "stump_classification_training_result": 0, "stump_classification_model": 0, "stump_classification_predict": 0, "stump_classification_modelptr": 0, "leftvalu": 0, "rightvalu": 0, "splitfeatur": 0, "splitvalu": 0, "stream": [0, 1, 3, 4], "multi": [0, 3, 7], "multinomial_naive_bayes_train": [0, 6, 8], "priorclassestim": 0, "prior": 0, "estim": [0, 7], "imagin": 0, "occurr": 0, "word": 0, "spmd": [0, 6], "multinomial_naive_bayes_training_result": 0, "multinomial_naive_bayes_model": 0, "multinomial_naive_bayes_predict": 0, "multinomial_naive_bayes_modelptr": 0, "auxtabl": 0, "logp": 0, "logtheta": 0, "note": [0, 2, 4], "For": [0, 4, 5, 7, 8], "format": [0, 2], "svm_train": 0, "boser": 0, "c": [0, 4, 7], "upper": 0, "bound": 0, "constraint": 0, "quadrat": 0, "problem": 0, "tau": 0, "work": [0, 2, 4, 5, 6], "scheme": 0, "caches": 0, "size": [0, 4], "cach": 0, "byte": 0, "store": [0, 5], "kernel": [0, 4, 7], "zero": 0, "techniqu": 0, "doshrink": 0, "shrinkingstep": 0, "between": [0, 4], "step": [0, 5], "kernel_function_kerneliface__iface__": 0, "svm_training_result": 0, "svm_model": 0, "svm_predict": 0, "svm_modelptr": 0, "bia": [0, 5], "classificationcoeffici": 0, "supportindic": 0, "supportvector": 0, "binari": [0, 3, 6], "logistic_regression_train": 0, "interceptflag": [0, 4], "whether": [0, 7], "intercept": 0, "penaltyl1": 0, "get_nan32": 0, "l1": 0, "coeffici": 0, "appli": [0, 7], "penaltyl2": 0, "optimizationsolv": 0, "optimization_solver_iterative_solver_batch__iface__": 0, "sgd": [0, 3], "momentum": 0, "logistic_regression_training_result": 0, "logistic_regression_model": 0, "logistic_regression_predict": 0, "logistic_regression_modelptr": 0, "beta": 0, "numberofbeta": 0, "decision_forest_regression_train": 0, "dependentvari": 0, "tabl": [0, 2, 4], "depend": [0, 4, 7], "decision_forest_regression_training_result": 0, "decision_forest_regression_model": 0, "outofbagerrorpredict": 0, "outofbagerrorr2": 0, "decision_forest_regression_predict": 0, "decision_forest_regression_modelptr": 0, "decision_forest_regression_prediction_result": 0, "decision_tree_regression_train": 0, "dependentvariablesforprun": 0, "decision_tree_regression_training_result": 0, "decision_tree_regression_model": 0, "decision_tree_regression_predict": 0, "decision_tree_regression_modelptr": 0, "decision_tree_regression_prediction_result": 0, "gbt_regression_train": 0, "gbt_regression_training_result": 0, "gbt_regression_model": 0, "gbt_regression_predict": 0, "gbt_regression_modelptr": 0, "gbt_regression_prediction_result": 0, "linear_regression_train": [0, 4, 6, 8], "normeqdens": 0, "linear_regression_training_result": 0, "linear_regression_model": 0, "linear_regression_predict": [0, 4], "linear_regression_modelptr": 0, "linear_regression_prediction_result": 0, "numberofrespons": 0, "lasso": [0, 7], "lasso_regression_train": 0, "lassoparamet": 0, "numer": [0, 2, 5], "contain": [0, 7], "coordin": 0, "datauseincomput": 0, "corrupt": 0, "optresulttocomput": 0, "grammatrix": 0, "numerict": [0, 4], "x": [0, 5, 7], "n": [0, 6], "last": [0, 4, 7], "lasso_regression_training_result": 0, "grammatrixid": 0, "lasso_regression_model": 0, "lasso_regression_predict": 0, "lasso_regression_modelptr": 0, "lasso_regression_prediction_result": 0, "ridge_regression_train": [0, 6, 8], "ridgeparamet": 0, "ridge_regression_training_result": 0, "ridge_regression_model": 0, "ridge_regression_predict": 0, "ridge_regression_modelptr": 0, "ridge_regression_prediction_result": 0, "stump_regression_train": 0, "some": [0, 2, 4], "skip": 0, "backward": 0, "compat": [0, 4, 7], "stump_regression_training_result": 0, "stump_regression_model": 0, "stump_regression_predict": 0, "stump_regression_modelptr": 0, "stump_regression_prediction_result": 0, "correlationdens": 0, "ncompon": 0, "reduc": 0, "implement": [0, 5, 6, 7], "isdeterminist": 0, "sign": 0, "flip": 0, "doscal": 0, "iscorrel": 0, "normalization_zscore_batchimpl__iface__": 0, "pointer": 0, "pca_result": 0, "datafortransform": 0, "eigenvalu": 0, "eigenvector": 0, "pca_transform": 0, "dict_numerictableptr": 0, "pca_transform_result": 0, "transformeddata": 0, "kmeans_init": [0, 4, 6], "ncluster": 0, "ntrial": 0, "kmean": [0, 4, 6, 7], "trial": 0, "first": [0, 4, 5], "oversamplingfactor": 0, "being": [0, 5, 6, 7], "chosen": 0, "nround": 0, "l": 0, "round": 0, "kmeans_init_result": 0, "centroid": [0, 4], "lloyddens": 0, "termin": 0, "gamma": [0, 7], "categor": [0, 5], "distancetyp": 0, "assignflag": 0, "assign": 0, "param": 0, "inputcentroid": 0, "kmeans_result": 0, "objectivefunct": 0, "dbscan": [0, 7], "epsilon": 0, "radiu": 0, "neighborhood": 0, "minobserv": 0, "core": [0, 4], "blockindex": 0, "uniqu": 0, "identifi": 0, "block": [0, 4], "pass": [0, 4, 5, 7], "local": 0, "nblock": 0, "leftblock": 0, "lesser": 0, "rightblock": 0, "dbscan_result": 0, "coreindic": 0, "coreobserv": 0, "multivariate_outlier_detect": 0, "locat": 0, "scatter": 0, "measur": 0, "spread": 0, "defin": 0, "region": 0, "multivariate_outlier_detection_result": 0, "univariate_outlier_detect": 0, "standard": [0, 4, 6], "deviat": 0, "univariate_outlier_detection_result": 0, "bacon_outlier_detect": 0, "initmethod": 0, "One": [0, 4], "tail": 0, "lpha": 0, "chi": 0, "degre": 0, "freedom": 0, "recommend": [0, 4], "tolerancetoconverg": 0, "basic": 0, "subset": [0, 7], "chang": [0, 4, 6], "less": [0, 2, 4], "bacon_outlier_detection_result": 0, "In": [0, 3, 4, 5, 7, 8], "adagrad": [0, 3], "lbfg": [0, 3, 7], "optimization_solver_ms": 0, "numberofterm": 0, "batchindic": 0, "m": [0, 7], "repres": 0, "e": [0, 2, 4, 5, 6, 8], "g": [0, 2, 4, 6, 8], "featureid": 0, "index": [0, 4], "part": 0, "hessian": 0, "proxim": 0, "project": 0, "argument": [0, 2, 4, 5], "optimization_solver_objective_function_result": 0, "setup": 0, "partial": 0, "other": [0, 4, 6, 7, 8], "optimization_solver_mse_result": 0, "alia": 0, "optimization_solver_logistic_loss": 0, "optimization_solver_logistic_loss_result": 0, "optimization_solver_cross_entropy_loss": 0, "differ": [0, 2, 4, 5], "optimization_solver_cross_entropy_loss_result": 0, "optimization_solver_sgd": 0, "optimization_solver_sum_of_functions_batch__iface__": 0, "32": [0, 4], "learningratesequ": 0, "sequenc": 0, "achiev": 0, "optionalresultrequir": 0, "batchsiz": 0, "perform": [0, 1, 5], "ignor": 0, "conservativesequ": 0, "conserv": 0, "innerniter": 0, "inputargu": 0, "start": 0, "optimization_solver_sgd_result": 0, "optimization_solver_lbfg": 0, "correct": 0, "pair": 0, "approxim": 0, "invers": 0, "curvatur": 0, "correctionpairbatchs": 0, "sub": 0, "correctionpairbatchindic": 0, "steplengthsequ": 0, "optimization_solver_lbfgs_result": 0, "optimization_solver_adagrad": 0, "root": 0, "optimization_solver_adagrad_result": 0, "saga": 0, "proce": 0, "logistc_loss": 0, "optimization_solver_saga": 0, "gradientst": 0, "accumul": 0, "correspond": [0, 5], "": [0, 1, 2, 7, 8], "optimization_solver_saga_result": 0, "cosine_dist": 0, "cosine_distance_result": 0, "cosinedist": 0, "correlation_dist": 0, "correlation_distance_result": 0, "correlationdist": 0, "em_gmm_init": 0, "gmm": 0, "short": 0, "run": [0, 4, 6, 7], "everi": 0, "covariancestorag": 0, "randomli": 0, "em_gmm_init_result": 0, "em_gmm": 0, "regularizationfactor": 0, "ill": 0, "condit": 0, "inputweight": 0, "inputmean": 0, "inputcovari": 0, "list_numerictableptr": 0, "collect": 0, "em_gmm_result": 0, "goalfunct": 0, "qr_result": 0, "matrixq": 0, "matrixr": 0, "pivoted_qr": 0, "permutedcolumn": 0, "On": [0, 4, 7], "entri": 0, "th": 0, "column": [0, 2, 5], "begin": 0, "befor": [0, 5], "fix": [0, 4], "place": 0, "dure": [0, 7], "free": 0, "mai": 0, "interchang": 0, "pivoted_qr_result": 0, "permutationmatrix": 0, "normalization_zscor": 0, "boolean": 0, "both": [0, 4], "center": 0, "otherwis": [0, 2], "normalization_zscore_result": 0, "normalizeddata": 0, "normalization_minmax": 0, "lowerbound": 0, "lower": 0, "obtain": [0, 8], "upperbound": 0, "normalization_minmax_result": 0, "engines_result": 0, "randomnumb": 0, "engines_mt19937": 0, "seed": 0, "tabletofil": 0, "fill": 0, "engines_mt19937_result": 0, "engines_mt2203": 0, "engines_mt2203_result": 0, "engines_mcg59": 0, "engines_mcg59_result": 0, "distributions_bernoulli": 0, "success": 0, "distributions_result": 0, "distributions_bernoulli_result": 0, "distributions_norm": 0, "sigma": 0, "distributions_normal_result": 0, "distributions_uniform": 0, "left": 0, "b": 0, "right": 0, "distributions_uniform_result": 0, "association_rul": 0, "apriori": 0, "minsupport": 0, "minconfid": 0, "confid": 0, "nuniqueitem": 0, "item": 0, "ntransact": 0, "transact": 0, "discoverrul": 0, "built": [0, 1], "larg": [0, 4, 8], "itemset": 0, "itemsetsord": 0, "rulesord": 0, "minitemsets": 0, "maxitemsets": 0, "boundari": 0, "association_rules_result": 0, "antecedentitemset": 0, "consequentitemset": 0, "largeitemset": 0, "largeitemsetssupport": 0, "cholesky_result": 0, "choleskyfactor": 0, "outputmatrixtyp": 0, "covariance_result": 0, "implicit_als_train": 0, "nfactor": 0, "preferencethreshold": 0, "prefer": 0, "inputmodel": 0, "implicit_als_modelptr": 0, "implicit_als_training_result": 0, "implicit_als_model": 0, "itemsfactor": 0, "usersfactor": 0, "implicit_als_prediction_r": 0, "implicit_als_prediction_ratings_result": 0, "low_order_mo": [0, 6], "estimatestocomput": 0, "low_order_moments_result": 0, "secondorderrawmo": 0, "standarddevi": 0, "sumsquar": 0, "sumsquarescent": 0, "variat": 0, "quantileord": 0, "median": 0, "quantiles_result": 0, "leftsingularmatrix": 0, "rightsingularmatrix": 0, "svd_result": 0, "singularvalu": 0, "sorting_result": 0, "sorteddata": 0, "gettreest": 0, "n_class": 0, "function": [1, 2, 3, 4, 5, 6, 7, 8], "about": 1, "design": 1, "scientist": 1, "framework": [1, 3], "api": [1, 5], "gpu": 1, "support": [1, 3, 5, 7], "get": [1, 6, 7], "overview": 1, "panda": [1, 4], "datafram": [1, 4, 6, 8], "scipi": [1, 4], "spars": [1, 7], "csr": 1, "matrix": [1, 3], "csv": [1, 4, 6], "file": [1, 4, 6, 8], "model": [1, 3, 4], "builder": 1, "introduct": 1, "convers": [1, 3], "classif": [1, 3, 7], "regress": [1, 3, 4, 6, 7, 8], "infer": [1, 4], "shap": 1, "valu": [1, 3, 7], "limit": [1, 3, 7], "articl": 1, "blog": 1, "post": 1, "algorithm": [1, 2, 3, 4, 5, 7], "princip": [1, 3], "compon": [1, 3], "analysi": [1, 3], "pca": [1, 3, 6, 7], "k": [1, 3, 4, 6], "mean": [1, 3, 4, 6, 7], "cluster": [1, 3, 4, 6, 7], "densiti": 1, "base": [1, 5], "spatial": 1, "applic": [1, 7], "nois": 1, "outlier": [1, 3], "detect": [1, 3], "optim": [1, 2, 3, 7], "solver": [1, 3, 4, 7], "distanc": [1, 3], "expect": [1, 6], "maxim": 1, "em": 1, "qr": [1, 6, 8], "decomposit": [1, 3, 6, 7], "normal": [1, 7], "random": 1, "number": [1, 4, 5, 6], "engin": [1, 6], "distribut": [1, 4, 7], "associ": [1, 4], "rule": 1, "choleski": 1, "correl": [1, 3, 6, 7], "varianc": [1, 3, 6], "covari": [1, 3, 6, 8], "matric": [1, 2, 3, 6], "implicit": 1, "altern": 1, "least": [1, 4], "squar": [1, 3], "al": 1, "moment": [1, 3, 6, 8], "low": [1, 3, 6, 8], "order": [1, 3, 6, 8], "quantil": 1, "singular": [1, 3], "svd": [1, 3, 4, 6, 8], "sort": 1, "tree": [1, 3, 5, 7], "It": [1, 2, 4, 7], "easi": [1, 8], "notic": 1, "oned": [1, 4, 5], "verbos": 1, "constructor": 2, "automat": 2, "overhead": 2, "most": [2, 5], "notabl": 2, "without": [2, 4, 7], "copi": 2, "directli": [2, 4], "handl": [2, 4], "homogen": 2, "simpl": 2, "dtype": 2, "heterogen": 2, "structur": 2, "well": 2, "contigu": [2, 4], "accept": [2, 4, 8], "No": [2, 7], "extra": 2, "full": [2, 4, 7], "csr_matrix": 2, "configur": [2, 4, 8], "path": 2, "explicitli": 2, "specifi": [2, 7], "method": [2, 3, 4, 5, 6], "effici": [2, 4, 5, 7], "addition": [2, 4], "filenam": 2, "daal": [2, 4], "fast": 2, "reader": 2, "creat": [2, 4, 5, 7], "below": [3, 4, 7], "how": 3, "util": [3, 4], "variou": 3, "style": [3, 6], "build": [3, 4], "gradient": 3, "boost": 3, "xgboost": [3, 5], "lightgbm": [3, 5], "catboost": [3, 5], "transform": [3, 7], "decis": [3, 5], "forest": 3, "nearest": 3, "neighbor": [3, 7], "knn": 3, "multinomi": [3, 6, 8], "naiv": [3, 6, 8], "bay": [3, 6, 8], "vector": 3, "machin": [3, 5], "svm": [3, 7], "muticlass": 3, "logist": 3, "linear": [3, 4, 6, 8], "ridg": [3, 6, 7, 8], "multivari": 3, "univari": 3, "error": 3, "mse": [3, 7], "loss": 3, "stochast": 3, "descent": 3, "memori": [3, 4, 8], "broyden": 3, "fletcher": 3, "goldfarb": 3, "shanno": 3, "adapt": 3, "subgradi": 3, "cosin": [3, 7], "your": [4, 5, 6, 8], "python": [4, 5, 6, 7], "lightn": 4, "highli": 4, "which": [4, 6, 7, 8], "easili": 4, "out": [4, 7], "workstat": [4, 6], "deliv": [4, 5], "give": 4, "easiest": 4, "wai": [4, 8], "power": [4, 7], "high": 4, "product": 4, "manner": 4, "simplifi": 4, "level": 4, "abstract": 4, "user": 4, "boilerpl": 4, "quick": 4, "write": 4, "maintain": 4, "code": [4, 6, 7], "jupyt": 4, "notebook": 4, "capabl": 4, "abil": 4, "Its": 4, "flexibl": 4, "mechan": [4, 6], "amount": 4, "ha": [4, 5, 7], "been": [4, 7], "fashion": 4, "under": [4, 6], "perspect": 4, "export": [4, 7], "serial": 4, "desir": 4, "primit": 4, "custom": 4, "behavior": 4, "itself": [4, 7], "loadout": 4, "footprint": 4, "necessari": [4, 6], "As": 4, "would": 4, "scienc": 4, "context": 4, "workflow": 4, "showcas": 4, "d4p": [4, 5], "test": [4, 7], "target": [4, 7], "d4p_lm": 4, "lm_train": 4, "lm_predictor_compon": 4, "abov": 4, "seen": 4, "divid": 4, "grid": 4, "search": 4, "modifi": 4, "direct": 4, "better": 4, "integr": 4, "stack": 4, "construct": [4, 6, 8], "rich": 4, "assum": [4, 6], "we": [4, 6], "want": 4, "initi": [4, 6], "plusplu": 4, "kmi": [4, 6], "plusplusdens": [4, 6], "have": [4, 6], "our": 4, "now": [4, 6], "call": [4, 6, 7, 8], "hold": 4, "attribut": [4, 5], "print": [4, 7], "could": [4, 6], "look": [4, 6], "like": [4, 6], "even": 4, "simpli": [4, 8], "ad": [4, 7], "final": [4, 6, 8], "network": 4, "keyword": [4, 5], "daalinit": [4, 6], "daalfini": [4, 6], "my_fil": 4, "algo": [4, 8], "stream_or_filelist": 4, "sever": [4, 6], "technologi": 4, "jinja": 4, "templat": 4, "cython": 4, "wrap": 4, "header": 4, "bridg": 4, "layer": 4, "quicker": 4, "develop": 4, "cycl": 4, "act": 4, "refer": 4, "those": [4, 5, 7], "tailor": 4, "good": 4, "pickl": 4, "besid": [4, 8], "superior": 4, "close": 4, "nativ": [4, 5, 7], "excel": 4, "strong": 4, "weak": 4, "nice": 4, "orang": 4, "address": 4, "time": 4, "grow": 4, "yellow": 4, "longer": 4, "fit": [4, 5, 7], "1280": 4, "15": 4, "tb": 4, "18": 4, "second": 4, "68": 4, "66": 4, "gb": 4, "48": 4, "millisecond": 4, "12": 4, "107": 4, "4": [4, 6], "35": 4, "76": 4, "8": 4, "xeon": 4, "gold": 4, "6148": 4, "cpu": [4, 7], "40ghz": 4, "eist": 4, "turbo": 4, "socket": 4, "20": 4, "192": 4, "ram": 4, "16": 4, "connect": 4, "infiniband": 4, "oracl": 4, "linux": [4, 7], "server": 4, "releas": [4, 7], "7": 4, "anaconda": 4, "cloud": 4, "conda": 4, "forg": 4, "channel": 4, "sourc": 4, "instruct": 4, "repositori": 4, "via": 4, "same": [4, 5, 6, 7], "platform": 4, "http": 4, "github": 4, "io": 4, "latest": [4, 7], "system": 4, "html": 4, "_": 4, "instal": 4, "pypi": 4, "pip": 4, "\u0441onda": 4, "you": [4, 5, 7, 8], "instanti": 4, "parameter": 4, "list": 4, "optarg": 4, "77": 4, "object": 4, "extract": 4, "name": 4, "content": 4, "what": 4, "expos": 4, "furthermor": 4, "monkei": [4, 7], "sklearn": [4, 5, 7], "drop": [4, 5], "pleas": [4, 7], "section": 4, "more": 4, "detail": 4, "accur": 5, "popular": 5, "tune": 5, "architectur": 5, "experiment": 5, "convert": 5, "alreadi": 5, "d4p_model": 5, "mb": 5, "convert_model": 5, "xgb_model": 5, "lgb_model": 5, "cb_model": 5, "onc": [5, 8], "origin": [5, 7], "d4p_predict": 5, "either": 5, "output": [5, 7], "test_data": 5, "here": [5, 8], "made": 5, "interact": 5, "take": 5, "pred_contrib": 5, "pred_interact": 5, "shape": 5, "n_row": 5, "n_featur": 5, "row": 5, "includ": [5, 7], "compris": 5, "combin": 5, "along": 5, "consist": 5, "contrast": 5, "fewer": 5, "gbtdaalclassifi": 5, "gbtdaalregressor": 5, "ensembl": [5, 7], "reg": 5, "xgb": 5, "xgbregressor": 5, "y": [5, 7], "d4p_predt": 5, "extend": 5, "therefor": 5, "follow": [5, 6, 7, 8], "multioutput": 5, "improv": 5, "oper": [6, 8], "program": [6, 7], "multipl": [6, 8], "execut": [6, 7], "similar": 6, "mpi": 6, "commun": 6, "synchron": 6, "happen": 6, "hood": 6, "mpi4pi": 6, "though": 6, "veri": 6, "add": 6, "tell": 6, "should": [6, 7], "usual": 6, "done": [6, 8], "condition": 6, "id": 6, "rank": 6, "my_procid": 6, "prefix": 6, "suffix": 6, "That": 6, "To": [6, 7], "mpirun": 6, "py": [6, 7], "compil": 6, "interfac": 7, "etc": 7, "nearli": 7, "dynam": 7, "underli": 7, "while": 7, "solut": 7, "faster": 7, "edit": 7, "commandlin": 7, "my_appl": 7, "through": 7, "environ": 7, "use_daal4py_sklearn": 7, "ye": 7, "shown": 7, "mac": 7, "o": [7, 8], "window": 7, "programmat": 7, "patch_sklearn": 7, "undo": 7, "unpatch_sklearn": 7, "impact": 7, "exist": 7, "task": 7, "svc": 7, "except": 7, "poli": 7, "sigmoid": 7, "randomforestclassifi": 7, "warm_start": 7, "cpp_alpha": 7, "gini": 7, "oob_scor": 7, "bag": 7, "score": 7, "kneighborsclassifi": 7, "metric": 7, "euclidean": 7, "minkowski": 7, "logisticregress": 7, "cg": 7, "class_weight": 7, "sample_weight": 7, "randomforestregressor": 7, "kneighborsregressor": 7, "linearregress": 7, "auto": 7, "elasticnet": 7, "precompute_dist": 7, "dimension": 7, "svd_solver": 7, "unsupervis": 7, "nearestneighbor": 7, "train_test_split": 7, "assert_all_finit": 7, "pairwise_dist": 7, "With": 7, "roc_auc_scor": 7, "averag": 7, "max_fpr": 7, "multi_class": 7, "own": 7, "suit": 7, "few": 7, "deselected_test": 7, "yaml": 7, "particular": 7, "check_estim": 7, "discov": 7, "introspect": 7, "assur": 7, "four": 7, "2021": 7, "21": 7, "22": 7, "23": 7, "24": 7, "idp_sklearn_verbos": 7, "info": 7, "receiv": 7, "statement": 7, "These": 7, "fallback": 7, "decisiontreeclassifi": 7, "adaboostclassifi": 7, "linear_model": 7, "logistic_regression_path": 7, "model_select": 7, "_daal_train_test_split": 7, "_daal_roc_auc_scor": 7, "alwai": 7, "digit": 7, "load_digit": 7, "clf_d": 7, "rbf": 7, "clf_v": 7, "9905397885364496": 7, "quantiti": 8, "might": 8, "imposs": 8, "becaus": 8, "resid": 8, "merg": 8, "costli": 8, "feasibl": 8, "too": 8, "load": 8, "complet": 8, "Or": 8, "come": 8, "certain": 8, "interleav": 8, "repeat": 8, "chunk": 8, "f": 8, "input_fil": 8, "rather": 8, "simul": 8, "read": 8}, "objects": {"daal4py": [[0, 0, 1, "", "adaboost_model"], [0, 0, 1, "", "adaboost_prediction"], [0, 0, 1, "", "adaboost_training"], [0, 0, 1, "", "adaboost_training_result"], [0, 0, 1, "", "association_rules"], [0, 0, 1, "", "association_rules_result"], [0, 0, 1, "", "bacon_outlier_detection"], [0, 0, 1, "", "bacon_outlier_detection_result"], [0, 0, 1, "", "bf_knn_classification_model"], [0, 0, 1, "", "bf_knn_classification_prediction"], [0, 0, 1, "", "bf_knn_classification_training"], [0, 0, 1, "", "bf_knn_classification_training_result"], [0, 0, 1, "", "brownboost_model"], [0, 0, 1, "", "brownboost_prediction"], [0, 0, 1, "", "brownboost_training"], [0, 0, 1, "", "brownboost_training_result"], [0, 0, 1, "", "cholesky"], [0, 0, 1, "", "cholesky_result"], [0, 0, 1, "id40", "classifier_prediction_result"], [0, 0, 1, "", "correlation_distance"], [0, 0, 1, "", "correlation_distance_result"], [0, 0, 1, "", "cosine_distance"], [0, 0, 1, "", "cosine_distance_result"], [0, 0, 1, "", "covariance"], [0, 0, 1, "", "covariance_result"], [0, 0, 1, "", "dbscan"], [0, 0, 1, "", "dbscan_result"], [0, 0, 1, "", "decision_forest_classification_model"], [0, 0, 1, "", "decision_forest_classification_prediction"], [0, 0, 1, "", "decision_forest_classification_training"], [0, 0, 1, "", "decision_forest_classification_training_result"], [0, 0, 1, "", "decision_forest_regression_model"], [0, 0, 1, "", "decision_forest_regression_prediction"], [0, 0, 1, "", "decision_forest_regression_prediction_result"], [0, 0, 1, "", "decision_forest_regression_training"], [0, 0, 1, "", "decision_forest_regression_training_result"], [0, 0, 1, "", "decision_tree_classification_model"], [0, 0, 1, "", "decision_tree_classification_prediction"], [0, 0, 1, "", "decision_tree_classification_training"], [0, 0, 1, "", "decision_tree_classification_training_result"], [0, 0, 1, "", "decision_tree_regression_model"], [0, 0, 1, "", "decision_tree_regression_prediction"], [0, 0, 1, "", "decision_tree_regression_prediction_result"], [0, 0, 1, "", "decision_tree_regression_training"], [0, 0, 1, "", "decision_tree_regression_training_result"], [0, 0, 1, "", "distributions_bernoulli"], [0, 1, 1, "", "distributions_bernoulli_result"], [0, 0, 1, "", "distributions_normal"], [0, 1, 1, "", "distributions_normal_result"], [0, 0, 1, "", "distributions_uniform"], [0, 1, 1, "", "distributions_uniform_result"], [0, 0, 1, "", "em_gmm"], [0, 0, 1, "", "em_gmm_init"], [0, 0, 1, "", "em_gmm_init_result"], [0, 0, 1, "", "em_gmm_result"], [0, 0, 1, "", "engines_mcg59"], [0, 1, 1, "", "engines_mcg59_result"], [0, 0, 1, "", "engines_mt19937"], [0, 1, 1, "", "engines_mt19937_result"], [0, 0, 1, "", "engines_mt2203"], [0, 1, 1, "", "engines_mt2203_result"], [0, 0, 1, "", "engines_result"], [0, 0, 1, "", "gbt_classification_model"], [0, 0, 1, "", "gbt_classification_prediction"], [0, 0, 1, "", "gbt_classification_training"], [0, 0, 1, "", "gbt_classification_training_result"], [0, 0, 1, "", "gbt_regression_model"], [0, 0, 1, "", "gbt_regression_prediction"], [0, 0, 1, "", "gbt_regression_prediction_result"], [0, 0, 1, "", "gbt_regression_training"], [0, 0, 1, "", "gbt_regression_training_result"], [0, 3, 1, "", "getTreeState"], [0, 0, 1, "", "implicit_als_model"], [0, 0, 1, "", "implicit_als_prediction_ratings"], [0, 0, 1, "", "implicit_als_prediction_ratings_result"], [0, 0, 1, "", "implicit_als_training"], [0, 0, 1, "", "implicit_als_training_result"], [0, 0, 1, "", "kdtree_knn_classification_model"], [0, 0, 1, "", "kdtree_knn_classification_prediction"], [0, 0, 1, "", "kdtree_knn_classification_training"], [0, 0, 1, "", "kdtree_knn_classification_training_result"], [0, 0, 1, "", "kmeans"], [0, 0, 1, "", "kmeans_init"], [0, 0, 1, "", "kmeans_init_result"], [0, 0, 1, "", "kmeans_result"], [0, 0, 1, "", "lasso_regression_model"], [0, 0, 1, "", "lasso_regression_prediction"], [0, 0, 1, "", "lasso_regression_prediction_result"], [0, 0, 1, "", "lasso_regression_training"], [0, 0, 1, "", "lasso_regression_training_result"], [0, 0, 1, "", "linear_regression_model"], [0, 0, 1, "", "linear_regression_prediction"], [0, 0, 1, "", "linear_regression_prediction_result"], [0, 0, 1, "", "linear_regression_training"], [0, 0, 1, "", "linear_regression_training_result"], [0, 0, 1, "", "logistic_regression_model"], [0, 0, 1, "", "logistic_regression_prediction"], [0, 0, 1, "", "logistic_regression_training"], [0, 0, 1, "", "logistic_regression_training_result"], [0, 0, 1, "", "logitboost_model"], [0, 0, 1, "", "logitboost_prediction"], [0, 0, 1, "", "logitboost_training"], [0, 0, 1, "", "logitboost_training_result"], [0, 0, 1, "", "low_order_moments"], [0, 0, 1, "", "low_order_moments_result"], [0, 0, 1, "", "multinomial_naive_bayes_model"], [0, 0, 1, "", "multinomial_naive_bayes_prediction"], [0, 0, 1, "", "multinomial_naive_bayes_training"], [0, 0, 1, "", "multinomial_naive_bayes_training_result"], [0, 0, 1, "", "multivariate_outlier_detection"], [0, 0, 1, "", "multivariate_outlier_detection_result"], [0, 0, 1, "", "normalization_minmax"], [0, 0, 1, "", "normalization_minmax_result"], [0, 0, 1, "", "normalization_zscore"], [0, 0, 1, "", "normalization_zscore_result"], [0, 0, 1, "", "optimization_solver_adagrad"], [0, 0, 1, "", "optimization_solver_adagrad_result"], [0, 0, 1, "", "optimization_solver_cross_entropy_loss"], [0, 1, 1, "", "optimization_solver_cross_entropy_loss_result"], [0, 0, 1, "", "optimization_solver_lbfgs"], [0, 0, 1, "", "optimization_solver_lbfgs_result"], [0, 0, 1, "", "optimization_solver_logistic_loss"], [0, 1, 1, "", "optimization_solver_logistic_loss_result"], [0, 0, 1, "", "optimization_solver_mse"], [0, 1, 1, "", "optimization_solver_mse_result"], [0, 0, 1, "", "optimization_solver_saga"], [0, 0, 1, "", "optimization_solver_saga_result"], [0, 0, 1, "", "optimization_solver_sgd"], [0, 0, 1, "", "optimization_solver_sgd_result"], [0, 0, 1, "", "pca"], [0, 0, 1, "", "pca_result"], [0, 0, 1, "", "pca_transform"], [0, 0, 1, "", "pca_transform_result"], [0, 0, 1, "", "pivoted_qr"], [0, 0, 1, "", "pivoted_qr_result"], [0, 0, 1, "", "qr"], [0, 0, 1, "", "qr_result"], [0, 0, 1, "", "quantiles"], [0, 0, 1, "", "quantiles_result"], [0, 0, 1, "", "ridge_regression_model"], [0, 0, 1, "", "ridge_regression_prediction"], [0, 0, 1, "", "ridge_regression_prediction_result"], [0, 0, 1, "", "ridge_regression_training"], [0, 0, 1, "", "ridge_regression_training_result"], [0, 0, 1, "", "sorting"], [0, 0, 1, "", "sorting_result"], [0, 0, 1, "", "stump_classification_model"], [0, 0, 1, "", "stump_classification_prediction"], [0, 0, 1, "", "stump_classification_training"], [0, 0, 1, "", "stump_classification_training_result"], [0, 0, 1, "", "stump_regression_model"], [0, 0, 1, "", "stump_regression_prediction"], [0, 0, 1, "", "stump_regression_prediction_result"], [0, 0, 1, "", "stump_regression_training"], [0, 0, 1, "", "stump_regression_training_result"], [0, 0, 1, "", "svd"], [0, 0, 1, "", "svd_result"], [0, 0, 1, "", "svm_model"], [0, 0, 1, "", "svm_prediction"], [0, 0, 1, "", "svm_training"], [0, 0, 1, "", "svm_training_result"], [0, 0, 1, "", "univariate_outlier_detection"], [0, 0, 1, "", "univariate_outlier_detection_result"]], "daal4py.adaboost_model": [[0, 1, 1, "", "Alpha"], [0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "NumberOfWeakLearners"], [0, 2, 1, "", "WeakLearnerModel"]], "daal4py.adaboost_prediction": [[0, 2, 1, "", "compute"]], "daal4py.adaboost_training": [[0, 2, 1, "", "compute"]], "daal4py.adaboost_training_result": [[0, 1, 1, "", "model"], [0, 1, 1, "", "weakLearnersErrors"]], "daal4py.association_rules": [[0, 2, 1, "", "compute"]], "daal4py.association_rules_result": [[0, 1, 1, "", "antecedentItemsets"], [0, 1, 1, "", "confidence"], [0, 1, 1, "", "consequentItemsets"], [0, 1, 1, "", "largeItemsets"], [0, 1, 1, "", "largeItemsetsSupport"]], "daal4py.bacon_outlier_detection": [[0, 2, 1, "", "compute"]], "daal4py.bacon_outlier_detection_result": [[0, 1, 1, "", "weights"]], "daal4py.bf_knn_classification_model": [[0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfFeatures"]], "daal4py.bf_knn_classification_prediction": [[0, 2, 1, "", "compute"]], "daal4py.bf_knn_classification_training": [[0, 2, 1, "", "compute"]], "daal4py.bf_knn_classification_training_result": [[0, 1, 1, "", "model"]], "daal4py.brownboost_model": [[0, 1, 1, "", "Alpha"], [0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "NumberOfWeakLearners"], [0, 2, 1, "", "WeakLearnerModel"]], "daal4py.brownboost_prediction": [[0, 2, 1, "", "compute"]], "daal4py.brownboost_training": [[0, 2, 1, "", "compute"]], "daal4py.brownboost_training_result": [[0, 1, 1, "", "model"]], "daal4py.cholesky": [[0, 2, 1, "", "compute"]], "daal4py.cholesky_result": [[0, 1, 1, "", "choleskyFactor"]], "daal4py.classifier_prediction_result": [[0, 1, 1, "id41", "logProbabilities"], [0, 1, 1, "id42", "prediction"], [0, 1, 1, "id43", "probabilities"]], "daal4py.correlation_distance": [[0, 2, 1, "", "compute"]], "daal4py.correlation_distance_result": [[0, 1, 1, "", "correlationDistance"]], "daal4py.cosine_distance": [[0, 2, 1, "", "compute"]], "daal4py.cosine_distance_result": [[0, 1, 1, "", "cosineDistance"]], "daal4py.covariance": [[0, 2, 1, "", "compute"]], "daal4py.covariance_result": [[0, 1, 1, "", "correlation"], [0, 1, 1, "", "covariance"], [0, 1, 1, "", "mean"]], "daal4py.dbscan": [[0, 2, 1, "", "compute"]], "daal4py.dbscan_result": [[0, 1, 1, "", "assignments"], [0, 1, 1, "", "coreIndices"], [0, 1, 1, "", "coreObservations"], [0, 1, 1, "", "nClusters"]], "daal4py.decision_forest_classification_model": [[0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfClasses"], [0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "NumberOfTrees"]], "daal4py.decision_forest_classification_prediction": [[0, 2, 1, "", "compute"]], "daal4py.decision_forest_classification_training": [[0, 2, 1, "", "compute"]], "daal4py.decision_forest_classification_training_result": [[0, 1, 1, "", "model"], [0, 1, 1, "", "outOfBagError"], [0, 1, 1, "", "outOfBagErrorAccuracy"], [0, 1, 1, "", "outOfBagErrorDecisionFunction"], [0, 1, 1, "", "outOfBagErrorPerObservation"], [0, 1, 1, "", "variableImportance"]], "daal4py.decision_forest_regression_model": [[0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "NumberOfTrees"]], "daal4py.decision_forest_regression_prediction": [[0, 2, 1, "", "compute"]], "daal4py.decision_forest_regression_prediction_result": [[0, 1, 1, "", "prediction"]], "daal4py.decision_forest_regression_training": [[0, 2, 1, "", "compute"]], "daal4py.decision_forest_regression_training_result": [[0, 1, 1, "", "model"], [0, 1, 1, "", "outOfBagError"], [0, 1, 1, "", "outOfBagErrorPerObservation"], [0, 1, 1, "", "outOfBagErrorPrediction"], [0, 1, 1, "", "outOfBagErrorR2"], [0, 1, 1, "", "variableImportance"]], "daal4py.decision_tree_classification_model": [[0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfFeatures"]], "daal4py.decision_tree_classification_prediction": [[0, 2, 1, "", "compute"]], "daal4py.decision_tree_classification_training": [[0, 2, 1, "", "compute"]], "daal4py.decision_tree_classification_training_result": [[0, 1, 1, "", "model"]], "daal4py.decision_tree_regression_model": [[0, 1, 1, "", "NumberOfFeatures"]], "daal4py.decision_tree_regression_prediction": [[0, 2, 1, "", "compute"]], "daal4py.decision_tree_regression_prediction_result": [[0, 1, 1, "", "prediction"]], "daal4py.decision_tree_regression_training": [[0, 2, 1, "", "compute"]], "daal4py.decision_tree_regression_training_result": [[0, 1, 1, "", "model"]], "daal4py.distributions_bernoulli": [[0, 2, 1, "", "compute"]], "daal4py.distributions_normal": [[0, 2, 1, "", "compute"]], "daal4py.distributions_uniform": [[0, 2, 1, "", "compute"]], "daal4py.em_gmm": [[0, 2, 1, "", "compute"]], "daal4py.em_gmm_init": [[0, 2, 1, "", "compute"]], "daal4py.em_gmm_init_result": [[0, 1, 1, "", "covariances"], [0, 1, 1, "", "means"], [0, 1, 1, "", "weights"]], "daal4py.em_gmm_result": [[0, 1, 1, "", "covariances"], [0, 1, 1, "", "goalFunction"], [0, 1, 1, "", "means"], [0, 1, 1, "", "nIterations"], [0, 1, 1, "", "weights"]], "daal4py.engines_mcg59": [[0, 2, 1, "", "compute"]], "daal4py.engines_mt19937": [[0, 2, 1, "", "compute"]], "daal4py.engines_mt2203": [[0, 2, 1, "", "compute"]], "daal4py.engines_result": [[0, 1, 1, "", "randomNumbers"]], "daal4py.gbt_classification_model": [[0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "NumberOfTrees"], [0, 1, 1, "", "PredictionBias"]], "daal4py.gbt_classification_prediction": [[0, 2, 1, "", "compute"]], "daal4py.gbt_classification_training": [[0, 2, 1, "", "compute"]], "daal4py.gbt_classification_training_result": [[0, 1, 1, "", "model"], [0, 1, 1, "", "variableImportanceByCover"], [0, 1, 1, "", "variableImportanceByGain"], [0, 1, 1, "", "variableImportanceByTotalCover"], [0, 1, 1, "", "variableImportanceByTotalGain"], [0, 1, 1, "", "variableImportanceByWeight"]], "daal4py.gbt_regression_model": [[0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "NumberOfTrees"], [0, 1, 1, "", "PredictionBias"]], "daal4py.gbt_regression_prediction": [[0, 2, 1, "", "compute"]], "daal4py.gbt_regression_prediction_result": [[0, 1, 1, "", "prediction"]], "daal4py.gbt_regression_training": [[0, 2, 1, "", "compute"]], "daal4py.gbt_regression_training_result": [[0, 1, 1, "", "model"], [0, 1, 1, "", "variableImportanceByCover"], [0, 1, 1, "", "variableImportanceByGain"], [0, 1, 1, "", "variableImportanceByTotalCover"], [0, 1, 1, "", "variableImportanceByTotalGain"], [0, 1, 1, "", "variableImportanceByWeight"]], "daal4py.implicit_als_model": [[0, 1, 1, "", "ItemsFactors"], [0, 1, 1, "", "UsersFactors"]], "daal4py.implicit_als_prediction_ratings": [[0, 2, 1, "", "compute"]], "daal4py.implicit_als_prediction_ratings_result": [[0, 1, 1, "", "prediction"]], "daal4py.implicit_als_training": [[0, 2, 1, "", "compute"]], "daal4py.implicit_als_training_result": [[0, 1, 1, "", "model"]], "daal4py.kdtree_knn_classification_model": [[0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfFeatures"]], "daal4py.kdtree_knn_classification_prediction": [[0, 2, 1, "", "compute"]], "daal4py.kdtree_knn_classification_training": [[0, 2, 1, "", "compute"]], "daal4py.kdtree_knn_classification_training_result": [[0, 1, 1, "", "model"]], "daal4py.kmeans": [[0, 2, 1, "", "compute"]], "daal4py.kmeans_init": [[0, 2, 1, "", "compute"]], "daal4py.kmeans_init_result": [[0, 1, 1, "", "centroids"]], "daal4py.kmeans_result": [[0, 1, 1, "", "assignments"], [0, 1, 1, "", "centroids"], [0, 1, 1, "", "nIterations"], [0, 1, 1, "", "objectiveFunction"]], "daal4py.lasso_regression_model": [[0, 1, 1, "", "Beta"], [0, 1, 1, "", "InterceptFlag"], [0, 1, 1, "", "NumberOfBetas"], [0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "NumberOfResponses"]], "daal4py.lasso_regression_prediction": [[0, 2, 1, "", "compute"]], "daal4py.lasso_regression_prediction_result": [[0, 1, 1, "", "prediction"]], "daal4py.lasso_regression_training": [[0, 2, 1, "", "compute"]], "daal4py.lasso_regression_training_result": [[0, 1, 1, "", "gramMatrixId"], [0, 1, 1, "", "model"]], "daal4py.linear_regression_model": [[0, 1, 1, "", "Beta"], [0, 1, 1, "", "InterceptFlag"], [0, 1, 1, "", "NumberOfBetas"], [0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "NumberOfResponses"]], "daal4py.linear_regression_prediction": [[0, 2, 1, "", "compute"]], "daal4py.linear_regression_prediction_result": [[0, 1, 1, "", "prediction"]], "daal4py.linear_regression_training": [[0, 2, 1, "", "compute"]], "daal4py.linear_regression_training_result": [[0, 1, 1, "", "model"]], "daal4py.logistic_regression_model": [[0, 1, 1, "", "Beta"], [0, 1, 1, "", "InterceptFlag"], [0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfBetas"], [0, 1, 1, "", "NumberOfFeatures"]], "daal4py.logistic_regression_prediction": [[0, 2, 1, "", "compute"]], "daal4py.logistic_regression_training": [[0, 2, 1, "", "compute"]], "daal4py.logistic_regression_training_result": [[0, 1, 1, "", "model"]], "daal4py.logitboost_model": [[0, 1, 1, "", "Iterations"], [0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "NumberOfWeakLearners"], [0, 2, 1, "", "WeakLearnerModel"]], "daal4py.logitboost_prediction": [[0, 2, 1, "", "compute"]], "daal4py.logitboost_training": [[0, 2, 1, "", "compute"]], "daal4py.logitboost_training_result": [[0, 1, 1, "", "model"]], "daal4py.low_order_moments": [[0, 2, 1, "", "compute"]], "daal4py.low_order_moments_result": [[0, 1, 1, "", "maximum"], [0, 1, 1, "", "mean"], [0, 1, 1, "", "minimum"], [0, 1, 1, "", "secondOrderRawMoment"], [0, 1, 1, "", "standardDeviation"], [0, 1, 1, "", "sum"], [0, 1, 1, "", "sumSquares"], [0, 1, 1, "", "sumSquaresCentered"], [0, 1, 1, "", "variance"], [0, 1, 1, "", "variation"]], "daal4py.multinomial_naive_bayes_model": [[0, 1, 1, "", "AuxTable"], [0, 1, 1, "", "LogP"], [0, 1, 1, "", "LogTheta"], [0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfFeatures"]], "daal4py.multinomial_naive_bayes_prediction": [[0, 2, 1, "", "compute"]], "daal4py.multinomial_naive_bayes_training": [[0, 2, 1, "", "compute"]], "daal4py.multinomial_naive_bayes_training_result": [[0, 1, 1, "", "model"]], "daal4py.multivariate_outlier_detection": [[0, 2, 1, "", "compute"]], "daal4py.multivariate_outlier_detection_result": [[0, 1, 1, "", "weights"]], "daal4py.normalization_minmax": [[0, 2, 1, "", "compute"]], "daal4py.normalization_minmax_result": [[0, 1, 1, "", "normalizedData"]], "daal4py.normalization_zscore": [[0, 2, 1, "", "compute"]], "daal4py.normalization_zscore_result": [[0, 1, 1, "", "means"], [0, 1, 1, "", "normalizedData"], [0, 1, 1, "", "variances"]], "daal4py.optimization_solver_adagrad": [[0, 2, 1, "", "compute"]], "daal4py.optimization_solver_adagrad_result": [[0, 1, 1, "", "minimum"], [0, 1, 1, "", "nIterations"]], "daal4py.optimization_solver_cross_entropy_loss": [[0, 2, 1, "", "compute"], [0, 2, 1, "", "setup"]], "daal4py.optimization_solver_lbfgs": [[0, 2, 1, "", "compute"]], "daal4py.optimization_solver_lbfgs_result": [[0, 1, 1, "", "minimum"], [0, 1, 1, "", "nIterations"]], "daal4py.optimization_solver_logistic_loss": [[0, 2, 1, "", "compute"], [0, 2, 1, "", "setup"]], "daal4py.optimization_solver_mse": [[0, 2, 1, "", "compute"], [0, 2, 1, "", "setup"]], "daal4py.optimization_solver_saga": [[0, 2, 1, "", "compute"]], "daal4py.optimization_solver_saga_result": [[0, 1, 1, "", "gradientsTable"], [0, 1, 1, "", "minimum"], [0, 1, 1, "", "nIterations"]], "daal4py.optimization_solver_sgd": [[0, 2, 1, "", "compute"]], "daal4py.optimization_solver_sgd_result": [[0, 1, 1, "", "minimum"], [0, 1, 1, "", "nIterations"]], "daal4py.pca": [[0, 2, 1, "", "compute"]], "daal4py.pca_result": [[0, 1, 1, "", "dataForTransform"], [0, 1, 1, "", "eigenvalues"], [0, 1, 1, "", "eigenvectors"], [0, 1, 1, "", "means"], [0, 1, 1, "", "variances"]], "daal4py.pca_transform": [[0, 2, 1, "", "compute"]], "daal4py.pca_transform_result": [[0, 1, 1, "", "transformedData"]], "daal4py.pivoted_qr": [[0, 2, 1, "", "compute"]], "daal4py.pivoted_qr_result": [[0, 1, 1, "", "matrixQ"], [0, 1, 1, "", "matrixR"], [0, 1, 1, "", "permutationMatrix"]], "daal4py.qr": [[0, 2, 1, "", "compute"]], "daal4py.qr_result": [[0, 1, 1, "", "matrixQ"], [0, 1, 1, "", "matrixR"]], "daal4py.quantiles": [[0, 2, 1, "", "compute"]], "daal4py.quantiles_result": [[0, 1, 1, "", "quantiles"]], "daal4py.ridge_regression_model": [[0, 1, 1, "", "Beta"], [0, 1, 1, "", "InterceptFlag"], [0, 1, 1, "", "NumberOfBetas"], [0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "NumberOfResponses"]], "daal4py.ridge_regression_prediction": [[0, 2, 1, "", "compute"]], "daal4py.ridge_regression_prediction_result": [[0, 1, 1, "", "prediction"]], "daal4py.ridge_regression_training": [[0, 2, 1, "", "compute"]], "daal4py.ridge_regression_training_result": [[0, 1, 1, "", "model"]], "daal4py.sorting": [[0, 2, 1, "", "compute"]], "daal4py.sorting_result": [[0, 1, 1, "", "sortedData"]], "daal4py.stump_classification_model": [[0, 1, 1, "", "LeftValue"], [0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "RightValue"], [0, 1, 1, "", "SplitFeature"], [0, 1, 1, "", "SplitValue"]], "daal4py.stump_classification_prediction": [[0, 2, 1, "", "compute"]], "daal4py.stump_classification_training": [[0, 2, 1, "", "compute"]], "daal4py.stump_classification_training_result": [[0, 1, 1, "", "model"], [0, 1, 1, "", "variableImportance"]], "daal4py.stump_regression_model": [[0, 1, 1, "", "LeftValue"], [0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "RightValue"], [0, 1, 1, "", "SplitFeature"], [0, 1, 1, "", "SplitValue"]], "daal4py.stump_regression_prediction": [[0, 2, 1, "", "compute"]], "daal4py.stump_regression_prediction_result": [[0, 1, 1, "", "prediction"]], "daal4py.stump_regression_training": [[0, 2, 1, "", "compute"]], "daal4py.stump_regression_training_result": [[0, 1, 1, "", "model"], [0, 1, 1, "", "variableImportance"]], "daal4py.svd": [[0, 2, 1, "", "compute"]], "daal4py.svd_result": [[0, 1, 1, "", "leftSingularMatrix"], [0, 1, 1, "", "rightSingularMatrix"], [0, 1, 1, "", "singularValues"]], "daal4py.svm_model": [[0, 1, 1, "", "Bias"], [0, 1, 1, "", "ClassificationCoefficients"], [0, 1, 1, "", "NFeatures"], [0, 1, 1, "", "NumberOfFeatures"], [0, 1, 1, "", "SupportIndices"], [0, 1, 1, "", "SupportVectors"]], "daal4py.svm_prediction": [[0, 2, 1, "", "compute"]], "daal4py.svm_training": [[0, 2, 1, "", "compute"]], "daal4py.svm_training_result": [[0, 1, 1, "", "model"]], "daal4py.univariate_outlier_detection": [[0, 2, 1, "", "compute"]], "daal4py.univariate_outlier_detection_result": [[0, 1, 1, "", "weights"]]}, "objtypes": {"0": "py:class", "1": "py:attribute", "2": "py:method", "3": "py:function"}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "attribute", "Python attribute"], "2": ["py", "method", "Python method"], "3": ["py", "function", "Python function"]}, "titleterms": {"algorithm": [0, 6, 8], "classif": [0, 5], "decis": 0, "forest": 0, "tree": 0, "gradient": [0, 5], "boost": [0, 5], "k": 0, "nearest": 0, "neighbor": 0, "knn": 0, "brute": 0, "forc": 0, "adaboost": 0, "brownboost": 0, "logitboost": 0, "stump": 0, "weak": 0, "learner": 0, "multinomi": 0, "naiv": 0, "bay": 0, "support": [0, 4, 6, 8], "vector": 0, "machin": [0, 4], "svm": 0, "logist": 0, "regress": [0, 5], "linear": 0, "least": 0, "absolut": 0, "shrinkag": 0, "select": 0, "oper": 0, "ridg": 0, "princip": 0, "compon": 0, "analysi": 0, "pca": 0, "transform": 0, "mean": 0, "cluster": 0, "initi": 0, "densiti": 0, "base": 0, "spatial": 0, "applic": 0, "nois": 0, "outlier": 0, "detect": 0, "multivari": 0, "univari": 0, "bacon": 0, "optim": 0, "solver": 0, "object": 0, "function": 0, "squar": 0, "error": 0, "mse": 0, "loss": 0, "cross": 0, "entropi": 0, "iter": 0, "stochast": 0, "descent": 0, "limit": [0, 5], "memori": [0, 6], "broyden": 0, "fletcher": 0, "goldfarb": 0, "shanno": 0, "adapt": 0, "subgradi": 0, "method": 0, "averag": 0, "distanc": 0, "cosin": 0, "matrix": [0, 2], "correl": 0, "expect": 0, "maxim": 0, "em": 0, "gaussian": 0, "mixtur": 0, "model": [0, 5], "qr": 0, "decomposit": 0, "without": 0, "pivot": 0, "normal": 0, "z": 0, "score": 0, "min": 0, "max": 0, "random": 0, "number": 0, "engin": 0, "mt19937": 0, "mt2203": 0, "mcg59": 0, "distribut": [0, 6], "bernoulli": 0, "uniform": 0, "associ": 0, "rule": 0, "choleski": 0, "varianc": 0, "covari": 0, "matric": 0, "implicit": 0, "altern": 0, "al": 0, "moment": 0, "low": 0, "order": 0, "quantil": 0, "singular": 0, "valu": [0, 5], "svd": 0, "sort": 0, "content": 1, "input": 2, "data": [2, 4, 8], "numpi": 2, "arrai": 2, "panda": 2, "datafram": 2, "scipi": 2, "spars": 2, "csr": 2, "csv": 2, "file": 2, "exampl": [3, 5, 6, 8], "gener": 3, "usag": [3, 4], "fast": 4, "scalabl": 4, "easi": [4, 6], "learn": [4, 5, 7], "With": 4, "daal4pi": 4, "design": 4, "scientist": 4, "framework": [4, 5], "api": [4, 7], "oneapi": 4, "gpu": 4, "": [4, 6], "built": 4, "perform": 4, "get": 4, "overview": 4, "scikit": [4, 5, 7], "patch": [4, 7], "builder": 5, "introduct": 5, "convers": 5, "infer": 5, "shap": 5, "calcul": 5, "style": 5, "estim": 5, "articl": 5, "blog": 5, "post": 5, "scale": 6, "multiprocess": 6, "It": 6, "deprec": 7, "notic": 7, "oned": 7, "acceler": 7, "verbos": 7, "stream": 8}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 8, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.todo": 2, "sphinx.ext.viewcode": 1, "sphinx": 57}, "alltitles": {"Algorithms": [[0, "algorithms"]], "Classification": [[0, "classification"]], "Decision Forest Classification": [[0, "decision-forest-classification"]], "Decision Tree Classification": [[0, "decision-tree-classification"]], "Gradient Boosted Classification": [[0, "gradient-boosted-classification"]], "k-Nearest Neighbors (kNN)": [[0, "k-nearest-neighbors-knn"]], "Brute-force k-Nearest Neighbors (kNN)": [[0, "brute-force-k-nearest-neighbors-knn"]], "AdaBoost Classification": [[0, "adaboost-classification"]], "BrownBoost Classification": [[0, "brownboost-classification"]], "LogitBoost Classification": [[0, "logitboost-classification"]], "Stump Weak Learner Classification": [[0, "stump-weak-learner-classification"]], "Multinomial Naive Bayes": [[0, "multinomial-naive-bayes"]], "Support Vector Machine (SVM)": [[0, "support-vector-machine-svm"]], "Logistic Regression": [[0, "logistic-regression"]], "Regression": [[0, "regression"]], "Decision Forest Regression": [[0, "decision-forest-regression"]], "Decision Tree Regression": [[0, "decision-tree-regression"]], "Gradient Boosted Regression": [[0, "gradient-boosted-regression"]], "Linear Regression": [[0, "linear-regression"]], "Least Absolute Shrinkage and Selection Operator": [[0, "least-absolute-shrinkage-and-selection-operator"]], "Ridge Regression": [[0, "ridge-regression"]], "Stump Regression": [[0, "stump-regression"]], "Principal Component Analysis (PCA)": [[0, "principal-component-analysis-pca"]], "Principal Component Analysis (PCA) Transform": [[0, "principal-component-analysis-pca-transform"]], "K-Means Clustering": [[0, "k-means-clustering"]], "K-Means Initialization": [[0, "k-means-initialization"]], "K-Means": [[0, "k-means"]], "Density-Based Spatial Clustering of Applications with Noise": [[0, "density-based-spatial-clustering-of-applications-with-noise"]], "Outlier Detection": [[0, "outlier-detection"]], "Multivariate Outlier Detection": [[0, "multivariate-outlier-detection"]], "Univariate Outlier Detection": [[0, "univariate-outlier-detection"]], "Multivariate Bacon Outlier Detection": [[0, "multivariate-bacon-outlier-detection"]], "Optimization Solvers": [[0, "optimization-solvers"]], "Objective Functions": [[0, "objective-functions"]], "Mean Squared Error Algorithm (MSE)": [[0, "mean-squared-error-algorithm-mse"]], "Logistic Loss": [[0, "logistic-loss"]], "Cross-entropy Loss": [[0, "cross-entropy-loss"]], "Iterative Solvers": [[0, "iterative-solvers"]], "Stochastic Gradient Descent Algorithm": [[0, "stochastic-gradient-descent-algorithm"]], "Limited-Memory Broyden-Fletcher-Goldfarb-Shanno Algorithm": [[0, "limited-memory-broyden-fletcher-goldfarb-shanno-algorithm"]], "Adaptive Subgradient Method": [[0, "adaptive-subgradient-method"]], "Stochastic Average Gradient Descent": [[0, "stochastic-average-gradient-descent"]], "Distances": [[0, "distances"]], "Cosine Distance Matrix": [[0, "cosine-distance-matrix"]], "Correlation Distance Matrix": [[0, "correlation-distance-matrix"]], "Expectation-Maximization (EM)": [[0, "expectation-maximization-em"]], "Initialization for the Gaussian Mixture Model": [[0, "initialization-for-the-gaussian-mixture-model"]], "EM algorithm for the Gaussian Mixture Model": [[0, "em-algorithm-for-the-gaussian-mixture-model"]], "QR Decomposition": [[0, "qr-decomposition"]], "QR Decomposition (without pivoting)": [[0, "qr-decomposition-without-pivoting"]], "Pivoted QR Decomposition": [[0, "pivoted-qr-decomposition"]], "Normalization": [[0, "normalization"]], "Z-Score": [[0, "z-score"]], "Min-Max": [[0, "min-max"]], "Random Number Engines": [[0, "random-number-engines"]], "mt19937": [[0, "mt19937"]], "mt2203": [[0, "mt2203"]], "mcg59": [[0, "mcg59"]], "Distributions": [[0, "distributions"]], "Bernoulli": [[0, "bernoulli"]], "Normal": [[0, "normal"]], "Uniform": [[0, "uniform"]], "Association Rules": [[0, "association-rules"]], "Cholesky Decomposition": [[0, "cholesky-decomposition"]], "Correlation and Variance-Covariance Matrices": [[0, "correlation-and-variance-covariance-matrices"]], "Implicit Alternating Least Squares (implicit ALS)": [[0, "implicit-alternating-least-squares-implicit-als"]], "Moments of Low Order": [[0, "moments-of-low-order"]], "Quantiles": [[0, "quantiles"]], "Singular Value Decomposition (SVD)": [[0, "singular-value-decomposition-svd"]], "Sorting": [[0, "sorting"]], "Trees": [[0, "trees"]], "Contents": [[1, "contents"]], "Contents:": [[1, null]], "Input Data": [[2, "input-data"]], "Numpy Arrays": [[2, "numpy-arrays"]], "Pandas DataFrames": [[2, "pandas-dataframes"]], "SciPy Sparse CSR Matrix": [[2, "scipy-sparse-csr-matrix"]], "CSV Files": [[2, "csv-files"]], "Examples": [[3, "examples"], [5, "examples"]], "General usage": [[3, "general-usage"]], "Fast, Scalable and Easy Machine Learning With DAAL4PY": [[4, "fast-scalable-and-easy-machine-learning-with-daal4py"]], "Designed for Data Scientists and Framework Designers": [[4, "designed-for-data-scientists-and-framework-designers"]], "API Design and usage": [[4, "api-design-and-usage"]], "oneAPI and GPU support in daal4py": [[4, "oneapi-and-gpu-support-in-daal4py"]], "Daal4py\u2019s Design": [[4, "daal4py-s-design"]], "Built for Performance": [[4, "built-for-performance"]], "Getting daal4py": [[4, "getting-daal4py"]], "Overview": [[4, "overview"]], "Scikit-Learn API and patching": [[4, "scikit-learn-api-and-patching"], [7, "scikit-learn-api-and-patching"]], "Model Builders for the Gradient Boosting Frameworks": [[5, "model-builders-for-the-gradient-boosting-frameworks"]], "Introduction": [[5, "introduction"]], "Conversion": [[5, "conversion"]], "Classification and Regression Inference": [[5, "classification-and-regression-inference"]], "SHAP Value Calculation for Regression Models": [[5, "shap-value-calculation-for-regression-models"]], "Scikit-learn-style Estimators": [[5, "scikit-learn-style-estimators"]], "Limitations": [[5, "limitations"]], "Articles and Blog Posts": [[5, "articles-and-blog-posts"]], "Scaling on Distributed Memory (Multiprocessing)": [[6, "scaling-on-distributed-memory-multiprocessing"]], "It\u2019s Easy": [[6, "it-s-easy"]], "Supported Algorithms and Examples": [[6, "supported-algorithms-and-examples"], [8, "supported-algorithms-and-examples"]], "Deprecation Notice": [[7, "deprecation-notice"]], "oneDAL accelerated scikit-learn": [[7, "onedal-accelerated-scikit-learn"]], "scikit-learn verbose": [[7, "scikit-learn-verbose"]], "scikit-learn API": [[7, "scikit-learn-api"]], "Streaming Data": [[8, "streaming-data"]]}, "indexentries": {"alpha (daal4py.adaboost_model attribute)": [[0, "daal4py.adaboost_model.Alpha"]], "alpha (daal4py.brownboost_model attribute)": [[0, "daal4py.brownboost_model.Alpha"]], "auxtable (daal4py.multinomial_naive_bayes_model attribute)": [[0, "daal4py.multinomial_naive_bayes_model.AuxTable"]], "beta (daal4py.lasso_regression_model attribute)": [[0, "daal4py.lasso_regression_model.Beta"]], "beta (daal4py.linear_regression_model attribute)": [[0, "daal4py.linear_regression_model.Beta"]], "beta (daal4py.logistic_regression_model attribute)": [[0, "daal4py.logistic_regression_model.Beta"]], "beta (daal4py.ridge_regression_model attribute)": [[0, "daal4py.ridge_regression_model.Beta"]], "bias (daal4py.svm_model attribute)": [[0, "daal4py.svm_model.Bias"]], "classificationcoefficients (daal4py.svm_model attribute)": [[0, "daal4py.svm_model.ClassificationCoefficients"]], "interceptflag (daal4py.lasso_regression_model attribute)": [[0, "daal4py.lasso_regression_model.InterceptFlag"]], "interceptflag (daal4py.linear_regression_model attribute)": [[0, "daal4py.linear_regression_model.InterceptFlag"]], "interceptflag (daal4py.logistic_regression_model attribute)": [[0, "daal4py.logistic_regression_model.InterceptFlag"]], "interceptflag (daal4py.ridge_regression_model attribute)": [[0, "daal4py.ridge_regression_model.InterceptFlag"]], "itemsfactors (daal4py.implicit_als_model attribute)": [[0, "daal4py.implicit_als_model.ItemsFactors"]], "iterations (daal4py.logitboost_model attribute)": [[0, "daal4py.logitboost_model.Iterations"]], "leftvalue (daal4py.stump_classification_model attribute)": [[0, "daal4py.stump_classification_model.LeftValue"]], "leftvalue (daal4py.stump_regression_model attribute)": [[0, "daal4py.stump_regression_model.LeftValue"]], "logp (daal4py.multinomial_naive_bayes_model attribute)": [[0, "daal4py.multinomial_naive_bayes_model.LogP"]], "logtheta (daal4py.multinomial_naive_bayes_model attribute)": [[0, "daal4py.multinomial_naive_bayes_model.LogTheta"]], "nfeatures (daal4py.adaboost_model attribute)": [[0, "daal4py.adaboost_model.NFeatures"]], "nfeatures (daal4py.bf_knn_classification_model attribute)": [[0, "daal4py.bf_knn_classification_model.NFeatures"]], "nfeatures (daal4py.brownboost_model attribute)": [[0, "daal4py.brownboost_model.NFeatures"]], "nfeatures (daal4py.decision_forest_classification_model attribute)": [[0, "daal4py.decision_forest_classification_model.NFeatures"]], "nfeatures (daal4py.decision_tree_classification_model attribute)": [[0, "daal4py.decision_tree_classification_model.NFeatures"]], "nfeatures (daal4py.gbt_classification_model attribute)": [[0, "daal4py.gbt_classification_model.NFeatures"]], "nfeatures (daal4py.kdtree_knn_classification_model attribute)": [[0, "daal4py.kdtree_knn_classification_model.NFeatures"]], "nfeatures (daal4py.logistic_regression_model attribute)": [[0, "daal4py.logistic_regression_model.NFeatures"]], "nfeatures (daal4py.logitboost_model attribute)": [[0, "daal4py.logitboost_model.NFeatures"]], "nfeatures (daal4py.multinomial_naive_bayes_model attribute)": [[0, "daal4py.multinomial_naive_bayes_model.NFeatures"]], "nfeatures (daal4py.stump_classification_model attribute)": [[0, "daal4py.stump_classification_model.NFeatures"]], "nfeatures (daal4py.svm_model attribute)": [[0, "daal4py.svm_model.NFeatures"]], "numberofbetas (daal4py.lasso_regression_model attribute)": [[0, "daal4py.lasso_regression_model.NumberOfBetas"]], "numberofbetas (daal4py.linear_regression_model attribute)": [[0, "daal4py.linear_regression_model.NumberOfBetas"]], "numberofbetas (daal4py.logistic_regression_model attribute)": [[0, "daal4py.logistic_regression_model.NumberOfBetas"]], "numberofbetas (daal4py.ridge_regression_model attribute)": [[0, "daal4py.ridge_regression_model.NumberOfBetas"]], "numberofclasses (daal4py.decision_forest_classification_model attribute)": [[0, "daal4py.decision_forest_classification_model.NumberOfClasses"]], "numberoffeatures (daal4py.adaboost_model attribute)": [[0, "daal4py.adaboost_model.NumberOfFeatures"]], "numberoffeatures (daal4py.bf_knn_classification_model attribute)": [[0, "daal4py.bf_knn_classification_model.NumberOfFeatures"]], "numberoffeatures (daal4py.brownboost_model attribute)": [[0, "daal4py.brownboost_model.NumberOfFeatures"]], "numberoffeatures (daal4py.decision_forest_classification_model attribute)": [[0, "daal4py.decision_forest_classification_model.NumberOfFeatures"]], "numberoffeatures (daal4py.decision_forest_regression_model attribute)": [[0, "daal4py.decision_forest_regression_model.NumberOfFeatures"]], "numberoffeatures (daal4py.decision_tree_classification_model attribute)": [[0, "daal4py.decision_tree_classification_model.NumberOfFeatures"]], "numberoffeatures (daal4py.decision_tree_regression_model attribute)": [[0, "daal4py.decision_tree_regression_model.NumberOfFeatures"]], "numberoffeatures (daal4py.gbt_classification_model attribute)": [[0, "daal4py.gbt_classification_model.NumberOfFeatures"]], "numberoffeatures (daal4py.gbt_regression_model attribute)": [[0, "daal4py.gbt_regression_model.NumberOfFeatures"]], "numberoffeatures (daal4py.kdtree_knn_classification_model attribute)": [[0, "daal4py.kdtree_knn_classification_model.NumberOfFeatures"]], "numberoffeatures (daal4py.lasso_regression_model attribute)": [[0, "daal4py.lasso_regression_model.NumberOfFeatures"]], "numberoffeatures (daal4py.linear_regression_model attribute)": [[0, "daal4py.linear_regression_model.NumberOfFeatures"]], "numberoffeatures (daal4py.logistic_regression_model attribute)": [[0, "daal4py.logistic_regression_model.NumberOfFeatures"]], "numberoffeatures (daal4py.logitboost_model attribute)": [[0, "daal4py.logitboost_model.NumberOfFeatures"]], "numberoffeatures (daal4py.multinomial_naive_bayes_model attribute)": [[0, "daal4py.multinomial_naive_bayes_model.NumberOfFeatures"]], "numberoffeatures (daal4py.ridge_regression_model attribute)": [[0, "daal4py.ridge_regression_model.NumberOfFeatures"]], "numberoffeatures (daal4py.stump_classification_model attribute)": [[0, "daal4py.stump_classification_model.NumberOfFeatures"]], "numberoffeatures (daal4py.stump_regression_model attribute)": [[0, "daal4py.stump_regression_model.NumberOfFeatures"]], "numberoffeatures (daal4py.svm_model attribute)": [[0, "daal4py.svm_model.NumberOfFeatures"]], "numberofresponses (daal4py.lasso_regression_model attribute)": [[0, "daal4py.lasso_regression_model.NumberOfResponses"]], "numberofresponses (daal4py.linear_regression_model attribute)": [[0, "daal4py.linear_regression_model.NumberOfResponses"]], "numberofresponses (daal4py.ridge_regression_model attribute)": [[0, "daal4py.ridge_regression_model.NumberOfResponses"]], "numberoftrees (daal4py.decision_forest_classification_model attribute)": [[0, "daal4py.decision_forest_classification_model.NumberOfTrees"]], "numberoftrees (daal4py.decision_forest_regression_model attribute)": [[0, "daal4py.decision_forest_regression_model.NumberOfTrees"]], "numberoftrees (daal4py.gbt_classification_model attribute)": [[0, "daal4py.gbt_classification_model.NumberOfTrees"]], "numberoftrees (daal4py.gbt_regression_model attribute)": [[0, "daal4py.gbt_regression_model.NumberOfTrees"]], "numberofweaklearners (daal4py.adaboost_model attribute)": [[0, "daal4py.adaboost_model.NumberOfWeakLearners"]], "numberofweaklearners (daal4py.brownboost_model attribute)": [[0, "daal4py.brownboost_model.NumberOfWeakLearners"]], "numberofweaklearners (daal4py.logitboost_model attribute)": [[0, "daal4py.logitboost_model.NumberOfWeakLearners"]], "predictionbias (daal4py.gbt_classification_model attribute)": [[0, "daal4py.gbt_classification_model.PredictionBias"]], "predictionbias (daal4py.gbt_regression_model attribute)": [[0, "daal4py.gbt_regression_model.PredictionBias"]], "rightvalue (daal4py.stump_classification_model attribute)": [[0, "daal4py.stump_classification_model.RightValue"]], "rightvalue (daal4py.stump_regression_model attribute)": [[0, "daal4py.stump_regression_model.RightValue"]], "splitfeature (daal4py.stump_classification_model attribute)": [[0, "daal4py.stump_classification_model.SplitFeature"]], "splitfeature (daal4py.stump_regression_model attribute)": [[0, "daal4py.stump_regression_model.SplitFeature"]], "splitvalue (daal4py.stump_classification_model attribute)": [[0, "daal4py.stump_classification_model.SplitValue"]], "splitvalue (daal4py.stump_regression_model attribute)": [[0, "daal4py.stump_regression_model.SplitValue"]], "supportindices (daal4py.svm_model attribute)": [[0, "daal4py.svm_model.SupportIndices"]], "supportvectors (daal4py.svm_model attribute)": [[0, "daal4py.svm_model.SupportVectors"]], "usersfactors (daal4py.implicit_als_model attribute)": [[0, "daal4py.implicit_als_model.UsersFactors"]], "weaklearnermodel() (daal4py.adaboost_model method)": [[0, "daal4py.adaboost_model.WeakLearnerModel"]], "weaklearnermodel() (daal4py.brownboost_model method)": [[0, "daal4py.brownboost_model.WeakLearnerModel"]], "weaklearnermodel() (daal4py.logitboost_model method)": [[0, "daal4py.logitboost_model.WeakLearnerModel"]], "adaboost_model (class in daal4py)": [[0, "daal4py.adaboost_model"]], "adaboost_prediction (class in daal4py)": [[0, "daal4py.adaboost_prediction"]], "adaboost_training (class in daal4py)": [[0, "daal4py.adaboost_training"]], "adaboost_training_result (class in daal4py)": [[0, "daal4py.adaboost_training_result"]], "antecedentitemsets (daal4py.association_rules_result attribute)": [[0, "daal4py.association_rules_result.antecedentItemsets"]], "assignments (daal4py.dbscan_result attribute)": [[0, "daal4py.dbscan_result.assignments"]], "assignments (daal4py.kmeans_result attribute)": [[0, "daal4py.kmeans_result.assignments"]], "association_rules (class in daal4py)": [[0, "daal4py.association_rules"]], "association_rules_result (class in daal4py)": [[0, "daal4py.association_rules_result"]], "bacon_outlier_detection (class in daal4py)": [[0, "daal4py.bacon_outlier_detection"]], "bacon_outlier_detection_result (class in daal4py)": [[0, "daal4py.bacon_outlier_detection_result"]], "bf_knn_classification_model (class in daal4py)": [[0, "daal4py.bf_knn_classification_model"]], "bf_knn_classification_prediction (class in daal4py)": [[0, "daal4py.bf_knn_classification_prediction"]], "bf_knn_classification_training (class in daal4py)": [[0, "daal4py.bf_knn_classification_training"]], "bf_knn_classification_training_result (class in daal4py)": [[0, "daal4py.bf_knn_classification_training_result"]], "brownboost_model (class in daal4py)": [[0, "daal4py.brownboost_model"]], "brownboost_prediction (class in daal4py)": [[0, "daal4py.brownboost_prediction"]], "brownboost_training (class in daal4py)": [[0, "daal4py.brownboost_training"]], "brownboost_training_result (class in daal4py)": [[0, "daal4py.brownboost_training_result"]], "centroids (daal4py.kmeans_init_result attribute)": [[0, "daal4py.kmeans_init_result.centroids"]], "centroids (daal4py.kmeans_result attribute)": [[0, "daal4py.kmeans_result.centroids"]], "cholesky (class in daal4py)": [[0, "daal4py.cholesky"]], "choleskyfactor (daal4py.cholesky_result attribute)": [[0, "daal4py.cholesky_result.choleskyFactor"]], "cholesky_result (class in daal4py)": [[0, "daal4py.cholesky_result"]], "classifier_prediction_result (class in daal4py)": [[0, "daal4py.classifier_prediction_result"], [0, "id0"], [0, "id12"], [0, "id16"], [0, "id20"], [0, "id24"], [0, "id28"], [0, "id32"], [0, "id36"], [0, "id4"], [0, "id40"], [0, "id8"]], "compute() (daal4py.adaboost_prediction method)": [[0, "daal4py.adaboost_prediction.compute"]], "compute() (daal4py.adaboost_training method)": [[0, "daal4py.adaboost_training.compute"]], "compute() (daal4py.association_rules method)": [[0, "daal4py.association_rules.compute"]], "compute() (daal4py.bacon_outlier_detection method)": [[0, "daal4py.bacon_outlier_detection.compute"]], "compute() (daal4py.bf_knn_classification_prediction method)": [[0, "daal4py.bf_knn_classification_prediction.compute"]], "compute() (daal4py.bf_knn_classification_training method)": [[0, "daal4py.bf_knn_classification_training.compute"]], "compute() (daal4py.brownboost_prediction method)": [[0, "daal4py.brownboost_prediction.compute"]], "compute() (daal4py.brownboost_training method)": [[0, "daal4py.brownboost_training.compute"]], "compute() (daal4py.cholesky method)": [[0, "daal4py.cholesky.compute"]], "compute() (daal4py.correlation_distance method)": [[0, "daal4py.correlation_distance.compute"]], "compute() (daal4py.cosine_distance method)": [[0, "daal4py.cosine_distance.compute"]], "compute() (daal4py.covariance method)": [[0, "daal4py.covariance.compute"]], "compute() (daal4py.dbscan method)": [[0, "daal4py.dbscan.compute"]], "compute() (daal4py.decision_forest_classification_prediction method)": [[0, "daal4py.decision_forest_classification_prediction.compute"]], "compute() (daal4py.decision_forest_classification_training method)": [[0, "daal4py.decision_forest_classification_training.compute"]], "compute() (daal4py.decision_forest_regression_prediction method)": [[0, "daal4py.decision_forest_regression_prediction.compute"]], "compute() (daal4py.decision_forest_regression_training method)": [[0, "daal4py.decision_forest_regression_training.compute"]], "compute() (daal4py.decision_tree_classification_prediction method)": [[0, "daal4py.decision_tree_classification_prediction.compute"]], "compute() (daal4py.decision_tree_classification_training method)": [[0, "daal4py.decision_tree_classification_training.compute"]], "compute() (daal4py.decision_tree_regression_prediction method)": [[0, "daal4py.decision_tree_regression_prediction.compute"]], "compute() (daal4py.decision_tree_regression_training method)": [[0, "daal4py.decision_tree_regression_training.compute"]], "compute() (daal4py.distributions_bernoulli method)": [[0, "daal4py.distributions_bernoulli.compute"]], "compute() (daal4py.distributions_normal method)": [[0, "daal4py.distributions_normal.compute"]], "compute() (daal4py.distributions_uniform method)": [[0, "daal4py.distributions_uniform.compute"]], "compute() (daal4py.em_gmm method)": [[0, "daal4py.em_gmm.compute"]], "compute() (daal4py.em_gmm_init method)": [[0, "daal4py.em_gmm_init.compute"]], "compute() (daal4py.engines_mcg59 method)": [[0, "daal4py.engines_mcg59.compute"]], "compute() (daal4py.engines_mt19937 method)": [[0, "daal4py.engines_mt19937.compute"]], "compute() (daal4py.engines_mt2203 method)": [[0, "daal4py.engines_mt2203.compute"]], "compute() (daal4py.gbt_classification_prediction method)": [[0, "daal4py.gbt_classification_prediction.compute"]], "compute() (daal4py.gbt_classification_training method)": [[0, "daal4py.gbt_classification_training.compute"]], "compute() (daal4py.gbt_regression_prediction method)": [[0, "daal4py.gbt_regression_prediction.compute"]], "compute() (daal4py.gbt_regression_training method)": [[0, "daal4py.gbt_regression_training.compute"]], "compute() (daal4py.implicit_als_prediction_ratings method)": [[0, "daal4py.implicit_als_prediction_ratings.compute"]], "compute() (daal4py.implicit_als_training method)": [[0, "daal4py.implicit_als_training.compute"]], "compute() (daal4py.kdtree_knn_classification_prediction method)": [[0, "daal4py.kdtree_knn_classification_prediction.compute"]], "compute() (daal4py.kdtree_knn_classification_training method)": [[0, "daal4py.kdtree_knn_classification_training.compute"]], "compute() (daal4py.kmeans method)": [[0, "daal4py.kmeans.compute"]], "compute() (daal4py.kmeans_init method)": [[0, "daal4py.kmeans_init.compute"]], "compute() (daal4py.lasso_regression_prediction method)": [[0, "daal4py.lasso_regression_prediction.compute"]], "compute() (daal4py.lasso_regression_training method)": [[0, "daal4py.lasso_regression_training.compute"]], "compute() (daal4py.linear_regression_prediction method)": [[0, "daal4py.linear_regression_prediction.compute"]], "compute() (daal4py.linear_regression_training method)": [[0, "daal4py.linear_regression_training.compute"]], "compute() (daal4py.logistic_regression_prediction method)": [[0, "daal4py.logistic_regression_prediction.compute"]], "compute() (daal4py.logistic_regression_training method)": [[0, "daal4py.logistic_regression_training.compute"]], "compute() (daal4py.logitboost_prediction method)": [[0, "daal4py.logitboost_prediction.compute"]], "compute() (daal4py.logitboost_training method)": [[0, "daal4py.logitboost_training.compute"]], "compute() (daal4py.low_order_moments method)": [[0, "daal4py.low_order_moments.compute"]], "compute() (daal4py.multinomial_naive_bayes_prediction method)": [[0, "daal4py.multinomial_naive_bayes_prediction.compute"]], "compute() (daal4py.multinomial_naive_bayes_training method)": [[0, "daal4py.multinomial_naive_bayes_training.compute"]], "compute() (daal4py.multivariate_outlier_detection method)": [[0, "daal4py.multivariate_outlier_detection.compute"]], "compute() (daal4py.normalization_minmax method)": [[0, "daal4py.normalization_minmax.compute"]], "compute() (daal4py.normalization_zscore method)": [[0, "daal4py.normalization_zscore.compute"]], "compute() (daal4py.optimization_solver_adagrad method)": [[0, "daal4py.optimization_solver_adagrad.compute"]], "compute() (daal4py.optimization_solver_cross_entropy_loss method)": [[0, "daal4py.optimization_solver_cross_entropy_loss.compute"]], "compute() (daal4py.optimization_solver_lbfgs method)": [[0, "daal4py.optimization_solver_lbfgs.compute"]], "compute() (daal4py.optimization_solver_logistic_loss method)": [[0, "daal4py.optimization_solver_logistic_loss.compute"]], "compute() (daal4py.optimization_solver_mse method)": [[0, "daal4py.optimization_solver_mse.compute"]], "compute() (daal4py.optimization_solver_saga method)": [[0, "daal4py.optimization_solver_saga.compute"]], "compute() (daal4py.optimization_solver_sgd method)": [[0, "daal4py.optimization_solver_sgd.compute"]], "compute() (daal4py.pca method)": [[0, "daal4py.pca.compute"]], "compute() (daal4py.pca_transform method)": [[0, "daal4py.pca_transform.compute"]], "compute() (daal4py.pivoted_qr method)": [[0, "daal4py.pivoted_qr.compute"]], "compute() (daal4py.qr method)": [[0, "daal4py.qr.compute"]], "compute() (daal4py.quantiles method)": [[0, "daal4py.quantiles.compute"]], "compute() (daal4py.ridge_regression_prediction method)": [[0, "daal4py.ridge_regression_prediction.compute"]], "compute() (daal4py.ridge_regression_training method)": [[0, "daal4py.ridge_regression_training.compute"]], "compute() (daal4py.sorting method)": [[0, "daal4py.sorting.compute"]], "compute() (daal4py.stump_classification_prediction method)": [[0, "daal4py.stump_classification_prediction.compute"]], "compute() (daal4py.stump_classification_training method)": [[0, "daal4py.stump_classification_training.compute"]], "compute() (daal4py.stump_regression_prediction method)": [[0, "daal4py.stump_regression_prediction.compute"]], "compute() (daal4py.stump_regression_training method)": [[0, "daal4py.stump_regression_training.compute"]], "compute() (daal4py.svd method)": [[0, "daal4py.svd.compute"]], "compute() (daal4py.svm_prediction method)": [[0, "daal4py.svm_prediction.compute"]], "compute() (daal4py.svm_training method)": [[0, "daal4py.svm_training.compute"]], "compute() (daal4py.univariate_outlier_detection method)": [[0, "daal4py.univariate_outlier_detection.compute"]], "confidence (daal4py.association_rules_result attribute)": [[0, "daal4py.association_rules_result.confidence"]], "consequentitemsets (daal4py.association_rules_result attribute)": [[0, "daal4py.association_rules_result.consequentItemsets"]], "coreindices (daal4py.dbscan_result attribute)": [[0, "daal4py.dbscan_result.coreIndices"]], "coreobservations (daal4py.dbscan_result attribute)": [[0, "daal4py.dbscan_result.coreObservations"]], "correlation (daal4py.covariance_result attribute)": [[0, "daal4py.covariance_result.correlation"]], "correlationdistance (daal4py.correlation_distance_result attribute)": [[0, "daal4py.correlation_distance_result.correlationDistance"]], "correlation_distance (class in daal4py)": [[0, "daal4py.correlation_distance"]], "correlation_distance_result (class in daal4py)": [[0, "daal4py.correlation_distance_result"]], "cosinedistance (daal4py.cosine_distance_result attribute)": [[0, "daal4py.cosine_distance_result.cosineDistance"]], "cosine_distance (class in daal4py)": [[0, "daal4py.cosine_distance"]], "cosine_distance_result (class in daal4py)": [[0, "daal4py.cosine_distance_result"]], "covariance (class in daal4py)": [[0, "daal4py.covariance"]], "covariance (daal4py.covariance_result attribute)": [[0, "daal4py.covariance_result.covariance"]], "covariance_result (class in daal4py)": [[0, "daal4py.covariance_result"]], "covariances (daal4py.em_gmm_init_result attribute)": [[0, "daal4py.em_gmm_init_result.covariances"]], "covariances (daal4py.em_gmm_result attribute)": [[0, "daal4py.em_gmm_result.covariances"]], "datafortransform (daal4py.pca_result attribute)": [[0, "daal4py.pca_result.dataForTransform"]], "dbscan (class in daal4py)": [[0, "daal4py.dbscan"]], "dbscan_result (class in daal4py)": [[0, "daal4py.dbscan_result"]], "decision_forest_classification_model (class in daal4py)": [[0, "daal4py.decision_forest_classification_model"]], "decision_forest_classification_prediction (class in daal4py)": [[0, "daal4py.decision_forest_classification_prediction"]], "decision_forest_classification_training (class in daal4py)": [[0, "daal4py.decision_forest_classification_training"]], "decision_forest_classification_training_result (class in daal4py)": [[0, "daal4py.decision_forest_classification_training_result"]], "decision_forest_regression_model (class in daal4py)": [[0, "daal4py.decision_forest_regression_model"]], "decision_forest_regression_prediction (class in daal4py)": [[0, "daal4py.decision_forest_regression_prediction"]], "decision_forest_regression_prediction_result (class in daal4py)": [[0, "daal4py.decision_forest_regression_prediction_result"]], "decision_forest_regression_training (class in daal4py)": [[0, "daal4py.decision_forest_regression_training"]], "decision_forest_regression_training_result (class in daal4py)": [[0, "daal4py.decision_forest_regression_training_result"]], "decision_tree_classification_model (class in daal4py)": [[0, "daal4py.decision_tree_classification_model"]], "decision_tree_classification_prediction (class in daal4py)": [[0, "daal4py.decision_tree_classification_prediction"]], "decision_tree_classification_training (class in daal4py)": [[0, "daal4py.decision_tree_classification_training"]], "decision_tree_classification_training_result (class in daal4py)": [[0, "daal4py.decision_tree_classification_training_result"]], "decision_tree_regression_model (class in daal4py)": [[0, "daal4py.decision_tree_regression_model"]], "decision_tree_regression_prediction (class in daal4py)": [[0, "daal4py.decision_tree_regression_prediction"]], "decision_tree_regression_prediction_result (class in daal4py)": [[0, "daal4py.decision_tree_regression_prediction_result"]], "decision_tree_regression_training (class in daal4py)": [[0, "daal4py.decision_tree_regression_training"]], "decision_tree_regression_training_result (class in daal4py)": [[0, "daal4py.decision_tree_regression_training_result"]], "distributions_bernoulli (class in daal4py)": [[0, "daal4py.distributions_bernoulli"]], "distributions_bernoulli_result (in module daal4py)": [[0, "daal4py.distributions_bernoulli_result"]], "distributions_normal (class in daal4py)": [[0, "daal4py.distributions_normal"]], "distributions_normal_result (in module daal4py)": [[0, "daal4py.distributions_normal_result"]], "distributions_uniform (class in daal4py)": [[0, "daal4py.distributions_uniform"]], "distributions_uniform_result (in module daal4py)": [[0, "daal4py.distributions_uniform_result"]], "eigenvalues (daal4py.pca_result attribute)": [[0, "daal4py.pca_result.eigenvalues"]], "eigenvectors (daal4py.pca_result attribute)": [[0, "daal4py.pca_result.eigenvectors"]], "em_gmm (class in daal4py)": [[0, "daal4py.em_gmm"]], "em_gmm_init (class in daal4py)": [[0, "daal4py.em_gmm_init"]], "em_gmm_init_result (class in daal4py)": [[0, "daal4py.em_gmm_init_result"]], "em_gmm_result (class in daal4py)": [[0, "daal4py.em_gmm_result"]], "engines_mcg59 (class in daal4py)": [[0, "daal4py.engines_mcg59"]], "engines_mcg59_result (in module daal4py)": [[0, "daal4py.engines_mcg59_result"]], "engines_mt19937 (class in daal4py)": [[0, "daal4py.engines_mt19937"]], "engines_mt19937_result (in module daal4py)": [[0, "daal4py.engines_mt19937_result"]], "engines_mt2203 (class in daal4py)": [[0, "daal4py.engines_mt2203"]], "engines_mt2203_result (in module daal4py)": [[0, "daal4py.engines_mt2203_result"]], "engines_result (class in daal4py)": [[0, "daal4py.engines_result"]], "gbt_classification_model (class in daal4py)": [[0, "daal4py.gbt_classification_model"]], "gbt_classification_prediction (class in daal4py)": [[0, "daal4py.gbt_classification_prediction"]], "gbt_classification_training (class in daal4py)": [[0, "daal4py.gbt_classification_training"]], "gbt_classification_training_result (class in daal4py)": [[0, "daal4py.gbt_classification_training_result"]], "gbt_regression_model (class in daal4py)": [[0, "daal4py.gbt_regression_model"]], "gbt_regression_prediction (class in daal4py)": [[0, "daal4py.gbt_regression_prediction"]], "gbt_regression_prediction_result (class in daal4py)": [[0, "daal4py.gbt_regression_prediction_result"]], "gbt_regression_training (class in daal4py)": [[0, "daal4py.gbt_regression_training"]], "gbt_regression_training_result (class in daal4py)": [[0, "daal4py.gbt_regression_training_result"]], "gettreestate() (in module daal4py)": [[0, "daal4py.getTreeState"]], "goalfunction (daal4py.em_gmm_result attribute)": [[0, "daal4py.em_gmm_result.goalFunction"]], "gradientstable (daal4py.optimization_solver_saga_result attribute)": [[0, "daal4py.optimization_solver_saga_result.gradientsTable"]], "grammatrixid (daal4py.lasso_regression_training_result attribute)": [[0, "daal4py.lasso_regression_training_result.gramMatrixId"]], "implicit_als_model (class in daal4py)": [[0, "daal4py.implicit_als_model"]], "implicit_als_prediction_ratings (class in daal4py)": [[0, "daal4py.implicit_als_prediction_ratings"]], "implicit_als_prediction_ratings_result (class in daal4py)": [[0, "daal4py.implicit_als_prediction_ratings_result"]], "implicit_als_training (class in daal4py)": [[0, "daal4py.implicit_als_training"]], "implicit_als_training_result (class in daal4py)": [[0, "daal4py.implicit_als_training_result"]], "kdtree_knn_classification_model (class in daal4py)": [[0, "daal4py.kdtree_knn_classification_model"]], "kdtree_knn_classification_prediction (class in daal4py)": [[0, "daal4py.kdtree_knn_classification_prediction"]], "kdtree_knn_classification_training (class in daal4py)": [[0, "daal4py.kdtree_knn_classification_training"]], "kdtree_knn_classification_training_result (class in daal4py)": [[0, "daal4py.kdtree_knn_classification_training_result"]], "kmeans (class in daal4py)": [[0, "daal4py.kmeans"]], "kmeans_init (class in daal4py)": [[0, "daal4py.kmeans_init"]], "kmeans_init_result (class in daal4py)": [[0, "daal4py.kmeans_init_result"]], "kmeans_result (class in daal4py)": [[0, "daal4py.kmeans_result"]], "largeitemsets (daal4py.association_rules_result attribute)": [[0, "daal4py.association_rules_result.largeItemsets"]], "largeitemsetssupport (daal4py.association_rules_result attribute)": [[0, "daal4py.association_rules_result.largeItemsetsSupport"]], "lasso_regression_model (class in daal4py)": [[0, "daal4py.lasso_regression_model"]], "lasso_regression_prediction (class in daal4py)": [[0, "daal4py.lasso_regression_prediction"]], "lasso_regression_prediction_result (class in daal4py)": [[0, "daal4py.lasso_regression_prediction_result"]], "lasso_regression_training (class in daal4py)": [[0, "daal4py.lasso_regression_training"]], "lasso_regression_training_result (class in daal4py)": [[0, "daal4py.lasso_regression_training_result"]], "leftsingularmatrix (daal4py.svd_result attribute)": [[0, "daal4py.svd_result.leftSingularMatrix"]], "linear_regression_model (class in daal4py)": [[0, "daal4py.linear_regression_model"]], "linear_regression_prediction (class in daal4py)": [[0, "daal4py.linear_regression_prediction"]], "linear_regression_prediction_result (class in daal4py)": [[0, "daal4py.linear_regression_prediction_result"]], "linear_regression_training (class in daal4py)": [[0, "daal4py.linear_regression_training"]], "linear_regression_training_result (class in daal4py)": [[0, "daal4py.linear_regression_training_result"]], "logprobabilities (daal4py.classifier_prediction_result attribute)": [[0, "daal4py.classifier_prediction_result.logProbabilities"], [0, "id1"], [0, "id13"], [0, "id17"], [0, "id21"], [0, "id25"], [0, "id29"], [0, "id33"], [0, "id37"], [0, "id41"], [0, "id5"], [0, "id9"]], "logistic_regression_model (class in daal4py)": [[0, "daal4py.logistic_regression_model"]], "logistic_regression_prediction (class in daal4py)": [[0, "daal4py.logistic_regression_prediction"]], "logistic_regression_training (class in daal4py)": [[0, "daal4py.logistic_regression_training"]], "logistic_regression_training_result (class in daal4py)": [[0, "daal4py.logistic_regression_training_result"]], "logitboost_model (class in daal4py)": [[0, "daal4py.logitboost_model"]], "logitboost_prediction (class in daal4py)": [[0, "daal4py.logitboost_prediction"]], "logitboost_training (class in daal4py)": [[0, "daal4py.logitboost_training"]], "logitboost_training_result (class in daal4py)": [[0, "daal4py.logitboost_training_result"]], "low_order_moments (class in daal4py)": [[0, "daal4py.low_order_moments"]], "low_order_moments_result (class in daal4py)": [[0, "daal4py.low_order_moments_result"]], "matrixq (daal4py.pivoted_qr_result attribute)": [[0, "daal4py.pivoted_qr_result.matrixQ"]], "matrixq (daal4py.qr_result attribute)": [[0, "daal4py.qr_result.matrixQ"]], "matrixr (daal4py.pivoted_qr_result attribute)": [[0, "daal4py.pivoted_qr_result.matrixR"]], "matrixr (daal4py.qr_result attribute)": [[0, "daal4py.qr_result.matrixR"]], "maximum (daal4py.low_order_moments_result attribute)": [[0, "daal4py.low_order_moments_result.maximum"]], "mean (daal4py.covariance_result attribute)": [[0, "daal4py.covariance_result.mean"]], "mean (daal4py.low_order_moments_result attribute)": [[0, "daal4py.low_order_moments_result.mean"]], "means (daal4py.em_gmm_init_result attribute)": [[0, "daal4py.em_gmm_init_result.means"]], "means (daal4py.em_gmm_result attribute)": [[0, "daal4py.em_gmm_result.means"]], "means (daal4py.normalization_zscore_result attribute)": [[0, "daal4py.normalization_zscore_result.means"]], "means (daal4py.pca_result attribute)": [[0, "daal4py.pca_result.means"]], "minimum (daal4py.low_order_moments_result attribute)": [[0, "daal4py.low_order_moments_result.minimum"]], "minimum (daal4py.optimization_solver_adagrad_result attribute)": [[0, "daal4py.optimization_solver_adagrad_result.minimum"]], "minimum (daal4py.optimization_solver_lbfgs_result attribute)": [[0, "daal4py.optimization_solver_lbfgs_result.minimum"]], "minimum (daal4py.optimization_solver_saga_result attribute)": [[0, "daal4py.optimization_solver_saga_result.minimum"]], "minimum (daal4py.optimization_solver_sgd_result attribute)": [[0, "daal4py.optimization_solver_sgd_result.minimum"]], "model (daal4py.adaboost_training_result attribute)": [[0, "daal4py.adaboost_training_result.model"]], "model (daal4py.bf_knn_classification_training_result attribute)": [[0, "daal4py.bf_knn_classification_training_result.model"]], "model (daal4py.brownboost_training_result attribute)": [[0, "daal4py.brownboost_training_result.model"]], "model (daal4py.decision_forest_classification_training_result attribute)": [[0, "daal4py.decision_forest_classification_training_result.model"]], "model (daal4py.decision_forest_regression_training_result attribute)": [[0, "daal4py.decision_forest_regression_training_result.model"]], "model (daal4py.decision_tree_classification_training_result attribute)": [[0, "daal4py.decision_tree_classification_training_result.model"]], "model (daal4py.decision_tree_regression_training_result attribute)": [[0, "daal4py.decision_tree_regression_training_result.model"]], "model (daal4py.gbt_classification_training_result attribute)": [[0, "daal4py.gbt_classification_training_result.model"]], "model (daal4py.gbt_regression_training_result attribute)": [[0, "daal4py.gbt_regression_training_result.model"]], "model (daal4py.implicit_als_training_result attribute)": [[0, "daal4py.implicit_als_training_result.model"]], "model (daal4py.kdtree_knn_classification_training_result attribute)": [[0, "daal4py.kdtree_knn_classification_training_result.model"]], "model (daal4py.lasso_regression_training_result attribute)": [[0, "daal4py.lasso_regression_training_result.model"]], "model (daal4py.linear_regression_training_result attribute)": [[0, "daal4py.linear_regression_training_result.model"]], "model (daal4py.logistic_regression_training_result attribute)": [[0, "daal4py.logistic_regression_training_result.model"]], "model (daal4py.logitboost_training_result attribute)": [[0, "daal4py.logitboost_training_result.model"]], "model (daal4py.multinomial_naive_bayes_training_result attribute)": [[0, "daal4py.multinomial_naive_bayes_training_result.model"]], "model (daal4py.ridge_regression_training_result attribute)": [[0, "daal4py.ridge_regression_training_result.model"]], "model (daal4py.stump_classification_training_result attribute)": [[0, "daal4py.stump_classification_training_result.model"]], "model (daal4py.stump_regression_training_result attribute)": [[0, "daal4py.stump_regression_training_result.model"]], "model (daal4py.svm_training_result attribute)": [[0, "daal4py.svm_training_result.model"]], "multinomial_naive_bayes_model (class in daal4py)": [[0, "daal4py.multinomial_naive_bayes_model"]], "multinomial_naive_bayes_prediction (class in daal4py)": [[0, "daal4py.multinomial_naive_bayes_prediction"]], "multinomial_naive_bayes_training (class in daal4py)": [[0, "daal4py.multinomial_naive_bayes_training"]], "multinomial_naive_bayes_training_result (class in daal4py)": [[0, "daal4py.multinomial_naive_bayes_training_result"]], "multivariate_outlier_detection (class in daal4py)": [[0, "daal4py.multivariate_outlier_detection"]], "multivariate_outlier_detection_result (class in daal4py)": [[0, "daal4py.multivariate_outlier_detection_result"]], "nclusters (daal4py.dbscan_result attribute)": [[0, "daal4py.dbscan_result.nClusters"]], "niterations (daal4py.em_gmm_result attribute)": [[0, "daal4py.em_gmm_result.nIterations"]], "niterations (daal4py.kmeans_result attribute)": [[0, "daal4py.kmeans_result.nIterations"]], "niterations (daal4py.optimization_solver_adagrad_result attribute)": [[0, "daal4py.optimization_solver_adagrad_result.nIterations"]], "niterations (daal4py.optimization_solver_lbfgs_result attribute)": [[0, "daal4py.optimization_solver_lbfgs_result.nIterations"]], "niterations (daal4py.optimization_solver_saga_result attribute)": [[0, "daal4py.optimization_solver_saga_result.nIterations"]], "niterations (daal4py.optimization_solver_sgd_result attribute)": [[0, "daal4py.optimization_solver_sgd_result.nIterations"]], "normalization_minmax (class in daal4py)": [[0, "daal4py.normalization_minmax"]], "normalization_minmax_result (class in daal4py)": [[0, "daal4py.normalization_minmax_result"]], "normalization_zscore (class in daal4py)": [[0, "daal4py.normalization_zscore"]], "normalization_zscore_result (class in daal4py)": [[0, "daal4py.normalization_zscore_result"]], "normalizeddata (daal4py.normalization_minmax_result attribute)": [[0, "daal4py.normalization_minmax_result.normalizedData"]], "normalizeddata (daal4py.normalization_zscore_result attribute)": [[0, "daal4py.normalization_zscore_result.normalizedData"]], "objectivefunction (daal4py.kmeans_result attribute)": [[0, "daal4py.kmeans_result.objectiveFunction"]], "optimization_solver_adagrad (class in daal4py)": [[0, "daal4py.optimization_solver_adagrad"]], "optimization_solver_adagrad_result (class in daal4py)": [[0, "daal4py.optimization_solver_adagrad_result"]], "optimization_solver_cross_entropy_loss (class in daal4py)": [[0, "daal4py.optimization_solver_cross_entropy_loss"]], "optimization_solver_cross_entropy_loss_result (in module daal4py)": [[0, "daal4py.optimization_solver_cross_entropy_loss_result"]], "optimization_solver_lbfgs (class in daal4py)": [[0, "daal4py.optimization_solver_lbfgs"]], "optimization_solver_lbfgs_result (class in daal4py)": [[0, "daal4py.optimization_solver_lbfgs_result"]], "optimization_solver_logistic_loss (class in daal4py)": [[0, "daal4py.optimization_solver_logistic_loss"]], "optimization_solver_logistic_loss_result (in module daal4py)": [[0, "daal4py.optimization_solver_logistic_loss_result"]], "optimization_solver_mse (class in daal4py)": [[0, "daal4py.optimization_solver_mse"]], "optimization_solver_mse_result (in module daal4py)": [[0, "daal4py.optimization_solver_mse_result"]], "optimization_solver_saga (class in daal4py)": [[0, "daal4py.optimization_solver_saga"]], "optimization_solver_saga_result (class in daal4py)": [[0, "daal4py.optimization_solver_saga_result"]], "optimization_solver_sgd (class in daal4py)": [[0, "daal4py.optimization_solver_sgd"]], "optimization_solver_sgd_result (class in daal4py)": [[0, "daal4py.optimization_solver_sgd_result"]], "outofbagerror (daal4py.decision_forest_classification_training_result attribute)": [[0, "daal4py.decision_forest_classification_training_result.outOfBagError"]], "outofbagerror (daal4py.decision_forest_regression_training_result attribute)": [[0, "daal4py.decision_forest_regression_training_result.outOfBagError"]], "outofbagerroraccuracy (daal4py.decision_forest_classification_training_result attribute)": [[0, "daal4py.decision_forest_classification_training_result.outOfBagErrorAccuracy"]], "outofbagerrordecisionfunction (daal4py.decision_forest_classification_training_result attribute)": [[0, "daal4py.decision_forest_classification_training_result.outOfBagErrorDecisionFunction"]], "outofbagerrorperobservation (daal4py.decision_forest_classification_training_result attribute)": [[0, "daal4py.decision_forest_classification_training_result.outOfBagErrorPerObservation"]], "outofbagerrorperobservation (daal4py.decision_forest_regression_training_result attribute)": [[0, "daal4py.decision_forest_regression_training_result.outOfBagErrorPerObservation"]], "outofbagerrorprediction (daal4py.decision_forest_regression_training_result attribute)": [[0, "daal4py.decision_forest_regression_training_result.outOfBagErrorPrediction"]], "outofbagerrorr2 (daal4py.decision_forest_regression_training_result attribute)": [[0, "daal4py.decision_forest_regression_training_result.outOfBagErrorR2"]], "pca (class in daal4py)": [[0, "daal4py.pca"]], "pca_result (class in daal4py)": [[0, "daal4py.pca_result"]], "pca_transform (class in daal4py)": [[0, "daal4py.pca_transform"]], "pca_transform_result (class in daal4py)": [[0, "daal4py.pca_transform_result"]], "permutationmatrix (daal4py.pivoted_qr_result attribute)": [[0, "daal4py.pivoted_qr_result.permutationMatrix"]], "pivoted_qr (class in daal4py)": [[0, "daal4py.pivoted_qr"]], "pivoted_qr_result (class in daal4py)": [[0, "daal4py.pivoted_qr_result"]], "prediction (daal4py.classifier_prediction_result attribute)": [[0, "daal4py.classifier_prediction_result.prediction"], [0, "id10"], [0, "id14"], [0, "id18"], [0, "id2"], [0, "id22"], [0, "id26"], [0, "id30"], [0, "id34"], [0, "id38"], [0, "id42"], [0, "id6"]], "prediction (daal4py.decision_forest_regression_prediction_result attribute)": [[0, "daal4py.decision_forest_regression_prediction_result.prediction"]], "prediction (daal4py.decision_tree_regression_prediction_result attribute)": [[0, "daal4py.decision_tree_regression_prediction_result.prediction"]], "prediction (daal4py.gbt_regression_prediction_result attribute)": [[0, "daal4py.gbt_regression_prediction_result.prediction"]], "prediction (daal4py.implicit_als_prediction_ratings_result attribute)": [[0, "daal4py.implicit_als_prediction_ratings_result.prediction"]], "prediction (daal4py.lasso_regression_prediction_result attribute)": [[0, "daal4py.lasso_regression_prediction_result.prediction"]], "prediction (daal4py.linear_regression_prediction_result attribute)": [[0, "daal4py.linear_regression_prediction_result.prediction"]], "prediction (daal4py.ridge_regression_prediction_result attribute)": [[0, "daal4py.ridge_regression_prediction_result.prediction"]], "prediction (daal4py.stump_regression_prediction_result attribute)": [[0, "daal4py.stump_regression_prediction_result.prediction"]], "probabilities (daal4py.classifier_prediction_result attribute)": [[0, "daal4py.classifier_prediction_result.probabilities"], [0, "id11"], [0, "id15"], [0, "id19"], [0, "id23"], [0, "id27"], [0, "id3"], [0, "id31"], [0, "id35"], [0, "id39"], [0, "id43"], [0, "id7"]], "qr (class in daal4py)": [[0, "daal4py.qr"]], "qr_result (class in daal4py)": [[0, "daal4py.qr_result"]], "quantiles (class in daal4py)": [[0, "daal4py.quantiles"]], "quantiles (daal4py.quantiles_result attribute)": [[0, "daal4py.quantiles_result.quantiles"]], "quantiles_result (class in daal4py)": [[0, "daal4py.quantiles_result"]], "randomnumbers (daal4py.engines_result attribute)": [[0, "daal4py.engines_result.randomNumbers"]], "ridge_regression_model (class in daal4py)": [[0, "daal4py.ridge_regression_model"]], "ridge_regression_prediction (class in daal4py)": [[0, "daal4py.ridge_regression_prediction"]], "ridge_regression_prediction_result (class in daal4py)": [[0, "daal4py.ridge_regression_prediction_result"]], "ridge_regression_training (class in daal4py)": [[0, "daal4py.ridge_regression_training"]], "ridge_regression_training_result (class in daal4py)": [[0, "daal4py.ridge_regression_training_result"]], "rightsingularmatrix (daal4py.svd_result attribute)": [[0, "daal4py.svd_result.rightSingularMatrix"]], "secondorderrawmoment (daal4py.low_order_moments_result attribute)": [[0, "daal4py.low_order_moments_result.secondOrderRawMoment"]], "setup() (daal4py.optimization_solver_cross_entropy_loss method)": [[0, "daal4py.optimization_solver_cross_entropy_loss.setup"]], "setup() (daal4py.optimization_solver_logistic_loss method)": [[0, "daal4py.optimization_solver_logistic_loss.setup"]], "setup() (daal4py.optimization_solver_mse method)": [[0, "daal4py.optimization_solver_mse.setup"]], "singularvalues (daal4py.svd_result attribute)": [[0, "daal4py.svd_result.singularValues"]], "sorteddata (daal4py.sorting_result attribute)": [[0, "daal4py.sorting_result.sortedData"]], "sorting (class in daal4py)": [[0, "daal4py.sorting"]], "sorting_result (class in daal4py)": [[0, "daal4py.sorting_result"]], "standarddeviation (daal4py.low_order_moments_result attribute)": [[0, "daal4py.low_order_moments_result.standardDeviation"]], "stump_classification_model (class in daal4py)": [[0, "daal4py.stump_classification_model"]], "stump_classification_prediction (class in daal4py)": [[0, "daal4py.stump_classification_prediction"]], "stump_classification_training (class in daal4py)": [[0, "daal4py.stump_classification_training"]], "stump_classification_training_result (class in daal4py)": [[0, "daal4py.stump_classification_training_result"]], "stump_regression_model (class in daal4py)": [[0, "daal4py.stump_regression_model"]], "stump_regression_prediction (class in daal4py)": [[0, "daal4py.stump_regression_prediction"]], "stump_regression_prediction_result (class in daal4py)": [[0, "daal4py.stump_regression_prediction_result"]], "stump_regression_training (class in daal4py)": [[0, "daal4py.stump_regression_training"]], "stump_regression_training_result (class in daal4py)": [[0, "daal4py.stump_regression_training_result"]], "sum (daal4py.low_order_moments_result attribute)": [[0, "daal4py.low_order_moments_result.sum"]], "sumsquares (daal4py.low_order_moments_result attribute)": [[0, "daal4py.low_order_moments_result.sumSquares"]], "sumsquarescentered (daal4py.low_order_moments_result attribute)": [[0, "daal4py.low_order_moments_result.sumSquaresCentered"]], "svd (class in daal4py)": [[0, "daal4py.svd"]], "svd_result (class in daal4py)": [[0, "daal4py.svd_result"]], "svm_model (class in daal4py)": [[0, "daal4py.svm_model"]], "svm_prediction (class in daal4py)": [[0, "daal4py.svm_prediction"]], "svm_training (class in daal4py)": [[0, "daal4py.svm_training"]], "svm_training_result (class in daal4py)": [[0, "daal4py.svm_training_result"]], "transformeddata (daal4py.pca_transform_result attribute)": [[0, "daal4py.pca_transform_result.transformedData"]], "univariate_outlier_detection (class in daal4py)": [[0, "daal4py.univariate_outlier_detection"]], "univariate_outlier_detection_result (class in daal4py)": [[0, "daal4py.univariate_outlier_detection_result"]], "variableimportance (daal4py.decision_forest_classification_training_result attribute)": [[0, "daal4py.decision_forest_classification_training_result.variableImportance"]], "variableimportance (daal4py.decision_forest_regression_training_result attribute)": [[0, "daal4py.decision_forest_regression_training_result.variableImportance"]], "variableimportance (daal4py.stump_classification_training_result attribute)": [[0, "daal4py.stump_classification_training_result.variableImportance"]], "variableimportance (daal4py.stump_regression_training_result attribute)": [[0, "daal4py.stump_regression_training_result.variableImportance"]], "variableimportancebycover (daal4py.gbt_classification_training_result attribute)": [[0, "daal4py.gbt_classification_training_result.variableImportanceByCover"]], "variableimportancebycover (daal4py.gbt_regression_training_result attribute)": [[0, "daal4py.gbt_regression_training_result.variableImportanceByCover"]], "variableimportancebygain (daal4py.gbt_classification_training_result attribute)": [[0, "daal4py.gbt_classification_training_result.variableImportanceByGain"]], "variableimportancebygain (daal4py.gbt_regression_training_result attribute)": [[0, "daal4py.gbt_regression_training_result.variableImportanceByGain"]], "variableimportancebytotalcover (daal4py.gbt_classification_training_result attribute)": [[0, "daal4py.gbt_classification_training_result.variableImportanceByTotalCover"]], "variableimportancebytotalcover (daal4py.gbt_regression_training_result attribute)": [[0, "daal4py.gbt_regression_training_result.variableImportanceByTotalCover"]], "variableimportancebytotalgain (daal4py.gbt_classification_training_result attribute)": [[0, "daal4py.gbt_classification_training_result.variableImportanceByTotalGain"]], "variableimportancebytotalgain (daal4py.gbt_regression_training_result attribute)": [[0, "daal4py.gbt_regression_training_result.variableImportanceByTotalGain"]], "variableimportancebyweight (daal4py.gbt_classification_training_result attribute)": [[0, "daal4py.gbt_classification_training_result.variableImportanceByWeight"]], "variableimportancebyweight (daal4py.gbt_regression_training_result attribute)": [[0, "daal4py.gbt_regression_training_result.variableImportanceByWeight"]], "variance (daal4py.low_order_moments_result attribute)": [[0, "daal4py.low_order_moments_result.variance"]], "variances (daal4py.normalization_zscore_result attribute)": [[0, "daal4py.normalization_zscore_result.variances"]], "variances (daal4py.pca_result attribute)": [[0, "daal4py.pca_result.variances"]], "variation (daal4py.low_order_moments_result attribute)": [[0, "daal4py.low_order_moments_result.variation"]], "weaklearnerserrors (daal4py.adaboost_training_result attribute)": [[0, "daal4py.adaboost_training_result.weakLearnersErrors"]], "weights (daal4py.bacon_outlier_detection_result attribute)": [[0, "daal4py.bacon_outlier_detection_result.weights"]], "weights (daal4py.em_gmm_init_result attribute)": [[0, "daal4py.em_gmm_init_result.weights"]], "weights (daal4py.em_gmm_result attribute)": [[0, "daal4py.em_gmm_result.weights"]], "weights (daal4py.multivariate_outlier_detection_result attribute)": [[0, "daal4py.multivariate_outlier_detection_result.weights"]], "weights (daal4py.univariate_outlier_detection_result attribute)": [[0, "daal4py.univariate_outlier_detection_result.weights"]]}}) - diff --git a/daal4py/sklearn.html b/daal4py/sklearn.html old mode 100755 new mode 100644 index 0a39506..6d8d192 --- a/daal4py/sklearn.html +++ b/daal4py/sklearn.html @@ -1,367 +1,15 @@ - + - - - -Python interface to efficient Intel(R) oneAPI Data Analytics Library provided by daal4py allows one -to create scikit-learn compatible estimators, transformers, clusterers, etc. powered by oneDAL which -are nearly as efficient as native programs.
-Scikit-learn patching functionality in daal4py was deprecated and moved to a separate -package, Intel(R) Extension for Scikit-learn*. -All future patches will be available only in Intel(R) Extension for Scikit-learn*. -Please use the scikit-learn-intelex package instead of daal4py for the scikit-learn acceleration.
-daal4py can dynamically patch scikit-learn estimators to use Intel(R) oneAPI Data Analytics Library -as the underlying solver, while getting the same solution faster.
-It is possible to enable those patches without editing the code of a scikit-learn application by -using the following commandline flag:
-python -m daal4py my_application.py
-If you are using Scikit-Learn from Intel® Distribution for Python, then
-you can enable daal4py patches through an environment variable. To do this, set USE_DAAL4PY_SKLEARN to one of the values
-True, '1', 'y', 'yes', 'Y', 'YES', 'Yes', 'true', 'True' or 'TRUE' as shown below.
On Linux and Mac OS:
-export USE_DAAL4PY_SKLEARN=1
-On Windows:
-set USE_DAAL4PY_SKLEARN=1
-To disable daal4py patches, set the USE_DAAL4PY_SKLEARN environment variable to 0.
Patches can also be enabled programmatically:
-import daal4py.sklearn
-daal4py.sklearn.patch_sklearn()
-It is possible to undo the patch with:
-daal4py.sklearn.unpatch_sklearn()
-Applying the monkey patch will impact the following existing scikit-learn -algorithms:
-Task |
-Functionality |
-Parameters support |
-Data support |
-
|---|---|---|---|
Classification |
-SVC |
-All parameters except |
-No limitations. |
-
Classification |
-RandomForestClassifier |
-All parameters except |
-Multi-output, sparse data and out-of-bag score are not supported. |
-
Classification |
-KNeighborsClassifier |
-All parameters except |
-Multi-output and sparse data is not supported. |
-
Classification |
-LogisticRegression |
-All parameters except |
-Only dense data is supported. |
-
Regression |
-RandomForestRegressor |
-All parameters except |
-Multi-output, sparse data and out-of-bag score are not supported. |
-
Regression |
-KNeighborsRegressor |
-All parameters except |
-Multi-output and sparse data is not supported. |
-
Regression |
-LinearRegression |
-All parameters except |
-Only dense data is supported, #observations should be >= #features. |
-
Regression |
-Ridge |
-All parameters except |
-Only dense data is supported, #observations should be >= #features. |
-
Regression |
-ElasticNet |
-All parameters except |
-Multi-output and sparse data is not supported, #observations should be >= #features. |
-
Regression |
-Lasso |
-All parameters except |
-Multi-output and sparse data is not supported, #observations should be >= #features. |
-
Clustering |
-KMeans |
-All parameters except |
-No limitations. |
-
Clustering |
-DBSCAN |
-All parameters except |
-Only dense data is supported. |
-
Dimensionality reduction |
-PCA |
-All parameters except |
-Sparse data is not supported. |
-
Unsupervised |
-NearestNeighbors |
-All parameters except |
-Sparse data is not supported. |
-
Other |
-train_test_split |
-All parameters are supported. |
-Only dense data is supported. |
-
Other |
-assert_all_finite |
-All parameters are supported. |
-Only dense data is supported. |
-
Other |
-pairwise_distance |
-With metric=``cosine`` and |
-Only dense data is supported. |
-
Other |
-roc_auc_score |
-Parameters |
-No limitations. |
-
Monkey-patched scikit-learn classes and functions passes scikit-learn’s own test -suite, with few exceptions, specified in deselected_tests.yaml.
-In particular the tests execute check_estimator -on all added and monkey-patched classes, which are discovered by means of -introspection. This assures scikit-learn API compatibility of all -daal4py.sklearn classes.
-Note
-daal4py supports optimizations for the last four versions of scikit-learn. -The latest release of daal4py-2021.1 supports scikit-learn 0.21.X, 0.22.X, 0.23.X and 0.24.X.
-To find out which implementation of the algorithm is currently used, -set the environment variable.
-On Linux and Mac OS:
-export IDP_SKLEARN_VERBOSE=INFO
-On Windows:
-set IDP_SKLEARN_VERBOSE=INFO
-During the calls that use Intel-optimized scikit-learn, you will receive additional print statements -that indicate which implementation is being called. -These print statements are only available for scikit-learn algorithms with daal4py patches.
-For example, for DBSCAN you get one of these print statements depending on which implementation is used:
-INFO: sklearn.cluster.DBSCAN.fit: running accelerated version on CPU
-INFO: sklearn.cluster.DBSCAN.fit: fallback to original Scikit-learn
-The daal4py.sklearn package contains scikit-learn compatible API which
-implement a subset of scikit-learn algorithms using Intel(R) oneAPI Data Analytics Library.
Currently, these include:
-daal4py.sklearn.neighbors.KNeighborsClassifier
daal4py.sklearn.neighbors.KNeighborsRegressor
daal4py.sklearn.neighbors.NearestNeighbors
daal4py.sklearn.tree.DecisionTreeClassifier
daal4py.sklearn.ensemble.RandomForestClassifier
daal4py.sklearn.ensemble.RandomForestRegressor
daal4py.sklearn.ensemble.AdaBoostClassifier
daal4py.sklearn.cluster.KMeans
daal4py.sklearn.cluster.DBSCAN
daal4py.sklearn.decomposition.PCA
daal4py.sklearn.linear_model.Ridge
daal4py.sklearn.svm.SVC
daal4py.sklearn.linear_model.logistic_regression_path
daal4py.sklearn.linear_model.LogisticRegression
daal4py.sklearn.linear_model.ElasticNet
daal4py.sklearn.linear_model.Lasso
daal4py.sklearn.model_selection._daal_train_test_split
daal4py.sklearn.metrics._daal_roc_auc_score
These classes are always available, whether the scikit-learn itself has been -patched, or not. For example:
-import daal4py.sklearn
-daal4py.sklearn.unpatch_sklearn()
-import sklearn.datasets, sklearn.svm
-
-digits = sklearn.datasets.load_digits()
-X, y = digits.data, digits.target
-
-clf_d = daal4py.sklearn.svm.SVC(kernel='rbf', gamma='scale', C = 0.5).fit(X, y)
-clf_v = sklearn.svm.SVC(kernel='rbf', gamma='scale', C =0.5).fit(X, y)
-
-clf_d.score(X, y) # output: 0.9905397885364496
-clf_v.score(X, y) # output: 0.9905397885364496
-The scikit-learn integration documentation has moved. You should be redirected automatically. If not, please visit:
+Patching Utilities for scikit-learn
+Note: Use sklearnex for scikit-learn acceleration. daal4py sklearn module is deprecated.
- \ No newline at end of file + diff --git a/daal4py/streaming.html b/daal4py/streaming.html old mode 100755 new mode 100644 index 1a253f7..d109918 --- a/daal4py/streaming.html +++ b/daal4py/streaming.html @@ -1,217 +1,14 @@ - + - - - -Note
-Scikit-learn patching functionality in daal4py was deprecated and moved to a separate package, Intel(R) Extension for Scikit-learn*. -All future patches will be available only in Intel(R) Extension for Scikit-learn*. Use the scikit-learn-intelex package instead of daal4py for the scikit-learn acceleration.
-For large quantities of data it might be impossible to provide all input data at -once. This might be because the data resides in multiple files and merging it is -to costly (or not feasible in other ways). In other cases the data is simply too -large to be loaded completely into memory. Or, the data might come in as an -actual stream. daal4py’s streaming mode allows you to process such data.
-Besides supporting certain use cases, streaming also allows interleaving I/O -operations with computation.
-daal4py’s streaming mode is as easy as follows:
-When constructing the algorithm configure it with streaming=True:
algo = daal4py.svd(streaming=True)
-Repeat calling compute(input-data) with chunks of your input (arrays, DataFrames or
-files):
for f in input_files:
- algo.compute(f)
-When done with inputting, call finalize() to obtain the result:
result = algo.finalize()
-The streaming algorithms also accept arrays and DataFrames as input, e.g. the -data can come from a stream rather than from multiple files. Here is an example -which simulates a data stream using a generator which reads a file in chunks: -SVD reading stream of data
-The following algorithms support streaming:
-SVD (svd)
-Linear Regression Training (linear_regression_training)
- -Ridge Regression Training (ridge_regression_training)
- -Multinomial Naive Bayes Training (multinomial_naive_bayes_training)
-Moments of Low Order
- -Covariance
-QR
-The streaming mode documentation has moved. You should be redirected automatically. If not, please visit:
+ - \ No newline at end of file +