package sklearn

You can search for identifiers within the package.

in-package search v0.2.0

package sklearn

sklearn
- Library sklearn
  - Sklearn
    
    Arr
    
    List
    
    Dtype
    
    Ops
    
    Float
    
    Int
    
    String
    
    Object
    
    Base
    
    BaseEstimator
    
    BiclusterMixin
    
    ClassifierMixin
    
    ClusterMixin
    
    DensityMixin
    
    MetaEstimatorMixin
    
    MultiOutputMixin
    
    OutlierMixin
    
    RegressorMixin
    
    TransformerMixin
    
    Calibration
    
    BaseEstimator
    
    CalibratedClassifierCV
    
    ClassifierMixin
    
    IsotonicRegression
    
    LabelBinarizer
    
    LabelEncoder
    
    LinearSVC
    
    MetaEstimatorMixin
    
    RegressorMixin
    
    Cluster
    
    AffinityPropagation
    
    AgglomerativeClustering
    
    Birch
    
    DBSCAN
    
    FeatureAgglomeration
    
    KMeans
    
    MeanShift
    
    MiniBatchKMeans
    
    OPTICS
    
    SpectralBiclustering
    
    SpectralClustering
    
    SpectralCoclustering
    
    Compose
    
    ColumnTransformer
    
    TransformedTargetRegressor
    
    Make_column_selector
    
    Conftest
    
    Covariance
    
    EllipticEnvelope
    
    EmpiricalCovariance
    
    GraphicalLasso
    
    GraphicalLassoCV
    
    LedoitWolf
    
    MinCovDet
    
    OAS
    
    ShrunkCovariance
    
    Cross_decomposition
    
    CCA
    
    PLSCanonical
    
    PLSRegression
    
    PLSSVD
    
    Csr_matrix
    
    Datasets
    
    Decomposition
    
    DictionaryLearning
    
    FactorAnalysis
    
    FastICA
    
    IncrementalPCA
    
    KernelPCA
    
    LatentDirichletAllocation
    
    PCA
    
    SparseCoder
    
    SparsePCA
    
    TruncatedSVD
    
    Dict
    
    BUILD
    
    Discriminant_analysis
    
    BaseEstimator
    
    ClassifierMixin
    
    LinearClassifierMixin
    
    LinearDiscriminantAnalysis
    
    QuadraticDiscriminantAnalysis
    
    StandardScaler
    
    TransformerMixin
    
    Dummy
    
    BaseEstimator
    
    ClassifierMixin
    
    DummyClassifier
    
    DummyRegressor
    
    MultiOutputMixin
    
    RegressorMixin
    
    Deprecated
    
    Ensemble
    
    AdaBoostClassifier
    
    AdaBoostRegressor
    
    BaggingClassifier
    
    BaggingRegressor
    
    ExtraTreesClassifier
    
    ExtraTreesRegressor
    
    GradientBoostingClassifier
    
    GradientBoostingRegressor
    
    IsolationForest
    
    RandomForestClassifier
    
    RandomForestRegressor
    
    RandomTreesEmbedding
    
    StackingClassifier
    
    StackingRegressor
    
    VotingClassifier
    
    VotingRegressor
    
    Partial_dependence
    
    Parallel
    
    Deprecated
    
    Exceptions
    
    Experimental
    
    Externals
    
    Feature_extraction
    
    DictVectorizer
    
    FeatureHasher
    
    Image
    
    BaseEstimator
    
    PatchExtractor
    
    Deprecated
    
    Text
    
    BaseEstimator
    
    CountVectorizer
    
    FeatureHasher
    
    HashingVectorizer
    
    TfidfTransformer
    
    TfidfVectorizer
    
    TransformerMixin
    
    Deprecated
    
    Feature_selection
    
    GenericUnivariateSelect
    
    RFE
    
    RFECV
    
    SelectFdr
    
    SelectFpr
    
    SelectFromModel
    
    SelectFwe
    
    SelectKBest
    
    SelectPercentile
    
    VarianceThreshold
    
    Gaussian_process
    
    GaussianProcessClassifier
    
    GaussianProcessRegressor
    
    Kernels
    
    ABCMeta
    
    CompoundKernel
    
    ConstantKernel
    
    DotProduct
    
    ExpSineSquared
    
    Exponentiation
    
    GenericKernelMixin
    
    Hyperparameter
    
    Matern
    
    NormalizedKernelMixin
    
    PairwiseKernel
    
    Product
    
    RBF
    
    RationalQuadratic
    
    StationaryKernelMixin
    
    Sum
    
    WhiteKernel
    
    Impute
    
    KNNImputer
    
    MissingIndicator
    
    SimpleImputer
    
    Inspection
    
    PartialDependenceDisplay
    
    Isotonic
    
    BaseEstimator
    
    IsotonicRegression
    
    RegressorMixin
    
    TransformerMixin
    
    Kernel_approximation
    
    AdditiveChi2Sampler
    
    BaseEstimator
    
    Nystroem
    
    RBFSampler
    
    SkewedChi2Sampler
    
    TransformerMixin
    
    Kernel_ridge
    
    BaseEstimator
    
    KernelRidge
    
    MultiOutputMixin
    
    RegressorMixin
    
    Linear_model
    
    ARDRegression
    
    BayesianRidge
    
    ElasticNet
    
    ElasticNetCV
    
    HuberRegressor
    
    Lars
    
    LarsCV
    
    Lasso
    
    LassoCV
    
    LassoLars
    
    LassoLarsCV
    
    LassoLarsIC
    
    LinearRegression
    
    LogisticRegression
    
    LogisticRegressionCV
    
    MultiTaskElasticNet
    
    MultiTaskElasticNetCV
    
    MultiTaskLasso
    
    MultiTaskLassoCV
    
    OrthogonalMatchingPursuit
    
    OrthogonalMatchingPursuitCV
    
    RANSACRegressor
    
    Ridge
    
    RidgeCV
    
    RidgeClassifier
    
    RidgeClassifierCV
    
    TheilSenRegressor
    
    Manifold
    
    Isomap
    
    LocallyLinearEmbedding
    
    MDS
    
    SpectralEmbedding
    
    TSNE
    
    Metrics
    
    ConfusionMatrixDisplay
    
    PrecisionRecallDisplay
    
    RocCurveDisplay
    
    Cluster
    
    Pairwise
    
    Parallel
    
    Mixture
    
    BayesianGaussianMixture
    
    GaussianMixture
    
    Model_selection
    
    GridSearchCV
    
    GroupShuffleSplit
    
    LeaveOneGroupOut
    
    LeaveOneOut
    
    LeavePGroupsOut
    
    LeavePOut
    
    ParameterGrid
    
    ParameterSampler
    
    PredefinedSplit
    
    RandomizedSearchCV
    
    RepeatedKFold
    
    RepeatedStratifiedKFold
    
    ShuffleSplit
    
    StratifiedShuffleSplit
    
    Multiclass
    
    BaseEstimator
    
    ClassifierMixin
    
    LabelBinarizer
    
    MetaEstimatorMixin
    
    MultiOutputMixin
    
    OneVsOneClassifier
    
    OneVsRestClassifier
    
    OutputCodeClassifier
    
    Parallel
    
    Multioutput
    
    ABCMeta
    
    BaseEstimator
    
    ClassifierChain
    
    ClassifierMixin
    
    MetaEstimatorMixin
    
    MultiOutputClassifier
    
    MultiOutputRegressor
    
    Parallel
    
    RegressorChain
    
    RegressorMixin
    
    Deprecated
    
    Naive_bayes
    
    ABCMeta
    
    BaseEstimator
    
    BernoulliNB
    
    CategoricalNB
    
    ClassifierMixin
    
    ComplementNB
    
    GaussianNB
    
    LabelBinarizer
    
    MultinomialNB
    
    Deprecated
    
    Ndarray
    
    Dtype
    
    Ops
    
    List
    
    Float
    
    Int
    
    String
    
    Object
    
    Ndarray_private
    
    Neighbors
    
    KNeighborsClassifier
    
    KNeighborsRegressor
    
    KNeighborsTransformer
    
    KernelDensity
    
    LocalOutlierFactor
    
    NearestCentroid
    
    NearestNeighbors
    
    NeighborhoodComponentsAnalysis
    
    RadiusNeighborsClassifier
    
    RadiusNeighborsRegressor
    
    RadiusNeighborsTransformer
    
    Neural_network
    
    BernoulliRBM
    
    Pipeline
    
    Bunch
    
    FeatureUnion
    
    Parallel
    
    Pipeline
    
    TransformerMixin
    
    Preprocessing
    
    Binarizer
    
    FunctionTransformer
    
    KBinsDiscretizer
    
    KernelCenterer
    
    LabelBinarizer
    
    LabelEncoder
    
    MaxAbsScaler
    
    MinMaxScaler
    
    MultiLabelBinarizer
    
    Normalizer
    
    OneHotEncoder
    
    OrdinalEncoder
    
    PolynomialFeatures
    
    PowerTransformer
    
    QuantileTransformer
    
    RobustScaler
    
    StandardScaler
    
    PyList
    
    ELEMENT
    
    S
    
    Make
    
    Random_projection
    
    ABCMeta
    
    BaseEstimator
    
    GaussianRandomProjection
    
    SparseRandomProjection
    
    TransformerMixin
    
    Deprecated
    
    Semi_supervised
    
    LabelPropagation
    
    LabelSpreading
    
    Setup
    
    Svm
    
    LinearSVC
    
    LinearSVR
    
    NuSVC
    
    NuSVR
    
    OneClassSVM
    
    SVC
    
    SVR
    
    Tests
    
    Tree
    
    DecisionTreeClassifier
    
    DecisionTreeRegressor
    
    ExtraTreeClassifier
    
    ExtraTreeRegressor
    
    Utils
    
    Bunch
    
    Path
    
    Arrayfuncs
    
    Class_weight
    
    Deprecated
    
    Deprecation
    
    Deprecated
    
    Extmath
    
    Deprecated
    
    Fixes
    
    LooseVersion
    
    MaskedArray
    
    Graph
    
    Graph_shortest_path
    
    Float64
    
    Metaestimators
    
    ABCMeta
    
    BaseEstimator
    
    Multiclass
    
    Dok_matrix
    
    Lil_matrix
    
    Spmatrix
    
    Murmurhash
    
    Optimize
    
    Deprecated
    
    Parallel_backend
    
    Random
    
    Deprecated
    
    Sparsefuncs
    
    Sparsefuncs_fast
    
    Stats
    
    Validation
    
    LooseVersion
    
    Parameter
    
    Version
    
    Wrap_utils
    
    Option
    
    Slice
- Sources
  - sklearn
    
    PyList.ml
    
    arr.ml
    
    base.ml
    
    calibration.ml
    
    cluster.ml
    
    compose.ml
    
    conftest.ml
    
    covariance.ml
    
    cross_decomposition.ml
    
    csr_matrix.ml
    
    datasets.ml
    
    decomposition.ml
    
    dict.ml
    
    discriminant_analysis.ml
    
    dummy.ml
    
    ensemble.ml
    
    exceptions.ml
    
    experimental.ml
    
    externals.ml
    
    feature_extraction.ml
    
    feature_selection.ml
    
    gaussian_process.ml
    
    impute.ml
    
    inspection.ml
    
    isotonic.ml
    
    kernel_approximation.ml
    
    kernel_ridge.ml
    
    linear_model.ml
    
    manifold.ml
    
    metrics.ml
    
    mixture.ml
    
    model_selection.ml
    
    multiclass.ml
    
    multioutput.ml
    
    naive_bayes.ml
    
    ndarray.ml
    
    neighbors.ml
    
    neural_network.ml
    
    pipeline.ml
    
    preprocessing.ml
    
    random_projection.ml
    
    semi_supervised.ml
    
    setup.ml
    
    sklearn.ml
    
    svm.ml
    
    tests.ml
    
    tree.ml
    
    utils.ml
    
    version.ml
    
    wrap_utils.ml

Legend:
Page
Library
Module
Module type
Parameter
Class
Class type
Source

Module `Naive_bayes.MultinomialNB`Source

Sourcetype t

Sourceval of_pyobject : Py.Object.t -> t

Sourceval to_pyobject : t -> Py.Object.t

Source

val create : 
  ?alpha:float ->
  ?fit_prior:bool ->
  ?class_prior:[ `Arr of Arr.t | `PyObject of Py.Object.t ] ->
  unit ->
  t

Naive Bayes classifier for multinomial models

The multinomial Naive Bayes classifier is suitable for classification with discrete features (e.g., word counts for text classification). The multinomial distribution normally requires integer feature counts. However, in practice, fractional counts such as tf-idf may also work.

Read more in the :ref:`User Guide <multinomial_naive_bayes>`.

Parameters ---------- alpha : float, optional (default=1.0) Additive (Laplace/Lidstone) smoothing parameter (0 for no smoothing).

fit_prior : boolean, optional (default=True) Whether to learn class prior probabilities or not. If false, a uniform prior will be used.

class_prior : array-like, size (n_classes,), optional (default=None) Prior probabilities of the classes. If specified the priors are not adjusted according to the data.

Attributes ---------- class_count_ : array, shape (n_classes,) Number of samples encountered for each class during fitting. This value is weighted by the sample weight when provided.

class_log_prior_ : array, shape (n_classes, ) Smoothed empirical log probability for each class.

classes_ : array, shape (n_classes,) Class labels known to the classifier

coef_ : array, shape (n_classes, n_features) Mirrors ``feature_log_prob_`` for interpreting MultinomialNB as a linear model.

feature_count_ : array, shape (n_classes, n_features) Number of samples encountered for each (class, feature) during fitting. This value is weighted by the sample weight when provided.

feature_log_prob_ : array, shape (n_classes, n_features) Empirical log probability of features given a class, ``P(x_i|y)``.

intercept_ : array, shape (n_classes, ) Mirrors ``class_log_prior_`` for interpreting MultinomialNB as a linear model.

n_features_ : int Number of features of each sample.

Examples -------- >>> import numpy as np >>> rng = np.random.RandomState(1) >>> X = rng.randint(5, size=(6, 100)) >>> y = np.array([1, 2, 3, 4, 5, 6]) >>> from sklearn.naive_bayes import MultinomialNB >>> clf = MultinomialNB() >>> clf.fit(X, y) MultinomialNB() >>> print(clf.predict(X[2:3])) [3]

Notes ----- For the rationale behind the names `coef_` and `intercept_`, i.e. naive Bayes as a linear classifier, see J. Rennie et al. (2003), Tackling the poor assumptions of naive Bayes text classifiers, ICML.

References ---------- C.D. Manning, P. Raghavan and H. Schuetze (2008). Introduction to Information Retrieval. Cambridge University Press, pp. 234-265. https://nlp.stanford.edu/IR-book/html/htmledition/naive-bayes-text-classification-1.html

Sourceval fit : ?sample_weight:Arr.t -> x:Arr.t -> y:Arr.t -> t -> t

Fit Naive Bayes classifier according to X, y

Parameters ---------- X : {array-like, sparse matrix} of shape (n_samples, n_features) Training vectors, where n_samples is the number of samples and n_features is the number of features.

y : array-like of shape (n_samples,) Target values.

sample_weight : array-like of shape (n_samples,), default=None Weights applied to individual samples (1. for unweighted).

Returns ------- self : object

Sourceval get_params : ?deep:bool -> t -> Dict.t

Get parameters for this estimator.

Parameters ---------- deep : bool, default=True If True, will return the parameters for this estimator and contained subobjects that are estimators.

Returns ------- params : mapping of string to any Parameter names mapped to their values.

Source

val partial_fit : 
  ?classes:Arr.t ->
  ?sample_weight:Arr.t ->
  x:Arr.t ->
  y:Arr.t ->
  t ->
  t

Incremental fit on a batch of samples.

This method is expected to be called several times consecutively on different chunks of a dataset so as to implement out-of-core or online learning.

This is especially useful when the whole dataset is too big to fit in memory at once.

This method has some performance overhead, hence it is better to call partial_fit on chunks of data that are as large as possible (as long as they fit in the memory budget) to hide the overhead.

Parameters ---------- X : {array-like, sparse matrix} of shape (n_samples, n_features) Training vectors, where n_samples is the number of samples and n_features is the number of features.

y : array-like of shape (n_samples,) Target values.

classes : array-like of shape (n_classes) (default=None) List of all the classes that can possibly appear in the y vector.

Must be provided at the first call to partial_fit, can be omitted in subsequent calls.

sample_weight : array-like of shape (n_samples,), default=None Weights applied to individual samples (1. for unweighted).

Returns ------- self : object

Sourceval predict : x:Arr.t -> t -> Arr.t

Perform classification on an array of test vectors X.

Parameters ---------- X : array-like of shape (n_samples, n_features)

Returns ------- C : ndarray of shape (n_samples,) Predicted target values for X

Sourceval predict_log_proba : x:Arr.t -> t -> Arr.t

Return log-probability estimates for the test vector X.

Parameters ---------- X : array-like of shape (n_samples, n_features)

Returns ------- C : array-like of shape (n_samples, n_classes) Returns the log-probability of the samples for each class in the model. The columns correspond to the classes in sorted order, as they appear in the attribute :term:`classes_`.

Sourceval predict_proba : x:Arr.t -> t -> Arr.t

Return probability estimates for the test vector X.

Parameters ---------- X : array-like of shape (n_samples, n_features)

Returns ------- C : array-like of shape (n_samples, n_classes) Returns the probability of the samples for each class in the model. The columns correspond to the classes in sorted order, as they appear in the attribute :term:`classes_`.

Sourceval score : ?sample_weight:Arr.t -> x:Arr.t -> y:Arr.t -> t -> float

Return the mean accuracy on the given test data and labels.

In multi-label classification, this is the subset accuracy which is a harsh metric since you require for each sample that each label set be correctly predicted.

Parameters ---------- X : array-like of shape (n_samples, n_features) Test samples.

y : array-like of shape (n_samples,) or (n_samples, n_outputs) True labels for X.

sample_weight : array-like of shape (n_samples,), default=None Sample weights.

Returns ------- score : float Mean accuracy of self.predict(X) wrt. y.

Sourceval set_params : ?params:(string * Py.Object.t) list -> t -> t

Set the parameters of this estimator.

The method works on simple estimators as well as on nested objects (such as pipelines). The latter have parameters of the form ``<component>__<parameter>`` so that it's possible to update each component of a nested object.

Parameters ---------- **params : dict Estimator parameters.

Returns ------- self : object Estimator instance.

Sourceval class_count_ : t -> Arr.t

Attribute class_count_: get value or raise Not_found if None.

Sourceval class_count_opt : t -> Arr.t option

Attribute class_count_: get value as an option.

Sourceval class_log_prior_ : t -> Arr.t

Attribute class_log_prior_: get value or raise Not_found if None.

Sourceval class_log_prior_opt : t -> Arr.t option

Attribute class_log_prior_: get value as an option.

Sourceval classes_ : t -> Arr.t

Attribute classes_: get value or raise Not_found if None.

Sourceval classes_opt : t -> Arr.t option

Attribute classes_: get value as an option.

Sourceval coef_ : t -> Arr.t

Attribute coef_: get value or raise Not_found if None.

Sourceval coef_opt : t -> Arr.t option

Attribute coef_: get value as an option.

Sourceval feature_count_ : t -> Arr.t

Attribute feature_count_: get value or raise Not_found if None.

Sourceval feature_count_opt : t -> Arr.t option

Attribute feature_count_: get value as an option.

Sourceval feature_log_prob_ : t -> Arr.t

Attribute feature_log_prob_: get value or raise Not_found if None.

Sourceval feature_log_prob_opt : t -> Arr.t option

Attribute feature_log_prob_: get value as an option.

Sourceval intercept_ : t -> Arr.t

Attribute intercept_: get value or raise Not_found if None.

Sourceval intercept_opt : t -> Arr.t option

Attribute intercept_: get value as an option.

Sourceval n_features_ : t -> int

Attribute n_features_: get value or raise Not_found if None.

Sourceval n_features_opt : t -> int option

Attribute n_features_: get value as an option.

Sourceval to_string : t -> string

Return a human-readable string representation of the object.

Sourceval show : t -> string

Return a human-readable string representation of the object.

Sourceval pp : Format.formatter -> t -> unit

Pretty-print the object to a formatter.

package sklearn

Module Naive_bayes.MultinomialNBSource

Module `Naive_bayes.MultinomialNB`Source