decision tree

# Build a decision tree that splits on entropy and is capped at depth 3
clf = DecisionTreeClassifier(max_depth=3, criterion="entropy")

# Fit the tree on the training split; fit() trains in place and hands back
# the same estimator, so clf does not need to be rebound
clf.fit(X_train, y_train)

# Label the held-out test samples
y_pred = clf.predict(X_test)

# Report the share of test labels that were predicted correctly
print("Accuracy:", metrics.accuracy_score(y_test, y_pred))

View more examples · Add your own solution

Xawery Wiśniowiecki 90 points

                                    from sklearn.datasets import load_iris
from sklearn import tree

# Fit a decision tree with default settings on the full iris dataset.
# return_X_y=True yields the feature matrix and the target labels directly.
X, y = load_iris(return_X_y=True)
clf = tree.DecisionTreeClassifier()
clf = clf.fit(X, y)

Thank you! 2

5 (2 Votes)

Radu C. Serban 95 points

                                    # Decision tree learning algorithm for classification

from pyspark.ml.classification import (
    DecisionTreeClassificationModel,
    DecisionTreeClassifier,
)
from pyspark.ml.feature import StringIndexer
from pyspark.ml.linalg import Vectors

# NOTE(review): `spark` and `temp_path` are not defined in this snippet.
# Presumably `spark` is an active SparkSession and `temp_path` is a writable
# directory path string; both must be supplied by the surrounding session.

# Two-row training set: one dense and one empty sparse feature vector.
df = spark.createDataFrame([
    (1.0, Vectors.dense(1.0)),
    (0.0, Vectors.sparse(1, [], []))], ["label", "features"])

# Index the "label" column into "indexed", which the classifier trains on.
stringIndexer = StringIndexer(inputCol="label", outputCol="indexed")
si_model = stringIndexer.fit(df)
td = si_model.transform(df)

dt = DecisionTreeClassifier(maxDepth=2, labelCol="indexed")
model = dt.fit(td)

# Inspect the fitted model; the comment under each expression is the
# expected value.
model.numNodes
# 3
model.depth
# 1
model.featureImportances
# SparseVector(1, {0: 1.0})
model.numFeatures
# 1
model.numClasses
# 2
print(model.toDebugString)
# DecisionTreeClassificationModel (uid=...) of depth 1 with 3 nodes...

# Score a single dense row and look at each output column.
test0 = spark.createDataFrame([(Vectors.dense(-1.0),)], ["features"])
result = model.transform(test0).head()
result.prediction
# 0.0
result.probability
# DenseVector([1.0, 0.0])
result.rawPrediction
# DenseVector([1.0, 0.0])

# Score a single sparse row; each row must be a one-element tuple.
test1 = spark.createDataFrame([(Vectors.sparse(1, [0], [1.0]),)], ["features"])
model.transform(test1).head().prediction
# 1.0

# Round-trip the unfitted estimator through save/load.
dtc_path = temp_path + "/dtc"
dt.save(dtc_path)
dt2 = DecisionTreeClassifier.load(dtc_path)
dt2.getMaxDepth()
# 2

# Round-trip the fitted model and compare it with the in-memory one.
model_path = temp_path + "/dtc_model"
model.save(model_path)
model2 = DecisionTreeClassificationModel.load(model_path)
model.featureImportances == model2.featureImportances
# True

Thank you! 0

3.8

Blanka 100 points

                                    from sklearn.datasets import load_iris
from sklearn.model_selection import cross_val_score
from sklearn.tree import DecisionTreeClassifier
# Load the iris dataset, then run 10-fold cross-validation on a decision
# tree created with a fixed random_state. The returned scores are not bound
# to a name here.
iris = load_iris()
clf = DecisionTreeClassifier(random_state=0)
cross_val_score(clf, X=iris.data, y=iris.target, cv=10)

Thank you! 5

3.8 (5 Votes)

Sam Friedman 90 points

                                    from sklearn.datasets import load_iris
from sklearn import tree

# Fit a decision tree with default settings on the full iris dataset.
# return_X_y=True yields the feature matrix and the target labels directly.
X, y = load_iris(return_X_y=True)
clf = tree.DecisionTreeClassifier()
clf = clf.fit(X, y)

Thank you! 6

4 (6 Votes)

Jenovachild 75 points

                                    # Decision tree learning algorithm for regression

from pyspark.ml.linalg import Vectors
from pyspark.ml.regression import (
    DecisionTreeRegressionModel,
    DecisionTreeRegressor,
)

# NOTE(review): `spark` and `temp_path` are not defined in this snippet.
# Presumably `spark` is an active SparkSession and `temp_path` is a writable
# directory path string; both must be supplied by the surrounding session.

# Two-row training set: one dense and one empty sparse feature vector.
df = spark.createDataFrame([
    (1.0, Vectors.dense(1.0)),
    (0.0, Vectors.sparse(1, [], []))], ["label", "features"])

# varianceCol names the extra output column read at the end of the example.
dt = DecisionTreeRegressor(maxDepth=2, varianceCol="variance")
model = dt.fit(df)

# Inspect the fitted model; the comment under each expression is the
# expected value.
model.depth
# 1
model.numNodes
# 3
model.featureImportances
# SparseVector(1, {0: 1.0})
model.numFeatures
# 1

# Score one dense and one sparse single-row frame.
test0 = spark.createDataFrame([(Vectors.dense(-1.0),)], ["features"])
model.transform(test0).head().prediction
# 0.0
test1 = spark.createDataFrame([(Vectors.sparse(1, [0], [1.0]),)], ["features"])
model.transform(test1).head().prediction
# 1.0

# Round-trip the unfitted estimator through save/load.
dtr_path = temp_path + "/dtr"
dt.save(dtr_path)
dt2 = DecisionTreeRegressor.load(dtr_path)
dt2.getMaxDepth()
# 2

# Round-trip the fitted model and compare it with the in-memory one.
model_path = temp_path + "/dtr_model"
model.save(model_path)
model2 = DecisionTreeRegressionModel.load(model_path)
model.numNodes == model2.numNodes
# True
model.depth == model2.depth
# True
model.transform(test1).head().variance
# 0.0

Thank you! 7

4 (7 Votes)

Are there any code examples left?

Find Add Code snippet

New code examples in category Python

Python 2023-04-11 03:04:20
Python 2022-03-27 22:40:04 pycharm no module named
Python 2022-03-27 22:25:05 assign multiple variables in one line
Python 2022-03-27 22:20:02 levenshtein distance
Python 2022-03-27 21:35:09 get text from url python last slash
Python 2022-03-27 21:30:30 df concatenate df
Python 2022-03-27 21:25:09 python odd or even
Python 2022-03-27 21:15:32 python include function from another file
Python 2022-03-27 21:10:01 color module python
Python 2022-03-27 21:00:27 python tkinter cursor types

Create a Free Account

Unlock the power of data and AI by diving into Python, ChatGPT, SQL, Power BI, and beyond.

Develop soft skills on BrainApps

Complete the IQ Test

Related searches

decision tree

Welcome Back!

Create a Free Account