I am using Python 3.7, Windows 10, Anaconda.
The data set tree_addhealth.csv and the code are from the Coursera course "Machine Learning for Data Analysis":
https://www.coursera.org/learn/machine-learning-data-analysis
from pandas import Series, DataFrame
import pandas as pd
import numpy as np
import os
import matplotlib.pylab as plt
#from sklearn.cross_validation import train_test_split
from sklearn.model_selection import KFold
from sklearn.model_selection import train_test_split
from sklearn.tree import DecisionTreeClassifier
from sklearn.metrics import classification_report
import sklearn.metrics
# Feature Importance
from sklearn import datasets
from sklearn.ensemble import ExtraTreesClassifier
# Change the working directory to the local course folder, presumably so the
# data file read next can be found via a relative path.
# A raw string is used because the Windows path contains backslashes
# (\s, \m, \T) that a normal string literal would parse as invalid escape
# sequences (DeprecationWarning on 3.6+, SyntaxWarning on 3.12+); a folder
# name starting with e.g. "t" or "n" would silently become a tab/newline.
os.chdir(r"F:\study\machine learning\TREES")
#Load the dataset
AH_data = pd.read_csv("tree_ad